@llmgateway/models 1.3.1 → 1.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/dist/models.d.ts CHANGED
@@ -3149,6 +3149,18 @@ export declare const models: [{
3149
3149
  readonly vision: false;
3150
3150
  readonly tools: false;
3151
3151
  readonly jsonOutput: true;
3152
+ }, {
3153
+ readonly providerId: "novita";
3154
+ readonly modelName: "meta-llama/llama-3.1-8b-instruct";
3155
+ readonly inputPrice: number;
3156
+ readonly outputPrice: number;
3157
+ readonly requestPrice: 0;
3158
+ readonly contextSize: 16384;
3159
+ readonly maxOutput: 16384;
3160
+ readonly streaming: true;
3161
+ readonly vision: false;
3162
+ readonly tools: false;
3163
+ readonly jsonOutput: true;
3152
3164
  }];
3153
3165
  }, {
3154
3166
  readonly id: "llama-3.1-70b-instruct";
@@ -3259,6 +3271,18 @@ export declare const models: [{
3259
3271
  readonly vision: false;
3260
3272
  readonly tools: true;
3261
3273
  readonly jsonOutput: true;
3274
+ }, {
3275
+ readonly providerId: "novita";
3276
+ readonly modelName: "meta-llama/llama-3.3-70b-instruct";
3277
+ readonly inputPrice: number;
3278
+ readonly outputPrice: number;
3279
+ readonly requestPrice: 0;
3280
+ readonly contextSize: 131072;
3281
+ readonly maxOutput: 120000;
3282
+ readonly streaming: true;
3283
+ readonly vision: false;
3284
+ readonly tools: true;
3285
+ readonly jsonOutput: false;
3262
3286
  }];
3263
3287
  }, {
3264
3288
  readonly id: "llama-3.1-405b-instruct";
@@ -3320,6 +3344,18 @@ export declare const models: [{
3320
3344
  readonly vision: true;
3321
3345
  readonly tools: false;
3322
3346
  readonly jsonOutput: false;
3347
+ }, {
3348
+ readonly providerId: "novita";
3349
+ readonly modelName: "meta-llama/llama-4-scout-17b-16e-instruct";
3350
+ readonly inputPrice: number;
3351
+ readonly outputPrice: number;
3352
+ readonly requestPrice: 0;
3353
+ readonly contextSize: 131072;
3354
+ readonly maxOutput: 131072;
3355
+ readonly streaming: true;
3356
+ readonly vision: true;
3357
+ readonly tools: false;
3358
+ readonly jsonOutput: true;
3323
3359
  }];
3324
3360
  }, {
3325
3361
  readonly id: "llama-4-maverick-17b-instruct";
@@ -3341,6 +3377,76 @@ export declare const models: [{
3341
3377
  readonly vision: true;
3342
3378
  readonly tools: false;
3343
3379
  readonly jsonOutput: false;
3380
+ }, {
3381
+ readonly providerId: "novita";
3382
+ readonly modelName: "meta-llama/llama-4-maverick-17b-128e-instruct-fp8";
3383
+ readonly inputPrice: number;
3384
+ readonly outputPrice: number;
3385
+ readonly requestPrice: 0;
3386
+ readonly contextSize: 1048576;
3387
+ readonly maxOutput: 8192;
3388
+ readonly streaming: true;
3389
+ readonly vision: true;
3390
+ readonly tools: false;
3391
+ readonly jsonOutput: true;
3392
+ }];
3393
+ }, {
3394
+ readonly id: "llama-3-8b-instruct";
3395
+ readonly name: "Llama 3 8B Instruct";
3396
+ readonly description: "Llama 3 8B instruction-following model.";
3397
+ readonly family: "meta";
3398
+ readonly releasedAt: Date;
3399
+ readonly providers: [{
3400
+ readonly providerId: "novita";
3401
+ readonly modelName: "meta-llama/llama-3-8b-instruct";
3402
+ readonly inputPrice: number;
3403
+ readonly outputPrice: number;
3404
+ readonly requestPrice: 0;
3405
+ readonly contextSize: 8192;
3406
+ readonly maxOutput: 8192;
3407
+ readonly streaming: true;
3408
+ readonly vision: false;
3409
+ readonly tools: false;
3410
+ readonly jsonOutput: true;
3411
+ }];
3412
+ }, {
3413
+ readonly id: "llama-3-70b-instruct";
3414
+ readonly name: "Llama 3 70B Instruct";
3415
+ readonly description: "Llama 3 70B instruction-following model.";
3416
+ readonly family: "meta";
3417
+ readonly releasedAt: Date;
3418
+ readonly providers: [{
3419
+ readonly providerId: "novita";
3420
+ readonly modelName: "meta-llama/llama-3-70b-instruct";
3421
+ readonly inputPrice: number;
3422
+ readonly outputPrice: number;
3423
+ readonly requestPrice: 0;
3424
+ readonly contextSize: 8192;
3425
+ readonly maxOutput: 8000;
3426
+ readonly streaming: true;
3427
+ readonly vision: false;
3428
+ readonly tools: false;
3429
+ readonly jsonOutput: true;
3430
+ }];
3431
+ }, {
3432
+ readonly id: "llama-3.2-3b-instruct";
3433
+ readonly name: "Llama 3.2 3B Instruct";
3434
+ readonly description: "Compact Llama 3.2 3B for efficient inference.";
3435
+ readonly family: "meta";
3436
+ readonly releasedAt: Date;
3437
+ readonly providers: [{
3438
+ readonly providerId: "novita";
3439
+ readonly stability: "unstable";
3440
+ readonly modelName: "meta-llama/llama-3.2-3b-instruct";
3441
+ readonly inputPrice: number;
3442
+ readonly outputPrice: number;
3443
+ readonly requestPrice: 0;
3444
+ readonly contextSize: 32768;
3445
+ readonly maxOutput: 32000;
3446
+ readonly streaming: true;
3447
+ readonly vision: false;
3448
+ readonly tools: false;
3449
+ readonly jsonOutput: true;
3344
3450
  }];
3345
3451
  }, {
3346
3452
  readonly id: "deepseek-v3";
@@ -3887,6 +3993,26 @@ export declare const models: [{
3887
3993
  readonly tools: true;
3888
3994
  readonly jsonOutput: true;
3889
3995
  }];
3996
+ }, {
3997
+ readonly id: "kimi-k2.5";
3998
+ readonly name: "Kimi K2.5";
3999
+ readonly description: "Moonshot's native multimodal model with visual coding and agentic capabilities.";
4000
+ readonly family: "moonshot";
4001
+ readonly releasedAt: Date;
4002
+ readonly providers: [{
4003
+ readonly providerId: "moonshot";
4004
+ readonly modelName: "kimi-k2.5";
4005
+ readonly inputPrice: number;
4006
+ readonly outputPrice: number;
4007
+ readonly cachedInputPrice: number;
4008
+ readonly requestPrice: 0;
4009
+ readonly contextSize: 262144;
4010
+ readonly maxOutput: 32768;
4011
+ readonly streaming: true;
4012
+ readonly vision: true;
4013
+ readonly tools: true;
4014
+ readonly jsonOutput: true;
4015
+ }];
3890
4016
  }, {
3891
4017
  readonly id: "qwen-max";
3892
4018
  readonly name: "Qwen Max";
@@ -3894,6 +4020,7 @@ export declare const models: [{
3894
4020
  readonly family: "alibaba";
3895
4021
  readonly releasedAt: Date;
3896
4022
  readonly providers: [{
4023
+ readonly test: "skip";
3897
4024
  readonly providerId: "alibaba";
3898
4025
  readonly modelName: "qwen-max";
3899
4026
  readonly inputPrice: number;
@@ -3913,6 +4040,7 @@ export declare const models: [{
3913
4040
  readonly family: "alibaba";
3914
4041
  readonly releasedAt: Date;
3915
4042
  readonly providers: [{
4043
+ readonly test: "skip";
3916
4044
  readonly providerId: "alibaba";
3917
4045
  readonly modelName: "qwen-max-latest";
3918
4046
  readonly inputPrice: number;
@@ -3936,6 +4064,20 @@ export declare const models: [{
3936
4064
  readonly modelName: "qwen-plus";
3937
4065
  readonly inputPrice: number;
3938
4066
  readonly outputPrice: number;
4067
+ readonly cachedInputPrice: number;
4068
+ readonly pricingTiers: [{
4069
+ readonly name: "Up to 256K";
4070
+ readonly upToTokens: 256000;
4071
+ readonly inputPrice: number;
4072
+ readonly outputPrice: number;
4073
+ readonly cachedInputPrice: number;
4074
+ }, {
4075
+ readonly name: "Over 256K";
4076
+ readonly upToTokens: number;
4077
+ readonly inputPrice: number;
4078
+ readonly outputPrice: number;
4079
+ readonly cachedInputPrice: number;
4080
+ }];
3939
4081
  readonly requestPrice: 0;
3940
4082
  readonly contextSize: 131072;
3941
4083
  readonly maxOutput: 32000;
@@ -3955,6 +4097,20 @@ export declare const models: [{
3955
4097
  readonly modelName: "qwen-plus-latest";
3956
4098
  readonly inputPrice: number;
3957
4099
  readonly outputPrice: number;
4100
+ readonly cachedInputPrice: number;
4101
+ readonly pricingTiers: [{
4102
+ readonly name: "Up to 256K";
4103
+ readonly upToTokens: 256000;
4104
+ readonly inputPrice: number;
4105
+ readonly outputPrice: number;
4106
+ readonly cachedInputPrice: number;
4107
+ }, {
4108
+ readonly name: "Over 256K";
4109
+ readonly upToTokens: number;
4110
+ readonly inputPrice: number;
4111
+ readonly outputPrice: number;
4112
+ readonly cachedInputPrice: number;
4113
+ }];
3958
4114
  readonly requestPrice: 0;
3959
4115
  readonly contextSize: 1000000;
3960
4116
  readonly maxOutput: 32000;
@@ -3974,6 +4130,20 @@ export declare const models: [{
3974
4130
  readonly modelName: "qwen-flash";
3975
4131
  readonly inputPrice: number;
3976
4132
  readonly outputPrice: number;
4133
+ readonly cachedInputPrice: number;
4134
+ readonly pricingTiers: [{
4135
+ readonly name: "Up to 256K";
4136
+ readonly upToTokens: 256000;
4137
+ readonly inputPrice: number;
4138
+ readonly outputPrice: number;
4139
+ readonly cachedInputPrice: number;
4140
+ }, {
4141
+ readonly name: "Over 256K";
4142
+ readonly upToTokens: number;
4143
+ readonly inputPrice: number;
4144
+ readonly outputPrice: number;
4145
+ readonly cachedInputPrice: number;
4146
+ }];
3977
4147
  readonly requestPrice: 0;
3978
4148
  readonly contextSize: 1000000;
3979
4149
  readonly maxOutput: 32000;
@@ -4094,6 +4264,19 @@ export declare const models: [{
4094
4264
  readonly vision: false;
4095
4265
  readonly tools: true;
4096
4266
  readonly jsonOutput: true;
4267
+ }, {
4268
+ readonly providerId: "novita";
4269
+ readonly modelName: "qwen/qwen3-235b-a22b-instruct-2507";
4270
+ readonly inputPrice: number;
4271
+ readonly outputPrice: number;
4272
+ readonly requestPrice: 0;
4273
+ readonly contextSize: 131072;
4274
+ readonly maxOutput: 16384;
4275
+ readonly reasoning: false;
4276
+ readonly streaming: true;
4277
+ readonly vision: false;
4278
+ readonly tools: true;
4279
+ readonly jsonOutput: true;
4097
4280
  }];
4098
4281
  }, {
4099
4282
  readonly id: "qwen3-235b-a22b-thinking-2507";
@@ -4115,6 +4298,39 @@ export declare const models: [{
4115
4298
  readonly tools: true;
4116
4299
  readonly stability: "unstable";
4117
4300
  readonly jsonOutput: true;
4301
+ }, {
4302
+ readonly providerId: "novita";
4303
+ readonly modelName: "qwen/qwen3-235b-a22b-thinking-2507";
4304
+ readonly inputPrice: number;
4305
+ readonly outputPrice: number;
4306
+ readonly requestPrice: 0;
4307
+ readonly contextSize: 131072;
4308
+ readonly maxOutput: 32768;
4309
+ readonly reasoning: false;
4310
+ readonly streaming: true;
4311
+ readonly vision: false;
4312
+ readonly tools: true;
4313
+ readonly jsonOutput: false;
4314
+ }];
4315
+ }, {
4316
+ readonly id: "qwen3-235b-a22b-fp8";
4317
+ readonly name: "Qwen3 235B A22B FP8";
4318
+ readonly description: "Qwen 3 235B MoE with FP8 quantization.";
4319
+ readonly family: "alibaba";
4320
+ readonly releasedAt: Date;
4321
+ readonly providers: [{
4322
+ readonly providerId: "novita";
4323
+ readonly modelName: "qwen/qwen3-235b-a22b-fp8";
4324
+ readonly inputPrice: number;
4325
+ readonly outputPrice: number;
4326
+ readonly requestPrice: 0;
4327
+ readonly contextSize: 40960;
4328
+ readonly maxOutput: 20000;
4329
+ readonly reasoning: false;
4330
+ readonly streaming: true;
4331
+ readonly vision: false;
4332
+ readonly tools: false;
4333
+ readonly jsonOutput: true;
4118
4334
  }];
4119
4335
  }, {
4120
4336
  readonly id: "qwen3-14b";
@@ -4322,6 +4538,18 @@ export declare const models: [{
4322
4538
  readonly vision: false;
4323
4539
  readonly tools: true;
4324
4540
  readonly jsonOutput: true;
4541
+ }, {
4542
+ readonly providerId: "novita";
4543
+ readonly modelName: "qwen/qwen3-coder-480b-a35b-instruct";
4544
+ readonly inputPrice: number;
4545
+ readonly outputPrice: number;
4546
+ readonly requestPrice: 0;
4547
+ readonly contextSize: 262144;
4548
+ readonly maxOutput: 65536;
4549
+ readonly streaming: true;
4550
+ readonly vision: false;
4551
+ readonly tools: true;
4552
+ readonly jsonOutput: true;
4325
4553
  }];
4326
4554
  }, {
4327
4555
  readonly id: "qwen3-coder-30b-a3b-instruct";
@@ -4341,6 +4569,18 @@ export declare const models: [{
4341
4569
  readonly vision: false;
4342
4570
  readonly tools: true;
4343
4571
  readonly jsonOutput: true;
4572
+ }, {
4573
+ readonly providerId: "novita";
4574
+ readonly modelName: "qwen/qwen3-coder-30b-a3b-instruct";
4575
+ readonly inputPrice: number;
4576
+ readonly outputPrice: number;
4577
+ readonly requestPrice: 0;
4578
+ readonly contextSize: 160000;
4579
+ readonly maxOutput: 32768;
4580
+ readonly streaming: true;
4581
+ readonly vision: false;
4582
+ readonly tools: true;
4583
+ readonly jsonOutput: true;
4344
4584
  }];
4345
4585
  }, {
4346
4586
  readonly id: "qwen3-30b-a3b-instruct-2507";
@@ -4440,6 +4680,19 @@ export declare const models: [{
4440
4680
  readonly vision: false;
4441
4681
  readonly tools: true;
4442
4682
  readonly jsonOutput: false;
4683
+ }, {
4684
+ readonly providerId: "novita";
4685
+ readonly modelName: "qwen/qwen3-next-80b-a3b-thinking";
4686
+ readonly inputPrice: number;
4687
+ readonly outputPrice: number;
4688
+ readonly requestPrice: 0;
4689
+ readonly contextSize: 131072;
4690
+ readonly maxOutput: 32768;
4691
+ readonly reasoning: true;
4692
+ readonly streaming: true;
4693
+ readonly vision: false;
4694
+ readonly tools: true;
4695
+ readonly jsonOutput: false;
4443
4696
  }];
4444
4697
  }, {
4445
4698
  readonly id: "qwen3-next-80b-a3b-instruct";
@@ -4459,6 +4712,18 @@ export declare const models: [{
4459
4712
  readonly vision: false;
4460
4713
  readonly tools: true;
4461
4714
  readonly jsonOutput: true;
4715
+ }, {
4716
+ readonly providerId: "novita";
4717
+ readonly modelName: "qwen/qwen3-next-80b-a3b-instruct";
4718
+ readonly inputPrice: number;
4719
+ readonly outputPrice: number;
4720
+ readonly requestPrice: 0;
4721
+ readonly contextSize: 131072;
4722
+ readonly maxOutput: 32768;
4723
+ readonly streaming: true;
4724
+ readonly vision: false;
4725
+ readonly tools: true;
4726
+ readonly jsonOutput: true;
4462
4727
  }];
4463
4728
  }, {
4464
4729
  readonly id: "qwen3-max";
@@ -4482,6 +4747,18 @@ export declare const models: [{
4482
4747
  readonly vision: true;
4483
4748
  readonly tools: true;
4484
4749
  readonly jsonOutput: true;
4750
+ }, {
4751
+ readonly providerId: "novita";
4752
+ readonly modelName: "qwen/qwen3-max";
4753
+ readonly inputPrice: number;
4754
+ readonly outputPrice: number;
4755
+ readonly requestPrice: 0;
4756
+ readonly contextSize: 262144;
4757
+ readonly maxOutput: 65536;
4758
+ readonly streaming: true;
4759
+ readonly vision: false;
4760
+ readonly tools: true;
4761
+ readonly jsonOutput: true;
4485
4762
  }];
4486
4763
  }, {
4487
4764
  readonly id: "qwen3-coder";
@@ -4504,31 +4781,130 @@ export declare const models: [{
4504
4781
  readonly jsonOutput: true;
4505
4782
  }];
4506
4783
  }, {
4507
- readonly id: "qwen-image-plus";
4508
- readonly name: "Qwen Image Plus";
4509
- readonly description: "Alibaba's Qwen Image Plus model for text-to-image generation with excellent text rendering capabilities.";
4784
+ readonly id: "qwen3-vl-30b-a3b-instruct";
4785
+ readonly name: "Qwen3 VL 30B A3B Instruct";
4786
+ readonly description: "Vision-language Qwen 3 MoE model, 30B size.";
4510
4787
  readonly family: "alibaba";
4511
- readonly output: ["text", "image"];
4512
4788
  readonly releasedAt: Date;
4513
4789
  readonly providers: [{
4514
- readonly test: "skip";
4515
- readonly providerId: "alibaba";
4516
- readonly modelName: "qwen-image-plus";
4517
- readonly inputPrice: 0;
4518
- readonly outputPrice: 0;
4519
- readonly requestPrice: 0.03;
4520
- readonly contextSize: 2000;
4521
- readonly maxOutput: 4096;
4522
- readonly streaming: false;
4523
- readonly vision: false;
4524
- readonly tools: false;
4790
+ readonly providerId: "novita";
4791
+ readonly modelName: "qwen/qwen3-vl-30b-a3b-instruct";
4792
+ readonly inputPrice: number;
4793
+ readonly outputPrice: number;
4794
+ readonly requestPrice: 0;
4795
+ readonly contextSize: 131072;
4796
+ readonly maxOutput: 32768;
4797
+ readonly streaming: true;
4798
+ readonly vision: true;
4799
+ readonly tools: true;
4525
4800
  readonly jsonOutput: false;
4526
- readonly imageGenerations: true;
4527
4801
  }];
4528
4802
  }, {
4529
- readonly id: "qwen-image-max";
4530
- readonly name: "Qwen Image Max";
4531
- readonly description: "Alibaba's flagship Qwen Image Max model for highest quality text-to-image generation.";
4803
+ readonly id: "qwen3-vl-30b-a3b-thinking";
4804
+ readonly name: "Qwen3 VL 30B A3B Thinking";
4805
+ readonly description: "Vision-language Qwen 3 MoE with reasoning capabilities.";
4806
+ readonly family: "alibaba";
4807
+ readonly releasedAt: Date;
4808
+ readonly providers: [{
4809
+ readonly providerId: "novita";
4810
+ readonly modelName: "qwen/qwen3-vl-30b-a3b-thinking";
4811
+ readonly inputPrice: number;
4812
+ readonly outputPrice: number;
4813
+ readonly requestPrice: 0;
4814
+ readonly contextSize: 131072;
4815
+ readonly maxOutput: 32768;
4816
+ readonly reasoning: true;
4817
+ readonly streaming: true;
4818
+ readonly vision: true;
4819
+ readonly tools: true;
4820
+ readonly jsonOutput: true;
4821
+ }];
4822
+ }, {
4823
+ readonly id: "qwen3-32b-fp8";
4824
+ readonly name: "Qwen3 32B FP8";
4825
+ readonly description: "Qwen 3 32B with FP8 quantization.";
4826
+ readonly family: "alibaba";
4827
+ readonly releasedAt: Date;
4828
+ readonly providers: [{
4829
+ readonly providerId: "novita";
4830
+ readonly modelName: "qwen/qwen3-32b-fp8";
4831
+ readonly inputPrice: number;
4832
+ readonly outputPrice: number;
4833
+ readonly requestPrice: 0;
4834
+ readonly contextSize: 40960;
4835
+ readonly maxOutput: 20000;
4836
+ readonly reasoning: false;
4837
+ readonly streaming: true;
4838
+ readonly vision: false;
4839
+ readonly tools: false;
4840
+ readonly jsonOutput: false;
4841
+ }];
4842
+ }, {
4843
+ readonly id: "qwen3-30b-a3b-fp8";
4844
+ readonly name: "Qwen3 30B A3B FP8";
4845
+ readonly description: "Qwen 3 30B MoE with FP8 quantization.";
4846
+ readonly family: "alibaba";
4847
+ readonly releasedAt: Date;
4848
+ readonly providers: [{
4849
+ readonly providerId: "novita";
4850
+ readonly modelName: "qwen/qwen3-30b-a3b-fp8";
4851
+ readonly inputPrice: number;
4852
+ readonly outputPrice: number;
4853
+ readonly requestPrice: 0;
4854
+ readonly contextSize: 40960;
4855
+ readonly maxOutput: 20000;
4856
+ readonly reasoning: false;
4857
+ readonly streaming: true;
4858
+ readonly vision: false;
4859
+ readonly tools: false;
4860
+ readonly jsonOutput: false;
4861
+ }];
4862
+ }, {
4863
+ readonly id: "qwen3-4b-fp8";
4864
+ readonly name: "Qwen3 4B FP8";
4865
+ readonly description: "Lightweight Qwen 3 4B with FP8 quantization.";
4866
+ readonly family: "alibaba";
4867
+ readonly releasedAt: Date;
4868
+ readonly providers: [{
4869
+ readonly providerId: "novita";
4870
+ readonly modelName: "qwen/qwen3-4b-fp8";
4871
+ readonly inputPrice: number;
4872
+ readonly outputPrice: number;
4873
+ readonly requestPrice: 0;
4874
+ readonly contextSize: 128000;
4875
+ readonly maxOutput: 20000;
4876
+ readonly reasoning: false;
4877
+ readonly streaming: true;
4878
+ readonly vision: false;
4879
+ readonly tools: false;
4880
+ readonly jsonOutput: false;
4881
+ }];
4882
+ }, {
4883
+ readonly id: "qwen-image-plus";
4884
+ readonly name: "Qwen Image Plus";
4885
+ readonly description: "Alibaba's Qwen Image Plus model for text-to-image generation with excellent text rendering capabilities.";
4886
+ readonly family: "alibaba";
4887
+ readonly output: ["text", "image"];
4888
+ readonly releasedAt: Date;
4889
+ readonly providers: [{
4890
+ readonly test: "skip";
4891
+ readonly providerId: "alibaba";
4892
+ readonly modelName: "qwen-image-plus";
4893
+ readonly inputPrice: 0;
4894
+ readonly outputPrice: 0;
4895
+ readonly requestPrice: 0.03;
4896
+ readonly contextSize: 2000;
4897
+ readonly maxOutput: 4096;
4898
+ readonly streaming: false;
4899
+ readonly vision: false;
4900
+ readonly tools: false;
4901
+ readonly jsonOutput: false;
4902
+ readonly imageGenerations: true;
4903
+ }];
4904
+ }, {
4905
+ readonly id: "qwen-image-max";
4906
+ readonly name: "Qwen Image Max";
4907
+ readonly description: "Alibaba's flagship Qwen Image Max model for highest quality text-to-image generation.";
4532
4908
  readonly family: "alibaba";
4533
4909
  readonly output: ["text", "image"];
4534
4910
  readonly releasedAt: Date;
@@ -4591,6 +4967,341 @@ export declare const models: [{
4591
4967
  readonly jsonOutput: false;
4592
4968
  readonly imageGenerations: true;
4593
4969
  }];
4970
+ }, {
4971
+ readonly id: "qwq-plus";
4972
+ readonly name: "QwQ Plus";
4973
+ readonly description: "Alibaba's reasoning model with enhanced math and code capabilities.";
4974
+ readonly family: "alibaba";
4975
+ readonly releasedAt: Date;
4976
+ readonly providers: [{
4977
+ readonly providerId: "alibaba";
4978
+ readonly modelName: "qwq-plus";
4979
+ readonly inputPrice: number;
4980
+ readonly outputPrice: number;
4981
+ readonly requestPrice: 0;
4982
+ readonly contextSize: 131072;
4983
+ readonly maxOutput: 8192;
4984
+ readonly reasoning: true;
4985
+ readonly reasoningOutput: "omit";
4986
+ readonly streaming: true;
4987
+ readonly vision: false;
4988
+ readonly tools: false;
4989
+ readonly jsonOutput: false;
4990
+ }];
4991
+ }, {
4992
+ readonly id: "qwen-coder-plus";
4993
+ readonly name: "Qwen Coder Plus";
4994
+ readonly description: "Alibaba's code-specialized model based on Qwen2.5.";
4995
+ readonly family: "alibaba";
4996
+ readonly releasedAt: Date;
4997
+ readonly providers: [{
4998
+ readonly test: "skip";
4999
+ readonly providerId: "alibaba";
5000
+ readonly modelName: "qwen-coder-plus";
5001
+ readonly inputPrice: number;
5002
+ readonly outputPrice: number;
5003
+ readonly requestPrice: 0;
5004
+ readonly contextSize: 131072;
5005
+ readonly maxOutput: 8192;
5006
+ readonly streaming: true;
5007
+ readonly vision: false;
5008
+ readonly tools: true;
5009
+ readonly jsonOutput: true;
5010
+ }];
5011
+ }, {
5012
+ readonly id: "qwen3-coder-flash";
5013
+ readonly name: "Qwen3 Coder Flash";
5014
+ readonly description: "Fast, cost-effective Qwen 3 model for code generation.";
5015
+ readonly family: "alibaba";
5016
+ readonly releasedAt: Date;
5017
+ readonly providers: [{
5018
+ readonly providerId: "alibaba";
5019
+ readonly modelName: "qwen3-coder-flash";
5020
+ readonly inputPrice: number;
5021
+ readonly outputPrice: number;
5022
+ readonly cachedInputPrice: number;
5023
+ readonly pricingTiers: [{
5024
+ readonly name: "Up to 32K";
5025
+ readonly upToTokens: 32000;
5026
+ readonly inputPrice: number;
5027
+ readonly outputPrice: number;
5028
+ readonly cachedInputPrice: number;
5029
+ }, {
5030
+ readonly name: "32K-128K";
5031
+ readonly upToTokens: 128000;
5032
+ readonly inputPrice: number;
5033
+ readonly outputPrice: number;
5034
+ readonly cachedInputPrice: number;
5035
+ }, {
5036
+ readonly name: "128K-256K";
5037
+ readonly upToTokens: 256000;
5038
+ readonly inputPrice: number;
5039
+ readonly outputPrice: number;
5040
+ readonly cachedInputPrice: number;
5041
+ }, {
5042
+ readonly name: "Over 256K";
5043
+ readonly upToTokens: number;
5044
+ readonly inputPrice: number;
5045
+ readonly outputPrice: number;
5046
+ readonly cachedInputPrice: number;
5047
+ }];
5048
+ readonly requestPrice: 0;
5049
+ readonly contextSize: 1000000;
5050
+ readonly maxOutput: 65536;
5051
+ readonly streaming: true;
5052
+ readonly vision: false;
5053
+ readonly tools: true;
5054
+ readonly jsonOutput: true;
5055
+ }];
5056
+ }, {
5057
+ readonly id: "qwen3-vl-plus";
5058
+ readonly name: "Qwen3 VL Plus";
5059
+ readonly description: "Qwen 3 vision-language model with balanced performance.";
5060
+ readonly family: "alibaba";
5061
+ readonly releasedAt: Date;
5062
+ readonly providers: [{
5063
+ readonly providerId: "alibaba";
5064
+ readonly modelName: "qwen3-vl-plus";
5065
+ readonly inputPrice: number;
5066
+ readonly outputPrice: number;
5067
+ readonly cachedInputPrice: number;
5068
+ readonly pricingTiers: [{
5069
+ readonly name: "Up to 32K";
5070
+ readonly upToTokens: 32000;
5071
+ readonly inputPrice: number;
5072
+ readonly outputPrice: number;
5073
+ readonly cachedInputPrice: number;
5074
+ }, {
5075
+ readonly name: "32K-128K";
5076
+ readonly upToTokens: 128000;
5077
+ readonly inputPrice: number;
5078
+ readonly outputPrice: number;
5079
+ readonly cachedInputPrice: number;
5080
+ }, {
5081
+ readonly name: "Over 128K";
5082
+ readonly upToTokens: number;
5083
+ readonly inputPrice: number;
5084
+ readonly outputPrice: number;
5085
+ readonly cachedInputPrice: number;
5086
+ }];
5087
+ readonly requestPrice: 0;
5088
+ readonly contextSize: 262144;
5089
+ readonly maxOutput: 32768;
5090
+ readonly streaming: true;
5091
+ readonly vision: true;
5092
+ readonly tools: false;
5093
+ readonly jsonOutput: true;
5094
+ }];
5095
+ }, {
5096
+ readonly id: "qwen3-vl-flash";
5097
+ readonly name: "Qwen3 VL Flash";
5098
+ readonly description: "Fast Qwen 3 vision-language model for quick image tasks.";
5099
+ readonly family: "alibaba";
5100
+ readonly releasedAt: Date;
5101
+ readonly providers: [{
5102
+ readonly providerId: "alibaba";
5103
+ readonly modelName: "qwen3-vl-flash";
5104
+ readonly inputPrice: number;
5105
+ readonly outputPrice: number;
5106
+ readonly cachedInputPrice: number;
5107
+ readonly pricingTiers: [{
5108
+ readonly name: "Up to 32K";
5109
+ readonly upToTokens: 32000;
5110
+ readonly inputPrice: number;
5111
+ readonly outputPrice: number;
5112
+ readonly cachedInputPrice: number;
5113
+ }, {
5114
+ readonly name: "32K-128K";
5115
+ readonly upToTokens: 128000;
5116
+ readonly inputPrice: number;
5117
+ readonly outputPrice: number;
5118
+ readonly cachedInputPrice: number;
5119
+ }, {
5120
+ readonly name: "Over 128K";
5121
+ readonly upToTokens: number;
5122
+ readonly inputPrice: number;
5123
+ readonly outputPrice: number;
5124
+ readonly cachedInputPrice: number;
5125
+ }];
5126
+ readonly requestPrice: 0;
5127
+ readonly contextSize: 262144;
5128
+ readonly maxOutput: 32768;
5129
+ readonly streaming: true;
5130
+ readonly vision: true;
5131
+ readonly tools: true;
5132
+ readonly jsonOutput: true;
5133
+ }];
5134
+ }, {
5135
+ readonly id: "qwen3-vl-235b-a22b-instruct";
5136
+ readonly name: "Qwen3 VL 235B A22B Instruct";
5137
+ readonly description: "Large Qwen 3 MoE vision-language instruction model.";
5138
+ readonly family: "alibaba";
5139
+ readonly releasedAt: Date;
5140
+ readonly providers: [{
5141
+ readonly providerId: "alibaba";
5142
+ readonly modelName: "qwen3-vl-235b-a22b-instruct";
5143
+ readonly inputPrice: number;
5144
+ readonly outputPrice: number;
5145
+ readonly requestPrice: 0;
5146
+ readonly contextSize: 131072;
5147
+ readonly maxOutput: 32768;
5148
+ readonly streaming: true;
5149
+ readonly vision: true;
5150
+ readonly tools: true;
5151
+ readonly jsonOutput: true;
5152
+ }, {
5153
+ readonly providerId: "novita";
5154
+ readonly modelName: "qwen/qwen3-vl-235b-a22b-instruct";
5155
+ readonly inputPrice: number;
5156
+ readonly outputPrice: number;
5157
+ readonly requestPrice: 0;
5158
+ readonly contextSize: 131072;
5159
+ readonly maxOutput: 32768;
5160
+ readonly streaming: true;
5161
+ readonly vision: true;
5162
+ readonly tools: true;
5163
+ readonly jsonOutput: true;
5164
+ }];
5165
+ }, {
5166
+ readonly id: "qwen3-vl-235b-a22b-thinking";
5167
+ readonly name: "Qwen3 VL 235B A22B Thinking";
5168
+ readonly description: "Large Qwen 3 MoE vision-language model with reasoning capabilities.";
5169
+ readonly family: "alibaba";
5170
+ readonly releasedAt: Date;
5171
+ readonly providers: [{
5172
+ readonly providerId: "alibaba";
5173
+ readonly modelName: "qwen3-vl-235b-a22b-thinking";
5174
+ readonly inputPrice: number;
5175
+ readonly outputPrice: number;
5176
+ readonly requestPrice: 0;
5177
+ readonly contextSize: 131072;
5178
+ readonly maxOutput: 32768;
5179
+ readonly reasoning: true;
5180
+ readonly reasoningOutput: "omit";
5181
+ readonly streaming: true;
5182
+ readonly vision: true;
5183
+ readonly tools: false;
5184
+ readonly jsonOutput: false;
5185
+ }, {
5186
+ readonly providerId: "novita";
5187
+ readonly modelName: "qwen/qwen3-vl-235b-a22b-thinking";
5188
+ readonly inputPrice: number;
5189
+ readonly outputPrice: number;
5190
+ readonly requestPrice: 0;
5191
+ readonly contextSize: 131072;
5192
+ readonly maxOutput: 32768;
5193
+ readonly reasoning: true;
5194
+ readonly streaming: true;
5195
+ readonly vision: true;
5196
+ readonly tools: false;
5197
+ readonly jsonOutput: false;
5198
+ }];
5199
+ }, {
5200
+ readonly id: "qwen2-5-vl-32b-instruct";
5201
+ readonly name: "Qwen2.5 VL 32B Instruct";
5202
+ readonly description: "Vision-language Qwen 2.5 model, 32B size.";
5203
+ readonly family: "alibaba";
5204
+ readonly releasedAt: Date;
5205
+ readonly providers: [{
5206
+ readonly test: "skip";
5207
+ readonly providerId: "alibaba";
5208
+ readonly modelName: "qwen2.5-vl-32b-instruct";
5209
+ readonly inputPrice: number;
5210
+ readonly outputPrice: number;
5211
+ readonly requestPrice: 0;
5212
+ readonly contextSize: 131072;
5213
+ readonly maxOutput: 32768;
5214
+ readonly streaming: true;
5215
+ readonly vision: true;
5216
+ readonly tools: false;
5217
+ readonly jsonOutput: true;
5218
+ }];
5219
+ }, {
5220
+ readonly id: "qwen3-max-2026-01-23";
5221
+ readonly name: "Qwen3 Max 2026-01-23";
5222
+ readonly description: "Latest Qwen 3 flagship model with integrated thinking mode and tool support.";
5223
+ readonly family: "alibaba";
5224
+ readonly releasedAt: Date;
5225
+ readonly providers: [{
5226
+ readonly test: "skip";
5227
+ readonly providerId: "alibaba";
5228
+ readonly modelName: "qwen3-max-2026-01-23";
5229
+ readonly inputPrice: number;
5230
+ readonly outputPrice: number;
5231
+ readonly cachedInputPrice: number;
5232
+ readonly pricingTiers: [{
5233
+ readonly name: "Up to 32K";
5234
+ readonly upToTokens: 32000;
5235
+ readonly inputPrice: number;
5236
+ readonly outputPrice: number;
5237
+ readonly cachedInputPrice: number;
5238
+ }, {
5239
+ readonly name: "32K-128K";
5240
+ readonly upToTokens: 128000;
5241
+ readonly inputPrice: number;
5242
+ readonly outputPrice: number;
5243
+ readonly cachedInputPrice: number;
5244
+ }, {
5245
+ readonly name: "Over 128K";
5246
+ readonly upToTokens: number;
5247
+ readonly inputPrice: number;
5248
+ readonly outputPrice: number;
5249
+ readonly cachedInputPrice: number;
5250
+ }];
5251
+ readonly requestPrice: 0;
5252
+ readonly contextSize: 262144;
5253
+ readonly maxOutput: 65536;
5254
+ readonly reasoning: true;
5255
+ readonly reasoningOutput: "omit";
5256
+ readonly streaming: true;
5257
+ readonly vision: true;
5258
+ readonly tools: true;
5259
+ readonly jsonOutput: true;
5260
+ }];
5261
+ }, {
5262
+ readonly id: "qwen-image-edit-plus";
5263
+ readonly name: "Qwen Image Edit Plus";
5264
+ readonly description: "Alibaba's image editing model for modifying existing images.";
5265
+ readonly family: "alibaba";
5266
+ readonly output: ["text", "image"];
5267
+ readonly releasedAt: Date;
5268
+ readonly providers: [{
5269
+ readonly test: "skip";
5270
+ readonly providerId: "alibaba";
5271
+ readonly modelName: "qwen-image-edit-plus";
5272
+ readonly inputPrice: 0;
5273
+ readonly outputPrice: 0;
5274
+ readonly requestPrice: 0.04;
5275
+ readonly contextSize: 2000;
5276
+ readonly maxOutput: 4096;
5277
+ readonly streaming: false;
5278
+ readonly vision: true;
5279
+ readonly tools: false;
5280
+ readonly jsonOutput: false;
5281
+ readonly imageGenerations: true;
5282
+ }];
5283
+ }, {
5284
+ readonly id: "qwen-image-edit-max";
5285
+ readonly name: "Qwen Image Edit Max";
5286
+ readonly description: "Alibaba's flagship image editing model for high-quality image modifications.";
5287
+ readonly family: "alibaba";
5288
+ readonly output: ["text", "image"];
5289
+ readonly releasedAt: Date;
5290
+ readonly providers: [{
5291
+ readonly test: "skip";
5292
+ readonly providerId: "alibaba";
5293
+ readonly modelName: "qwen-image-edit-max";
5294
+ readonly inputPrice: 0;
5295
+ readonly outputPrice: 0;
5296
+ readonly requestPrice: 0.08;
5297
+ readonly contextSize: 2000;
5298
+ readonly maxOutput: 4096;
5299
+ readonly streaming: false;
5300
+ readonly vision: true;
5301
+ readonly tools: false;
5302
+ readonly jsonOutput: false;
5303
+ readonly imageGenerations: true;
5304
+ }];
4594
5305
  }, {
4595
5306
  readonly id: "seed-1-6-250615";
4596
5307
  readonly name: "Seed 1.6 (250615)";
@@ -4741,6 +5452,26 @@ export declare const models: [{
4741
5452
  readonly jsonOutput: true;
4742
5453
  readonly deactivatedAt: Date;
4743
5454
  }];
5455
+ }, {
5456
+ readonly id: "hermes-2-pro-llama-3-8b";
5457
+ readonly name: "Hermes 2 Pro Llama 3 8B";
5458
+ readonly description: "Nous Research Hermes 2 Pro based on Llama 3 8B.";
5459
+ readonly family: "nousresearch";
5460
+ readonly releasedAt: Date;
5461
+ readonly providers: [{
5462
+ readonly providerId: "novita";
5463
+ readonly stability: "unstable";
5464
+ readonly modelName: "nousresearch/hermes-2-pro-llama-3-8b";
5465
+ readonly inputPrice: number;
5466
+ readonly outputPrice: number;
5467
+ readonly requestPrice: 0;
5468
+ readonly contextSize: 8192;
5469
+ readonly maxOutput: 8192;
5470
+ readonly streaming: true;
5471
+ readonly vision: false;
5472
+ readonly tools: false;
5473
+ readonly jsonOutput: false;
5474
+ }];
4744
5475
  }, {
4745
5476
  readonly id: "deepseek-r1t2-chimera-free";
4746
5477
  readonly name: "DeepSeek R1T2 Chimera (Free)";