@llmgateway/models 1.4.0 → 1.5.1

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
@@ -249,6 +249,19 @@ export declare const alibabaModels: [{
249
249
  readonly vision: false;
250
250
  readonly tools: true;
251
251
  readonly jsonOutput: true;
252
+ }, {
253
+ readonly providerId: "novita";
254
+ readonly modelName: "qwen/qwen3-235b-a22b-instruct-2507";
255
+ readonly inputPrice: number;
256
+ readonly outputPrice: number;
257
+ readonly requestPrice: 0;
258
+ readonly contextSize: 131072;
259
+ readonly maxOutput: 16384;
260
+ readonly reasoning: false;
261
+ readonly streaming: true;
262
+ readonly vision: false;
263
+ readonly tools: true;
264
+ readonly jsonOutput: true;
252
265
  }];
253
266
  }, {
254
267
  readonly id: "qwen3-235b-a22b-thinking-2507";
@@ -270,6 +283,39 @@ export declare const alibabaModels: [{
270
283
  readonly tools: true;
271
284
  readonly stability: "unstable";
272
285
  readonly jsonOutput: true;
286
+ }, {
287
+ readonly providerId: "novita";
288
+ readonly modelName: "qwen/qwen3-235b-a22b-thinking-2507";
289
+ readonly inputPrice: number;
290
+ readonly outputPrice: number;
291
+ readonly requestPrice: 0;
292
+ readonly contextSize: 131072;
293
+ readonly maxOutput: 32768;
294
+ readonly reasoning: false;
295
+ readonly streaming: true;
296
+ readonly vision: false;
297
+ readonly tools: true;
298
+ readonly jsonOutput: false;
299
+ }];
300
+ }, {
301
+ readonly id: "qwen3-235b-a22b-fp8";
302
+ readonly name: "Qwen3 235B A22B FP8";
303
+ readonly description: "Qwen 3 235B MoE with FP8 quantization.";
304
+ readonly family: "alibaba";
305
+ readonly releasedAt: Date;
306
+ readonly providers: [{
307
+ readonly providerId: "novita";
308
+ readonly modelName: "qwen/qwen3-235b-a22b-fp8";
309
+ readonly inputPrice: number;
310
+ readonly outputPrice: number;
311
+ readonly requestPrice: 0;
312
+ readonly contextSize: 40960;
313
+ readonly maxOutput: 20000;
314
+ readonly reasoning: false;
315
+ readonly streaming: true;
316
+ readonly vision: false;
317
+ readonly tools: false;
318
+ readonly jsonOutput: true;
273
319
  }];
274
320
  }, {
275
321
  readonly id: "qwen3-14b";
@@ -477,6 +523,18 @@ export declare const alibabaModels: [{
477
523
  readonly vision: false;
478
524
  readonly tools: true;
479
525
  readonly jsonOutput: true;
526
+ }, {
527
+ readonly providerId: "novita";
528
+ readonly modelName: "qwen/qwen3-coder-480b-a35b-instruct";
529
+ readonly inputPrice: number;
530
+ readonly outputPrice: number;
531
+ readonly requestPrice: 0;
532
+ readonly contextSize: 262144;
533
+ readonly maxOutput: 65536;
534
+ readonly streaming: true;
535
+ readonly vision: false;
536
+ readonly tools: true;
537
+ readonly jsonOutput: true;
480
538
  }];
481
539
  }, {
482
540
  readonly id: "qwen3-coder-30b-a3b-instruct";
@@ -496,6 +554,18 @@ export declare const alibabaModels: [{
496
554
  readonly vision: false;
497
555
  readonly tools: true;
498
556
  readonly jsonOutput: true;
557
+ }, {
558
+ readonly providerId: "novita";
559
+ readonly modelName: "qwen/qwen3-coder-30b-a3b-instruct";
560
+ readonly inputPrice: number;
561
+ readonly outputPrice: number;
562
+ readonly requestPrice: 0;
563
+ readonly contextSize: 160000;
564
+ readonly maxOutput: 32768;
565
+ readonly streaming: true;
566
+ readonly vision: false;
567
+ readonly tools: true;
568
+ readonly jsonOutput: true;
499
569
  }];
500
570
  }, {
501
571
  readonly id: "qwen3-30b-a3b-instruct-2507";
@@ -595,6 +665,19 @@ export declare const alibabaModels: [{
595
665
  readonly vision: false;
596
666
  readonly tools: true;
597
667
  readonly jsonOutput: false;
668
+ }, {
669
+ readonly providerId: "novita";
670
+ readonly modelName: "qwen/qwen3-next-80b-a3b-thinking";
671
+ readonly inputPrice: number;
672
+ readonly outputPrice: number;
673
+ readonly requestPrice: 0;
674
+ readonly contextSize: 131072;
675
+ readonly maxOutput: 32768;
676
+ readonly reasoning: true;
677
+ readonly streaming: true;
678
+ readonly vision: false;
679
+ readonly tools: true;
680
+ readonly jsonOutput: false;
598
681
  }];
599
682
  }, {
600
683
  readonly id: "qwen3-next-80b-a3b-instruct";
@@ -614,6 +697,18 @@ export declare const alibabaModels: [{
614
697
  readonly vision: false;
615
698
  readonly tools: true;
616
699
  readonly jsonOutput: true;
700
+ }, {
701
+ readonly providerId: "novita";
702
+ readonly modelName: "qwen/qwen3-next-80b-a3b-instruct";
703
+ readonly inputPrice: number;
704
+ readonly outputPrice: number;
705
+ readonly requestPrice: 0;
706
+ readonly contextSize: 131072;
707
+ readonly maxOutput: 32768;
708
+ readonly streaming: true;
709
+ readonly vision: false;
710
+ readonly tools: true;
711
+ readonly jsonOutput: true;
617
712
  }];
618
713
  }, {
619
714
  readonly id: "qwen3-max";
@@ -637,6 +732,18 @@ export declare const alibabaModels: [{
637
732
  readonly vision: true;
638
733
  readonly tools: true;
639
734
  readonly jsonOutput: true;
735
+ }, {
736
+ readonly providerId: "novita";
737
+ readonly modelName: "qwen/qwen3-max";
738
+ readonly inputPrice: number;
739
+ readonly outputPrice: number;
740
+ readonly requestPrice: 0;
741
+ readonly contextSize: 262144;
742
+ readonly maxOutput: 65536;
743
+ readonly streaming: true;
744
+ readonly vision: false;
745
+ readonly tools: true;
746
+ readonly jsonOutput: true;
640
747
  }];
641
748
  }, {
642
749
  readonly id: "qwen3-coder";
@@ -658,6 +765,105 @@ export declare const alibabaModels: [{
658
765
  readonly tools: true;
659
766
  readonly jsonOutput: true;
660
767
  }];
768
+ }, {
769
+ readonly id: "qwen3-vl-30b-a3b-instruct";
770
+ readonly name: "Qwen3 VL 30B A3B Instruct";
771
+ readonly description: "Vision-language Qwen 3 MoE model, 30B size.";
772
+ readonly family: "alibaba";
773
+ readonly releasedAt: Date;
774
+ readonly providers: [{
775
+ readonly providerId: "novita";
776
+ readonly modelName: "qwen/qwen3-vl-30b-a3b-instruct";
777
+ readonly inputPrice: number;
778
+ readonly outputPrice: number;
779
+ readonly requestPrice: 0;
780
+ readonly contextSize: 131072;
781
+ readonly maxOutput: 32768;
782
+ readonly streaming: true;
783
+ readonly vision: true;
784
+ readonly tools: true;
785
+ readonly jsonOutput: false;
786
+ }];
787
+ }, {
788
+ readonly id: "qwen3-vl-30b-a3b-thinking";
789
+ readonly name: "Qwen3 VL 30B A3B Thinking";
790
+ readonly description: "Vision-language Qwen 3 MoE with reasoning capabilities.";
791
+ readonly family: "alibaba";
792
+ readonly releasedAt: Date;
793
+ readonly providers: [{
794
+ readonly providerId: "novita";
795
+ readonly modelName: "qwen/qwen3-vl-30b-a3b-thinking";
796
+ readonly inputPrice: number;
797
+ readonly outputPrice: number;
798
+ readonly requestPrice: 0;
799
+ readonly contextSize: 131072;
800
+ readonly maxOutput: 32768;
801
+ readonly reasoning: true;
802
+ readonly streaming: true;
803
+ readonly vision: true;
804
+ readonly tools: true;
805
+ readonly jsonOutput: true;
806
+ }];
807
+ }, {
808
+ readonly id: "qwen3-32b-fp8";
809
+ readonly name: "Qwen3 32B FP8";
810
+ readonly description: "Qwen 3 32B with FP8 quantization.";
811
+ readonly family: "alibaba";
812
+ readonly releasedAt: Date;
813
+ readonly providers: [{
814
+ readonly providerId: "novita";
815
+ readonly modelName: "qwen/qwen3-32b-fp8";
816
+ readonly inputPrice: number;
817
+ readonly outputPrice: number;
818
+ readonly requestPrice: 0;
819
+ readonly contextSize: 40960;
820
+ readonly maxOutput: 20000;
821
+ readonly reasoning: false;
822
+ readonly streaming: true;
823
+ readonly vision: false;
824
+ readonly tools: false;
825
+ readonly jsonOutput: false;
826
+ }];
827
+ }, {
828
+ readonly id: "qwen3-30b-a3b-fp8";
829
+ readonly name: "Qwen3 30B A3B FP8";
830
+ readonly description: "Qwen 3 30B MoE with FP8 quantization.";
831
+ readonly family: "alibaba";
832
+ readonly releasedAt: Date;
833
+ readonly providers: [{
834
+ readonly providerId: "novita";
835
+ readonly modelName: "qwen/qwen3-30b-a3b-fp8";
836
+ readonly inputPrice: number;
837
+ readonly outputPrice: number;
838
+ readonly requestPrice: 0;
839
+ readonly contextSize: 40960;
840
+ readonly maxOutput: 20000;
841
+ readonly reasoning: false;
842
+ readonly streaming: true;
843
+ readonly vision: false;
844
+ readonly tools: false;
845
+ readonly jsonOutput: false;
846
+ }];
847
+ }, {
848
+ readonly id: "qwen3-4b-fp8";
849
+ readonly name: "Qwen3 4B FP8";
850
+ readonly description: "Lightweight Qwen 3 4B with FP8 quantization.";
851
+ readonly family: "alibaba";
852
+ readonly releasedAt: Date;
853
+ readonly providers: [{
854
+ readonly providerId: "novita";
855
+ readonly modelName: "qwen/qwen3-4b-fp8";
856
+ readonly inputPrice: number;
857
+ readonly outputPrice: number;
858
+ readonly requestPrice: 0;
859
+ readonly contextSize: 128000;
860
+ readonly maxOutput: 20000;
861
+ readonly reasoning: false;
862
+ readonly streaming: true;
863
+ readonly vision: false;
864
+ readonly tools: false;
865
+ readonly jsonOutput: false;
866
+ }];
661
867
  }, {
662
868
  readonly id: "qwen-image-plus";
663
869
  readonly name: "Qwen Image Plus";
@@ -928,6 +1134,18 @@ export declare const alibabaModels: [{
928
1134
  readonly vision: true;
929
1135
  readonly tools: true;
930
1136
  readonly jsonOutput: true;
1137
+ }, {
1138
+ readonly providerId: "novita";
1139
+ readonly modelName: "qwen/qwen3-vl-235b-a22b-instruct";
1140
+ readonly inputPrice: number;
1141
+ readonly outputPrice: number;
1142
+ readonly requestPrice: 0;
1143
+ readonly contextSize: 131072;
1144
+ readonly maxOutput: 32768;
1145
+ readonly streaming: true;
1146
+ readonly vision: true;
1147
+ readonly tools: true;
1148
+ readonly jsonOutput: true;
931
1149
  }];
932
1150
  }, {
933
1151
  readonly id: "qwen3-vl-235b-a22b-thinking";
@@ -949,6 +1167,19 @@ export declare const alibabaModels: [{
949
1167
  readonly vision: true;
950
1168
  readonly tools: false;
951
1169
  readonly jsonOutput: false;
1170
+ }, {
1171
+ readonly providerId: "novita";
1172
+ readonly modelName: "qwen/qwen3-vl-235b-a22b-thinking";
1173
+ readonly inputPrice: number;
1174
+ readonly outputPrice: number;
1175
+ readonly requestPrice: 0;
1176
+ readonly contextSize: 131072;
1177
+ readonly maxOutput: 32768;
1178
+ readonly reasoning: true;
1179
+ readonly streaming: true;
1180
+ readonly vision: true;
1181
+ readonly tools: false;
1182
+ readonly jsonOutput: false;
952
1183
  }];
953
1184
  }, {
954
1185
  readonly id: "qwen2-5-vl-32b-instruct";
@@ -289,6 +289,20 @@ export const alibabaModels = [
289
289
  tools: true,
290
290
  jsonOutput: true,
291
291
  },
292
+ {
293
+ providerId: "novita",
294
+ modelName: "qwen/qwen3-235b-a22b-instruct-2507",
295
+ inputPrice: 0.09 / 1e6,
296
+ outputPrice: 0.58 / 1e6,
297
+ requestPrice: 0,
298
+ contextSize: 131072,
299
+ maxOutput: 16384,
300
+ reasoning: false,
301
+ streaming: true,
302
+ vision: false,
303
+ tools: true,
304
+ jsonOutput: true,
305
+ },
292
306
  ],
293
307
  },
294
308
  {
@@ -313,6 +327,43 @@ export const alibabaModels = [
313
327
  stability: "unstable",
314
328
  jsonOutput: true,
315
329
  },
330
+ {
331
+ providerId: "novita",
332
+ modelName: "qwen/qwen3-235b-a22b-thinking-2507",
333
+ inputPrice: 0.3 / 1e6,
334
+ outputPrice: 3 / 1e6,
335
+ requestPrice: 0,
336
+ contextSize: 131072,
337
+ maxOutput: 32768,
338
+ reasoning: false,
339
+ streaming: true,
340
+ vision: false,
341
+ tools: true,
342
+ jsonOutput: false,
343
+ },
344
+ ],
345
+ },
346
+ {
347
+ id: "qwen3-235b-a22b-fp8",
348
+ name: "Qwen3 235B A22B FP8",
349
+ description: "Qwen 3 235B MoE with FP8 quantization.",
350
+ family: "alibaba",
351
+ releasedAt: new Date("2025-04-28"),
352
+ providers: [
353
+ {
354
+ providerId: "novita",
355
+ modelName: "qwen/qwen3-235b-a22b-fp8",
356
+ inputPrice: 0.2 / 1e6,
357
+ outputPrice: 0.8 / 1e6,
358
+ requestPrice: 0,
359
+ contextSize: 40960,
360
+ maxOutput: 20000,
361
+ reasoning: false,
362
+ streaming: true,
363
+ vision: false,
364
+ tools: false,
365
+ jsonOutput: true,
366
+ },
316
367
  ],
317
368
  },
318
369
  {
@@ -551,6 +602,19 @@ export const alibabaModels = [
551
602
  tools: true,
552
603
  jsonOutput: true,
553
604
  },
605
+ {
606
+ providerId: "novita",
607
+ modelName: "qwen/qwen3-coder-480b-a35b-instruct",
608
+ inputPrice: 0.3 / 1e6,
609
+ outputPrice: 1.3 / 1e6,
610
+ requestPrice: 0,
611
+ contextSize: 262144,
612
+ maxOutput: 65536,
613
+ streaming: true,
614
+ vision: false,
615
+ tools: true,
616
+ jsonOutput: true,
617
+ },
554
618
  ],
555
619
  },
556
620
  {
@@ -573,6 +637,19 @@ export const alibabaModels = [
573
637
  tools: true,
574
638
  jsonOutput: true,
575
639
  },
640
+ {
641
+ providerId: "novita",
642
+ modelName: "qwen/qwen3-coder-30b-a3b-instruct",
643
+ inputPrice: 0.07 / 1e6,
644
+ outputPrice: 0.27 / 1e6,
645
+ requestPrice: 0,
646
+ contextSize: 160000,
647
+ maxOutput: 32768,
648
+ streaming: true,
649
+ vision: false,
650
+ tools: true,
651
+ jsonOutput: true,
652
+ },
576
653
  ],
577
654
  },
578
655
  {
@@ -687,6 +764,20 @@ export const alibabaModels = [
687
764
  tools: true,
688
765
  jsonOutput: false,
689
766
  },
767
+ {
768
+ providerId: "novita",
769
+ modelName: "qwen/qwen3-next-80b-a3b-thinking",
770
+ inputPrice: 0.15 / 1e6,
771
+ outputPrice: 1.5 / 1e6,
772
+ requestPrice: 0,
773
+ contextSize: 131072,
774
+ maxOutput: 32768,
775
+ reasoning: true,
776
+ streaming: true,
777
+ vision: false,
778
+ tools: true,
779
+ jsonOutput: false,
780
+ },
690
781
  ],
691
782
  },
692
783
  {
@@ -709,6 +800,19 @@ export const alibabaModels = [
709
800
  tools: true,
710
801
  jsonOutput: true,
711
802
  },
803
+ {
804
+ providerId: "novita",
805
+ modelName: "qwen/qwen3-next-80b-a3b-instruct",
806
+ inputPrice: 0.15 / 1e6,
807
+ outputPrice: 1.5 / 1e6,
808
+ requestPrice: 0,
809
+ contextSize: 131072,
810
+ maxOutput: 32768,
811
+ streaming: true,
812
+ vision: false,
813
+ tools: true,
814
+ jsonOutput: true,
815
+ },
712
816
  ],
713
817
  },
714
818
  {
@@ -735,6 +839,19 @@ export const alibabaModels = [
735
839
  tools: true,
736
840
  jsonOutput: true,
737
841
  },
842
+ {
843
+ providerId: "novita",
844
+ modelName: "qwen/qwen3-max",
845
+ inputPrice: 0.845 / 1e6,
846
+ outputPrice: 3.38 / 1e6,
847
+ requestPrice: 0,
848
+ contextSize: 262144,
849
+ maxOutput: 65536,
850
+ streaming: true,
851
+ vision: false,
852
+ tools: true,
853
+ jsonOutput: true,
854
+ },
738
855
  ],
739
856
  },
740
857
  {
@@ -760,6 +877,120 @@ export const alibabaModels = [
760
877
  },
761
878
  ],
762
879
  },
880
+ {
881
+ id: "qwen3-vl-30b-a3b-instruct",
882
+ name: "Qwen3 VL 30B A3B Instruct",
883
+ description: "Vision-language Qwen 3 MoE model, 30B size.",
884
+ family: "alibaba",
885
+ releasedAt: new Date("2025-10-05"),
886
+ providers: [
887
+ {
888
+ providerId: "novita",
889
+ modelName: "qwen/qwen3-vl-30b-a3b-instruct",
890
+ inputPrice: 0.2 / 1e6,
891
+ outputPrice: 0.7 / 1e6,
892
+ requestPrice: 0,
893
+ contextSize: 131072,
894
+ maxOutput: 32768,
895
+ streaming: true,
896
+ vision: true,
897
+ tools: true,
898
+ jsonOutput: false,
899
+ },
900
+ ],
901
+ },
902
+ {
903
+ id: "qwen3-vl-30b-a3b-thinking",
904
+ name: "Qwen3 VL 30B A3B Thinking",
905
+ description: "Vision-language Qwen 3 MoE with reasoning capabilities.",
906
+ family: "alibaba",
907
+ releasedAt: new Date("2025-10-11"),
908
+ providers: [
909
+ {
910
+ providerId: "novita",
911
+ modelName: "qwen/qwen3-vl-30b-a3b-thinking",
912
+ inputPrice: 0.2 / 1e6,
913
+ outputPrice: 1 / 1e6,
914
+ requestPrice: 0,
915
+ contextSize: 131072,
916
+ maxOutput: 32768,
917
+ reasoning: true,
918
+ streaming: true,
919
+ vision: true,
920
+ tools: true,
921
+ jsonOutput: true,
922
+ },
923
+ ],
924
+ },
925
+ {
926
+ id: "qwen3-32b-fp8",
927
+ name: "Qwen3 32B FP8",
928
+ description: "Qwen 3 32B with FP8 quantization.",
929
+ family: "alibaba",
930
+ releasedAt: new Date("2025-04-28"),
931
+ providers: [
932
+ {
933
+ providerId: "novita",
934
+ modelName: "qwen/qwen3-32b-fp8",
935
+ inputPrice: 0.1 / 1e6,
936
+ outputPrice: 0.45 / 1e6,
937
+ requestPrice: 0,
938
+ contextSize: 40960,
939
+ maxOutput: 20000,
940
+ reasoning: false,
941
+ streaming: true,
942
+ vision: false,
943
+ tools: false,
944
+ jsonOutput: false,
945
+ },
946
+ ],
947
+ },
948
+ {
949
+ id: "qwen3-30b-a3b-fp8",
950
+ name: "Qwen3 30B A3B FP8",
951
+ description: "Qwen 3 30B MoE with FP8 quantization.",
952
+ family: "alibaba",
953
+ releasedAt: new Date("2025-04-28"),
954
+ providers: [
955
+ {
956
+ providerId: "novita",
957
+ modelName: "qwen/qwen3-30b-a3b-fp8",
958
+ inputPrice: 0.09 / 1e6,
959
+ outputPrice: 0.45 / 1e6,
960
+ requestPrice: 0,
961
+ contextSize: 40960,
962
+ maxOutput: 20000,
963
+ reasoning: false,
964
+ streaming: true,
965
+ vision: false,
966
+ tools: false,
967
+ jsonOutput: false,
968
+ },
969
+ ],
970
+ },
971
+ {
972
+ id: "qwen3-4b-fp8",
973
+ name: "Qwen3 4B FP8",
974
+ description: "Lightweight Qwen 3 4B with FP8 quantization.",
975
+ family: "alibaba",
976
+ releasedAt: new Date("2025-04-28"),
977
+ providers: [
978
+ {
979
+ providerId: "novita",
980
+ modelName: "qwen/qwen3-4b-fp8",
981
+ inputPrice: 0.03 / 1e6,
982
+ outputPrice: 0.03 / 1e6,
983
+ requestPrice: 0,
984
+ contextSize: 128000,
985
+ maxOutput: 20000,
986
+ reasoning: false,
987
+ streaming: true,
988
+ vision: false,
989
+ tools: false,
990
+ jsonOutput: false,
991
+ },
992
+ ],
993
+ },
763
994
  {
764
995
  id: "qwen-image-plus",
765
996
  name: "Qwen Image Plus",
@@ -1072,6 +1303,19 @@ export const alibabaModels = [
1072
1303
  tools: true,
1073
1304
  jsonOutput: true,
1074
1305
  },
1306
+ {
1307
+ providerId: "novita",
1308
+ modelName: "qwen/qwen3-vl-235b-a22b-instruct",
1309
+ inputPrice: 0.3 / 1e6,
1310
+ outputPrice: 1.5 / 1e6,
1311
+ requestPrice: 0,
1312
+ contextSize: 131072,
1313
+ maxOutput: 32768,
1314
+ streaming: true,
1315
+ vision: true,
1316
+ tools: true,
1317
+ jsonOutput: true,
1318
+ },
1075
1319
  ],
1076
1320
  },
1077
1321
  {
@@ -1096,6 +1340,20 @@ export const alibabaModels = [
1096
1340
  tools: false,
1097
1341
  jsonOutput: false,
1098
1342
  },
1343
+ {
1344
+ providerId: "novita",
1345
+ modelName: "qwen/qwen3-vl-235b-a22b-thinking",
1346
+ inputPrice: 0.98 / 1e6,
1347
+ outputPrice: 3.95 / 1e6,
1348
+ requestPrice: 0,
1349
+ contextSize: 131072,
1350
+ maxOutput: 32768,
1351
+ reasoning: true,
1352
+ streaming: true,
1353
+ vision: true,
1354
+ tools: false,
1355
+ jsonOutput: false,
1356
+ },
1099
1357
  ],
1100
1358
  },
1101
1359
  {