xinference 1.9.1__py3-none-any.whl → 1.10.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of xinference might be problematic. Click here for more details.

Files changed (34) hide show
  1. xinference/_version.py +3 -3
  2. xinference/api/restful_api.py +415 -1
  3. xinference/constants.py +2 -0
  4. xinference/core/supervisor.py +29 -1
  5. xinference/model/audio/core.py +5 -0
  6. xinference/model/audio/kokoro.py +1 -1
  7. xinference/model/audio/kokoro_zh.py +124 -0
  8. xinference/model/audio/model_spec.json +20 -0
  9. xinference/model/embedding/sentence_transformers/core.py +4 -4
  10. xinference/model/embedding/vllm/core.py +7 -1
  11. xinference/model/image/model_spec.json +2 -3
  12. xinference/model/llm/core.py +10 -0
  13. xinference/model/llm/llama_cpp/core.py +1 -0
  14. xinference/model/llm/llm_family.json +40 -20
  15. xinference/model/llm/llm_family.py +1 -0
  16. xinference/model/llm/mlx/core.py +52 -33
  17. xinference/model/llm/sglang/core.py +2 -44
  18. xinference/model/llm/tool_parsers/__init__.py +58 -0
  19. xinference/model/llm/tool_parsers/abstract_tool_parser.py +33 -0
  20. xinference/model/llm/tool_parsers/deepseek_r1_tool_parser.py +128 -0
  21. xinference/model/llm/tool_parsers/deepseek_v3_tool_parser.py +145 -0
  22. xinference/model/llm/tool_parsers/glm4_tool_parser.py +123 -0
  23. xinference/model/llm/tool_parsers/llama3_tool_parser.py +77 -0
  24. xinference/model/llm/tool_parsers/qwen_tool_parser.py +320 -0
  25. xinference/model/llm/transformers/core.py +1 -1
  26. xinference/model/llm/utils.py +127 -45
  27. xinference/model/llm/vllm/core.py +2 -61
  28. xinference/types.py +105 -2
  29. {xinference-1.9.1.dist-info → xinference-1.10.0.dist-info}/METADATA +7 -3
  30. {xinference-1.9.1.dist-info → xinference-1.10.0.dist-info}/RECORD +34 -26
  31. {xinference-1.9.1.dist-info → xinference-1.10.0.dist-info}/WHEEL +0 -0
  32. {xinference-1.9.1.dist-info → xinference-1.10.0.dist-info}/entry_points.txt +0 -0
  33. {xinference-1.9.1.dist-info → xinference-1.10.0.dist-info}/licenses/LICENSE +0 -0
  34. {xinference-1.9.1.dist-info → xinference-1.10.0.dist-info}/top_level.txt +0 -0
xinference/types.py CHANGED
@@ -351,6 +351,11 @@ class ModelAndPrompt(BaseModel):
351
351
  prompt: str
352
352
 
353
353
 
354
+ class ModelAndMessages(BaseModel):
355
+ model: str
356
+ messages: List[Dict[str, Any]]
357
+
358
+
354
359
  class CreateCompletionTorch(BaseModel):
355
360
  echo: bool = echo_field
356
361
  max_tokens: Optional[int] = max_tokens_field
@@ -371,7 +376,6 @@ class CreateCompletionTorch(BaseModel):
371
376
  # This type is for openai API compatibility
372
377
  CreateCompletionOpenAI: BaseModel
373
378
 
374
-
375
379
  from openai.types.completion_create_params import CompletionCreateParamsNonStreaming
376
380
 
377
381
  CreateCompletionOpenAI = create_model_from_typeddict(
@@ -395,7 +399,6 @@ class CreateChatModel(BaseModel):
395
399
  # Currently, chat calls generates, so the params share the same one.
396
400
  CreateChatCompletionTorch = CreateCompletionTorch
397
401
 
398
-
399
402
  from ._compat import CreateChatCompletionOpenAI
400
403
 
401
404
 
@@ -462,3 +465,103 @@ class PeftModelConfig:
462
465
  image_lora_load_kwargs=data.get("image_lora_load_kwargs"),
463
466
  image_lora_fuse_kwargs=data.get("image_lora_fuse_kwargs"),
464
467
  )
468
+
469
+
470
+ # This type is for Anthropic API compatibility
471
+ ANTHROPIC_AVAILABLE = False
472
+
473
+ try:
474
+ from anthropic.types import ContentBlock, Usage
475
+
476
+ ANTHROPIC_AVAILABLE = True
477
+ except ImportError:
478
+ ContentBlock = None
479
+ Usage = None
480
+
481
+ # Use TYPE_CHECKING to avoid runtime issues with mypy
482
+ from typing import TYPE_CHECKING
483
+
484
+ if TYPE_CHECKING:
485
+ # For type checking, define the types as if Anthropic is available
486
+ from anthropic.types import ContentBlock as ContentBlock_
487
+ from anthropic.types import Usage as Usage_
488
+
489
+ class AnthropicMessage(TypedDict):
490
+ id: str
491
+ type: str
492
+ role: str
493
+ content: List[ContentBlock_]
494
+ model: str
495
+ stop_reason: str
496
+ stop_sequence: str
497
+ usage: Usage_
498
+ container: Dict[str, Any]
499
+
500
+ class MessageCreateParams(TypedDict):
501
+ model: str
502
+ messages: List[Dict[str, Any]]
503
+ max_tokens: int
504
+ stream: NotRequired[bool]
505
+ temperature: NotRequired[float]
506
+ top_p: NotRequired[float]
507
+ top_k: NotRequired[int]
508
+ stop_sequences: NotRequired[List[str]]
509
+ metadata: NotRequired[Dict[str, Any]]
510
+ tools: NotRequired[List[Dict[str, Any]]]
511
+ tool_choice: NotRequired[Union[str, Dict[str, Any]]]
512
+
513
+ CreateMessageAnthropic: BaseModel
514
+
515
+ class CreateMessage(
516
+ ModelAndMessages,
517
+ ):
518
+ pass
519
+
520
+ else:
521
+ # Runtime definitions
522
+ if ANTHROPIC_AVAILABLE:
523
+
524
+ class AnthropicMessage(TypedDict):
525
+ id: str
526
+ type: str
527
+ role: str
528
+ content: List[ContentBlock]
529
+ model: str
530
+ stop_reason: str
531
+ stop_sequence: str
532
+ usage: Usage
533
+ container: Dict[str, Any]
534
+
535
+ class MessageCreateParams(TypedDict):
536
+ model: str
537
+ messages: List[Dict[str, Any]]
538
+ max_tokens: int
539
+ stream: NotRequired[bool]
540
+ temperature: NotRequired[float]
541
+ top_p: NotRequired[float]
542
+ top_k: NotRequired[int]
543
+ stop_sequences: NotRequired[List[str]]
544
+ metadata: NotRequired[Dict[str, Any]]
545
+ tools: NotRequired[List[Dict[str, Any]]]
546
+ tool_choice: NotRequired[Union[str, Dict[str, Any]]]
547
+
548
+ CreateMessageAnthropic: BaseModel = create_model_from_typeddict(
549
+ MessageCreateParams,
550
+ )
551
+ CreateMessageAnthropic = fix_forward_ref(CreateMessageAnthropic)
552
+
553
+ class CreateMessage(CreateMessageAnthropic):
554
+ pass
555
+
556
+ else:
557
+ # Define dummy types when Anthropic is not available
558
+ class AnthropicMessage:
559
+ pass
560
+
561
+ class MessageCreateParams:
562
+ pass
563
+
564
+ CreateMessageAnthropic = None
565
+
566
+ class CreateMessage:
567
+ pass
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: xinference
3
- Version: 1.9.1
3
+ Version: 1.10.0
4
4
  Summary: Model Serving Made Easy
5
5
  Home-page: https://github.com/xorbitsai/inference
6
6
  Author: Qin Xuye
@@ -61,12 +61,14 @@ Requires-Dist: jieba>=0.42.0; extra == "dev"
61
61
  Requires-Dist: flake8>=3.8.0; extra == "dev"
62
62
  Requires-Dist: black; extra == "dev"
63
63
  Requires-Dist: openai>=1.40.0; extra == "dev"
64
+ Requires-Dist: anthropic; extra == "dev"
64
65
  Requires-Dist: langchain; extra == "dev"
65
66
  Requires-Dist: langchain-community; extra == "dev"
66
67
  Requires-Dist: orjson; extra == "dev"
67
68
  Requires-Dist: sphinx-tabs; extra == "dev"
68
69
  Requires-Dist: sphinx-design; extra == "dev"
69
70
  Provides-Extra: all
71
+ Requires-Dist: anthropic; extra == "all"
70
72
  Requires-Dist: uv; extra == "all"
71
73
  Requires-Dist: xllamacpp>=0.2.0; extra == "all"
72
74
  Requires-Dist: transformers>=4.46.0; extra == "all"
@@ -115,7 +117,7 @@ Requires-Dist: torchvision; extra == "all"
115
117
  Requires-Dist: gguf; extra == "all"
116
118
  Requires-Dist: diffusers>=0.32.0; extra == "all"
117
119
  Requires-Dist: imageio-ffmpeg; extra == "all"
118
- Requires-Dist: funasr<1.1.17; extra == "all"
120
+ Requires-Dist: funasr==1.2.7; extra == "all"
119
121
  Requires-Dist: omegaconf~=2.3.0; extra == "all"
120
122
  Requires-Dist: nemo_text_processing<1.1.0; sys_platform == "linux" and extra == "all"
121
123
  Requires-Dist: WeTextProcessing<1.0.4; sys_platform == "linux" and extra == "all"
@@ -230,7 +232,7 @@ Provides-Extra: video
230
232
  Requires-Dist: diffusers>=0.32.0; extra == "video"
231
233
  Requires-Dist: imageio-ffmpeg; extra == "video"
232
234
  Provides-Extra: audio
233
- Requires-Dist: funasr<1.1.17; extra == "audio"
235
+ Requires-Dist: funasr==1.2.7; extra == "audio"
234
236
  Requires-Dist: omegaconf~=2.3.0; extra == "audio"
235
237
  Requires-Dist: nemo_text_processing<1.1.0; sys_platform == "linux" and extra == "audio"
236
238
  Requires-Dist: WeTextProcessing<1.0.4; sys_platform == "linux" and extra == "audio"
@@ -292,6 +294,8 @@ Provides-Extra: benchmark
292
294
  Requires-Dist: psutil; extra == "benchmark"
293
295
  Provides-Extra: virtualenv
294
296
  Requires-Dist: uv; extra == "virtualenv"
297
+ Provides-Extra: anthropic
298
+ Requires-Dist: anthropic; extra == "anthropic"
295
299
  Dynamic: description
296
300
  Dynamic: description-content-type
297
301
  Dynamic: license-file
@@ -1,15 +1,15 @@
1
1
  xinference/__init__.py,sha256=nmTTrYbIpj964ZF6ojtgOM7E85JBOj1EyQbmYjbj1jw,915
2
2
  xinference/_compat.py,sha256=YF-lS6tX06zkFi2oFS0yq_LBn4hX_8u0Ft0vKxGALwA,4238
3
- xinference/_version.py,sha256=6_x_pxOSXblLpDA4uTiOqGAId7aIL16mW_MYzD04Vms,497
3
+ xinference/_version.py,sha256=_EWji1MNqQ79G4kHRFbbD_UdNhdfHKrUEJFT8lnM8fs,498
4
4
  xinference/conftest.py,sha256=vETDpRBVIlWbWi7OTwf7og89U25KyYGyI7yPIB3O8N8,9564
5
- xinference/constants.py,sha256=HiQr-_L39O4_GNPQbbUGwi5YYSJN_vI9WVSvJhZMmDU,5000
5
+ xinference/constants.py,sha256=643I-3Hd-3BU6DRCMrohsW5HYp990WjYi1cbFwAxCL8,5117
6
6
  xinference/device_utils.py,sha256=vt3GpNNfEfuJzXPb49bUnADyM2r4SqgG03ODiJO86sA,4953
7
7
  xinference/fields.py,sha256=FaL9-jXDkn6kwupCmo-F6hh2JvMPJJzRWSUB1NKuhKc,5352
8
8
  xinference/isolation.py,sha256=gTU1em5fxg1m-7hxieWBMZvVkXZX4GZYmeT7XxXsYrU,2699
9
- xinference/types.py,sha256=uRCkC6yHyYWe5mgLpwyGuAeDnkCZa9ScGvWE8WiRGjI,11789
9
+ xinference/types.py,sha256=JvYmp3k693GhubCwz4nOeLTYMKi0eANjR8e6MwcHSl0,14617
10
10
  xinference/utils.py,sha256=xMuOg3LZhTUf7inEhm-HmXCIoly0pHaWtMKMnnf8XGk,2273
11
11
  xinference/api/__init__.py,sha256=h_JgzSqV5lP6vQ6XX_17kE4IY4BRnvKta_7VLQAL1ms,581
12
- xinference/api/restful_api.py,sha256=ws77VtNtxzWbeogTH2mmNHaeFmMqqnnS41afjahmyL8,102642
12
+ xinference/api/restful_api.py,sha256=I0aZwL6lKNxZDpApiFbxHVOoo24hdj3OswTC7UmsYMk,119876
13
13
  xinference/api/oauth2/__init__.py,sha256=h_JgzSqV5lP6vQ6XX_17kE4IY4BRnvKta_7VLQAL1ms,581
14
14
  xinference/api/oauth2/auth_service.py,sha256=74JzB42fbbmBu4Q1dW3A9Fp_N7167KgRGB42Z0NHjAM,6119
15
15
  xinference/api/oauth2/types.py,sha256=K923sv_XySIUtM2Eozl9IG082IJcDOS5SFLrPZ5ELBg,996
@@ -28,7 +28,7 @@ xinference/core/model.py,sha256=9go5zbuDZ7MvUvymdp4cgX65K1LgxUw-xggZ04eBSfc,3966
28
28
  xinference/core/progress_tracker.py,sha256=CNCc1ZVscvp-JJznPTYJDPuis7ya6ZothZUIalDcxDo,6798
29
29
  xinference/core/resource.py,sha256=aTV89dmuKxw5JnwQglRkA2Wxu1EBLM5WjmLxITSXYgs,1808
30
30
  xinference/core/status_guard.py,sha256=VLhyqpobdclfyzcROqf4bmGDiKpuHllto316X3Z6Hrc,2860
31
- xinference/core/supervisor.py,sha256=CjZJQBZQ4P3M5BDdt6Fnwr6HqbBwnfrDpsrSOrdfz6U,74442
31
+ xinference/core/supervisor.py,sha256=Gxo1jFtqDc-yuU5Zg3uaXL3NmADlrAIDy_l2DyUDu48,75814
32
32
  xinference/core/utils.py,sha256=VgcvxpTr2Q8am3MoHp7JPjC7jLYlKX2kLVdBo2Q_fRo,10430
33
33
  xinference/core/worker.py,sha256=_t2T7xd_47-y4A2i62uZkV4pDpYJebVFqE8eu_PrcLQ,62252
34
34
  xinference/deploy/__init__.py,sha256=h_JgzSqV5lP6vQ6XX_17kE4IY4BRnvKta_7VLQAL1ms,581
@@ -46,18 +46,19 @@ xinference/model/custom.py,sha256=byW3aBEUAaWPS9jAyEoabZ0ktRGJixSyyuDb6Dp-OOo,65
46
46
  xinference/model/utils.py,sha256=pH6yhCJnDoakJMcWXgQ8jL9_59OVJEx90q1Oox-hXyE,20630
47
47
  xinference/model/audio/__init__.py,sha256=RPf_feWYEh_BfMmwRkehIOBK5vUx6AadMHXp1d6EAk4,3473
48
48
  xinference/model/audio/chattts.py,sha256=LmwD-X1XFKhVwA5ruqEQJ7VOiHIVwMuJrL7cH82poNE,4154
49
- xinference/model/audio/core.py,sha256=oCy_a216F8iR_76ckMp7PFwMmE002iSRqemy52Gg864,6574
49
+ xinference/model/audio/core.py,sha256=OBXE7S9HwAP_u7jhE_C8oixW5ZsdH21d-zHpXnGp9Ko,6777
50
50
  xinference/model/audio/cosyvoice.py,sha256=opy0EK6ePS966Jy2CjjR1jEB30a4pKbYJbXnqC7jPQ4,7221
51
51
  xinference/model/audio/custom.py,sha256=UqiXQ1N9kDfcNOCxUmYnmS_kHOIVrrJvJrpUitAydCw,3107
52
52
  xinference/model/audio/f5tts.py,sha256=if2IxLKurIfIbLzSmeOtqFG3xoVEQ_Ax_GK7eYCVl28,6848
53
53
  xinference/model/audio/f5tts_mlx.py,sha256=RXtP5MPm8ewMt4mPbpu93QmEPAWecM_dC_aHCz0_uzY,8566
54
54
  xinference/model/audio/fish_speech.py,sha256=ljufZldrChWzC6hZj2j222DKqz9HP4aZ8f4XjgzRgEo,6113
55
55
  xinference/model/audio/funasr.py,sha256=L-seUq_y-rwC3sadyrYb7VUOF82AUizpdpHYYt8f9Z8,6231
56
- xinference/model/audio/kokoro.py,sha256=lt9S6edUjkMo2whO2xzYOhRH2Z-ZXCWVtwfGHq_iFWo,3768
56
+ xinference/model/audio/kokoro.py,sha256=IF5EEh7-jW3vgeItBCV_nbzf6uBqehX9OrZjfyiuOcI,3785
57
57
  xinference/model/audio/kokoro_mlx.py,sha256=9ZkJsz4wvFpVmpMTi8BEn10ICx7lev5ezpoBPLvSQTk,3475
58
+ xinference/model/audio/kokoro_zh.py,sha256=g1zDsOTLWCcgGBkZrDFnJ6E8vPFQMscCs-zi5MigMok,3951
58
59
  xinference/model/audio/megatts.py,sha256=K2n-EfJHbyv3qC0tlnhm68Q2zZDVkgHAlQpHrf3s2pU,3408
59
60
  xinference/model/audio/melotts.py,sha256=n3jKYKeoXwHlQrocSUdS_Wry6ATVXKwZyXrJpePvJU4,3532
60
- xinference/model/audio/model_spec.json,sha256=dNz-S4w_VcXm8T8BadEFi7KaymzlhwbNave0Z4iwX7c,21882
61
+ xinference/model/audio/model_spec.json,sha256=EEHS0GKs5cOqyBt7ehM5-nP9tr22Sh-j-9WZpdILNr8,22387
61
62
  xinference/model/audio/utils.py,sha256=DveA9EW3hZAlaYcGZ00AewacC631bcynwjH9fcfvPJc,4261
62
63
  xinference/model/audio/whisper.py,sha256=kgzZOGzGDC8odM_syKY0eEP7f1BvMSxOP2quZsFoBVM,9097
63
64
  xinference/model/audio/whisper_mlx.py,sha256=DIOTrBh-LVT_dzySjV7ax-J5lgTXg0-Cqvbq9ctHD7o,7276
@@ -72,9 +73,9 @@ xinference/model/embedding/flag/core.py,sha256=n84TMXGWZT8TOIbo7DDllDmKWL6qPblPg
72
73
  xinference/model/embedding/llama_cpp/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
73
74
  xinference/model/embedding/llama_cpp/core.py,sha256=Hipbs9mFM2iyev2oqf5bQnREYZbbzmp3J7OndQDGz3E,9084
74
75
  xinference/model/embedding/sentence_transformers/__init__.py,sha256=CyLLkbImZouAk4lePIgKXT4WQoqyauIEwdqea5IOUVU,581
75
- xinference/model/embedding/sentence_transformers/core.py,sha256=GSy--In3Fetsb7Nrdi-qwht0h0lch5sX84GOq5IPkq4,18078
76
+ xinference/model/embedding/sentence_transformers/core.py,sha256=huBp54uAWT5VKhAgpF0LK5h5LGZyCijlJ-IgqlKiEMk,18139
76
77
  xinference/model/embedding/vllm/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
77
- xinference/model/embedding/vllm/core.py,sha256=HDGG4FWOAVwKNy7IiHqfA7-R4dtmTTyfwyAv5BArCec,6601
78
+ xinference/model/embedding/vllm/core.py,sha256=tcS2Gc93Fv6NWmbMF9JjuKRDQVkpcoowJVSRaAZLECA,6890
78
79
  xinference/model/flexible/__init__.py,sha256=ASs6q89T6X5oTj1uAYmahpRNnUVntC5d5HEuox1U3xw,1887
79
80
  xinference/model/flexible/core.py,sha256=DCCnZ3oaZJVFxOVZilBI26yC9rNM7B6te87vbOk_U8o,4031
80
81
  xinference/model/flexible/custom.py,sha256=EhZ2voduhM-_M3S4R0SwsuKFzS6FUXyNxS3RkqnQZjQ,2216
@@ -88,7 +89,7 @@ xinference/model/image/__init__.py,sha256=X43XSNSbQrVlU82jgKxrX965o6uGO-GPMvLvyb
88
89
  xinference/model/image/cache_manager.py,sha256=Ccc0SRWdq8qiLhrRwh4LYZLiHZ6ywQTEz6VdyFHnE2Y,4700
89
90
  xinference/model/image/core.py,sha256=0JD_91jl1Q0yxu3_H7S2dQjR3eHKfM6a6jjzp1LQZME,9515
90
91
  xinference/model/image/custom.py,sha256=THn9AZUdPtV0BmMO1tUTpMEXBQkzfle8p5685ZYcqek,1969
91
- xinference/model/image/model_spec.json,sha256=3M61MIokz9Qbtof74wwx9-lff1Gae9rViF2ZL23HUCE,22348
92
+ xinference/model/image/model_spec.json,sha256=mjVd_bE3IIP41VpxeYrUx2fdv375dLvNMNHjzuBYabc,22312
92
93
  xinference/model/image/sdapi.py,sha256=Xgdtnvw4Xwj1Nc0cBoDo_ogH6E2mFJqLvX0jSxxgdnA,5936
93
94
  xinference/model/image/utils.py,sha256=wXqZRHqn11qERJKfYkK4nDSNanjNXsg1xaG2nVAs01Y,2344
94
95
  xinference/model/image/ocr/__init__.py,sha256=h_JgzSqV5lP6vQ6XX_17kE4IY4BRnvKta_7VLQAL1ms,581
@@ -100,20 +101,20 @@ xinference/model/image/stable_diffusion/core.py,sha256=gr39tURTzw5OvrhcygI5YnrXL
100
101
  xinference/model/image/stable_diffusion/mlx.py,sha256=caWbXNAvGIbg6FvG1M6BFFXzsPUltI2Fhhu-lpMPirY,7487
101
102
  xinference/model/llm/__init__.py,sha256=cZ5ckp_dye6ftr5iC_f31rTkKbE3AWEZOCbD0hzy39k,8842
102
103
  xinference/model/llm/cache_manager.py,sha256=7Ult1h8JCcwd05g95Kwm3j7qIaaK3phyW9LQNAzrHmY,11253
103
- xinference/model/llm/core.py,sha256=c9vveVxSZhyd8H6zXJSrZgET98V8-D-xDtBNl2x_j3U,8852
104
+ xinference/model/llm/core.py,sha256=-gjkSXcytd3W2u-dDiJrQujAKJZXWPf3XGeCyVqYYCc,9221
104
105
  xinference/model/llm/custom.py,sha256=uRJGWICXvaAKKnVYM7gyWO9e_x6jzz9dWZWH92UWpAE,2761
105
106
  xinference/model/llm/harmony.py,sha256=E1KqpFn2lz9uxegbpnrYqQAL1Gx8BfBVB8gyiblWccg,9900
106
- xinference/model/llm/llm_family.json,sha256=SPSEgM8gePf_N5hTt9Yq84rn3GhirMgWWywUTWl5sFc,773987
107
- xinference/model/llm/llm_family.py,sha256=tAvZTQXEoI_TDGBrxXy65UHgWWznB2yu4Ihbrh4PS6I,21350
107
+ xinference/model/llm/llm_family.json,sha256=0UMONTTP2Q9tkwmRlXTxKkxM30NI2hAmJjh3_X-gsKo,774530
108
+ xinference/model/llm/llm_family.py,sha256=H92Mtq8NJavwenI3BPyTHVHLrlgfUXcy2LGN1OCA7pE,21381
108
109
  xinference/model/llm/memory.py,sha256=y8fBjIGd6zIPkgIxGtjakD7GPLW3VoM4m6x1UBM6IKs,10144
109
110
  xinference/model/llm/reasoning_parser.py,sha256=sk5KuteBMGK0A0-ooq3nB9scP1SS8WxWS_b5OYiDD68,17449
110
- xinference/model/llm/utils.py,sha256=cLGu7lw-kpmStBL5ZLGafvEnvzueYY4shDZgcgbM2ns,38915
111
+ xinference/model/llm/utils.py,sha256=j_zRlHoXCpEtOUGExVyuXcW3y6Edmgdz2HaQVFCnbLs,42019
111
112
  xinference/model/llm/llama_cpp/__init__.py,sha256=h_JgzSqV5lP6vQ6XX_17kE4IY4BRnvKta_7VLQAL1ms,581
112
- xinference/model/llm/llama_cpp/core.py,sha256=nPE2tsvX2vKNaFwe2SQvJTvJ8rYf9pIc8i4fMJAZuHQ,14031
113
+ xinference/model/llm/llama_cpp/core.py,sha256=-KfD1TUfMhfHCn6jvoLihgTXBszkkMHoVd1nf4w3oPU,14071
113
114
  xinference/model/llm/lmdeploy/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
114
115
  xinference/model/llm/lmdeploy/core.py,sha256=DAUHO1AxPA10C7zovxXQe8Qr8yPF1PqyHKAUkrFbI_k,19895
115
116
  xinference/model/llm/mlx/__init__.py,sha256=h_JgzSqV5lP6vQ6XX_17kE4IY4BRnvKta_7VLQAL1ms,581
116
- xinference/model/llm/mlx/core.py,sha256=qyxlqDYvXKoP5tsjJKzV5GdV_5jpxb9uJT6Y7YHeZ0o,34852
117
+ xinference/model/llm/mlx/core.py,sha256=5nxHxEFI2x6DVDWUln3HBoxf4NfeLN2P3rhV9zKwOMU,35482
117
118
  xinference/model/llm/mlx/distributed_models/__init__.py,sha256=h_JgzSqV5lP6vQ6XX_17kE4IY4BRnvKta_7VLQAL1ms,581
118
119
  xinference/model/llm/mlx/distributed_models/core.py,sha256=0pYu9SiBwVxTJ04yf_lDzRvjBrbdDQfWobWzJA89HLo,5744
119
120
  xinference/model/llm/mlx/distributed_models/deepseek_v3.py,sha256=oH6Yv7rzEL644gnA_rqBgU4hICpppUTaaQtwiODwfig,2441
@@ -121,10 +122,17 @@ xinference/model/llm/mlx/distributed_models/qwen2.py,sha256=B7YifMQqDujnrxCnjJZb
121
122
  xinference/model/llm/mlx/distributed_models/qwen3.py,sha256=mconllhlTKOY96UP6Y9G3kBppSbP5kYCcziDeBEdtVY,2586
122
123
  xinference/model/llm/mlx/distributed_models/qwen3_moe.py,sha256=_d__HWDYfL1wAUAa-0xWiszLC6AYkGLQ5eTVtsi5Pc4,2380
123
124
  xinference/model/llm/sglang/__init__.py,sha256=-sjSIQ4K6w-TEzx49kVaWeWC443fnZqODU91GCQ_JNo,581
124
- xinference/model/llm/sglang/core.py,sha256=ulyJ-PNJHzCa_tyPr5paVoG39KnNryuswNNlrFRu3MU,31241
125
+ xinference/model/llm/sglang/core.py,sha256=t5SoPiKxnRu4BJCaPc0H62S0-HiUnUvJYU3TuOjfeyU,29462
126
+ xinference/model/llm/tool_parsers/__init__.py,sha256=FqS5V2v-HpBy5J9IWaw7ZfZ5_fzAtYeVG0WN-bmL98o,1778
127
+ xinference/model/llm/tool_parsers/abstract_tool_parser.py,sha256=7D2ihK7Ny9LNmHcezcEKYNwe8GIZJHydFZlWDg4xXpE,1312
128
+ xinference/model/llm/tool_parsers/deepseek_r1_tool_parser.py,sha256=anjzpOlEeeFaqm0fRmpvXx585_kyqb-SgdCZhfRjTwM,4942
129
+ xinference/model/llm/tool_parsers/deepseek_v3_tool_parser.py,sha256=T1CPzomvTj8HoGBCHTYm2FqFqd62WNxMqTjhST0b1pk,5146
130
+ xinference/model/llm/tool_parsers/glm4_tool_parser.py,sha256=YBittOVGwQOPYtXHDWdxpO2vGUg5XapYdcfWPH1Kseg,4313
131
+ xinference/model/llm/tool_parsers/llama3_tool_parser.py,sha256=vBD39Ub2ha0CXRCOtGu97i8eNyZ_2cDShT3yqxK8W5o,2787
132
+ xinference/model/llm/tool_parsers/qwen_tool_parser.py,sha256=y6UxvJ70RbvmcyUDgZGkQwn_uTyz-grjlNS1D-_Nv8E,11746
125
133
  xinference/model/llm/transformers/__init__.py,sha256=_4hQ7BvHNE4WAyzNcTB0_iY5mBcaPGTkLvQcWiylBoI,1724
126
134
  xinference/model/llm/transformers/chatglm.py,sha256=ovDSYZet7bdqloO_WXaH9a6Rv6FyQ_BrY5dkejqvyBc,22953
127
- xinference/model/llm/transformers/core.py,sha256=ZbcpGLr2oWGi7B2aXYg1uKTEjAbuO1-NYkCIMNmMpHw,40085
135
+ xinference/model/llm/transformers/core.py,sha256=tV48CxsTVqMfLbqfJgBuGubQe3gzlJMfKWQOZxMJUAs,40086
128
136
  xinference/model/llm/transformers/deepseek_v2.py,sha256=4LB_grDfdaXBCdTwduqpWFrYoeKsMnBERWTxcNl7EfA,2624
129
137
  xinference/model/llm/transformers/gemma3.py,sha256=oH5SwLM7aX-8zMPO7918x2BKDZGJgeFdZ5FduHiDDQI,5490
130
138
  xinference/model/llm/transformers/gpt_oss.py,sha256=uPO0WsDlxxd9KY3mlldyZyQIcogPk-rDxL-LHbIgSuc,3386
@@ -145,7 +153,7 @@ xinference/model/llm/transformers/multimodal/qwen-omni.py,sha256=tEZZAsnQssinF4s
145
153
  xinference/model/llm/transformers/multimodal/qwen2_audio.py,sha256=wFzyTyNvSfTKA4opMeYHT4m4SpmAbcUfvkc16Bf4FRA,4680
146
154
  xinference/model/llm/transformers/multimodal/qwen2_vl.py,sha256=b_gm_g2-seFpTB68-G3n_k2JKQqBxZa8KOg2STJPB7U,8594
147
155
  xinference/model/llm/vllm/__init__.py,sha256=h_JgzSqV5lP6vQ6XX_17kE4IY4BRnvKta_7VLQAL1ms,581
148
- xinference/model/llm/vllm/core.py,sha256=ol8vFPL85lOOc1u-_UzDxspnwI8bJKgnHi2aro2rCH4,61618
156
+ xinference/model/llm/vllm/core.py,sha256=9Wo_EiAeMIsmf9FbRl8X0zKjWqSvur5ddlJBwLBtZNE,59152
149
157
  xinference/model/llm/vllm/distributed_executor.py,sha256=8bFU4JSgvbBTrhGZhsANfMUX4DR6es1zw-cljVLkTBw,14125
150
158
  xinference/model/llm/vllm/utils.py,sha256=LKOmwfFRrlSecawxT-uE39tC2RQbf1UIiSH9Uz90X6w,1313
151
159
  xinference/model/llm/vllm/xavier/__init__.py,sha256=CyLLkbImZouAk4lePIgKXT4WQoqyauIEwdqea5IOUVU,581
@@ -15804,9 +15812,9 @@ xinference/ui/web/ui/src/locales/en.json,sha256=2K1xlg0dY0Xw208qW0bdJlE7XL2dbouC
15804
15812
  xinference/ui/web/ui/src/locales/ja.json,sha256=EZmLCN1smdXmvR-tqFLIgelrIFRKGr6zf7x519DUpuA,11952
15805
15813
  xinference/ui/web/ui/src/locales/ko.json,sha256=pEVoh1jyaqliaNTLOt2d4wDkeVQGQB_pGMjNllNERA8,10805
15806
15814
  xinference/ui/web/ui/src/locales/zh.json,sha256=IY_eaPEE870ggqOMr_p9gjAu8IIoF6-3w_SlAyn-EGY,9859
15807
- xinference-1.9.1.dist-info/licenses/LICENSE,sha256=QwcOLU5TJoTeUhuIXzhdCEEDDvorGiC6-3YTOl4TecE,11356
15808
- xinference-1.9.1.dist-info/METADATA,sha256=Yy6mCfl2cYQ68m4X0iWDwEVJdR8YSdeXx719Nv5Flsw,26412
15809
- xinference-1.9.1.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
15810
- xinference-1.9.1.dist-info/entry_points.txt,sha256=-lDyyzqWMFQF0Rgm7VxBNz0V-bMBMQLRR3pvQ-Y8XTY,226
15811
- xinference-1.9.1.dist-info/top_level.txt,sha256=L1rQt7pl6m8tmKXpWVHzP-GtmzAxp663rXxGE7qnK00,11
15812
- xinference-1.9.1.dist-info/RECORD,,
15815
+ xinference-1.10.0.dist-info/licenses/LICENSE,sha256=QwcOLU5TJoTeUhuIXzhdCEEDDvorGiC6-3YTOl4TecE,11356
15816
+ xinference-1.10.0.dist-info/METADATA,sha256=VtKqtNrNEAlR4Wn_mmPax6ntXIw2vOtxcA8pPfIlIlU,26568
15817
+ xinference-1.10.0.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
15818
+ xinference-1.10.0.dist-info/entry_points.txt,sha256=-lDyyzqWMFQF0Rgm7VxBNz0V-bMBMQLRR3pvQ-Y8XTY,226
15819
+ xinference-1.10.0.dist-info/top_level.txt,sha256=L1rQt7pl6m8tmKXpWVHzP-GtmzAxp663rXxGE7qnK00,11
15820
+ xinference-1.10.0.dist-info/RECORD,,