xinference 1.9.1__py3-none-any.whl → 1.10.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of xinference might be problematic. Click here for more details.
- xinference/_version.py +3 -3
- xinference/api/restful_api.py +415 -1
- xinference/constants.py +2 -0
- xinference/core/supervisor.py +29 -1
- xinference/model/audio/core.py +5 -0
- xinference/model/audio/kokoro.py +1 -1
- xinference/model/audio/kokoro_zh.py +124 -0
- xinference/model/audio/model_spec.json +20 -0
- xinference/model/embedding/sentence_transformers/core.py +4 -4
- xinference/model/embedding/vllm/core.py +7 -1
- xinference/model/image/model_spec.json +2 -3
- xinference/model/llm/core.py +10 -0
- xinference/model/llm/llama_cpp/core.py +1 -0
- xinference/model/llm/llm_family.json +40 -20
- xinference/model/llm/llm_family.py +1 -0
- xinference/model/llm/mlx/core.py +52 -33
- xinference/model/llm/sglang/core.py +2 -44
- xinference/model/llm/tool_parsers/__init__.py +58 -0
- xinference/model/llm/tool_parsers/abstract_tool_parser.py +33 -0
- xinference/model/llm/tool_parsers/deepseek_r1_tool_parser.py +128 -0
- xinference/model/llm/tool_parsers/deepseek_v3_tool_parser.py +145 -0
- xinference/model/llm/tool_parsers/glm4_tool_parser.py +123 -0
- xinference/model/llm/tool_parsers/llama3_tool_parser.py +77 -0
- xinference/model/llm/tool_parsers/qwen_tool_parser.py +320 -0
- xinference/model/llm/transformers/core.py +1 -1
- xinference/model/llm/utils.py +127 -45
- xinference/model/llm/vllm/core.py +2 -61
- xinference/types.py +105 -2
- {xinference-1.9.1.dist-info → xinference-1.10.0.dist-info}/METADATA +7 -3
- {xinference-1.9.1.dist-info → xinference-1.10.0.dist-info}/RECORD +34 -26
- {xinference-1.9.1.dist-info → xinference-1.10.0.dist-info}/WHEEL +0 -0
- {xinference-1.9.1.dist-info → xinference-1.10.0.dist-info}/entry_points.txt +0 -0
- {xinference-1.9.1.dist-info → xinference-1.10.0.dist-info}/licenses/LICENSE +0 -0
- {xinference-1.9.1.dist-info → xinference-1.10.0.dist-info}/top_level.txt +0 -0
xinference/types.py
CHANGED
|
@@ -351,6 +351,11 @@ class ModelAndPrompt(BaseModel):
|
|
|
351
351
|
prompt: str
|
|
352
352
|
|
|
353
353
|
|
|
354
|
+
class ModelAndMessages(BaseModel):
|
|
355
|
+
model: str
|
|
356
|
+
messages: List[Dict[str, Any]]
|
|
357
|
+
|
|
358
|
+
|
|
354
359
|
class CreateCompletionTorch(BaseModel):
|
|
355
360
|
echo: bool = echo_field
|
|
356
361
|
max_tokens: Optional[int] = max_tokens_field
|
|
@@ -371,7 +376,6 @@ class CreateCompletionTorch(BaseModel):
|
|
|
371
376
|
# This type is for openai API compatibility
|
|
372
377
|
CreateCompletionOpenAI: BaseModel
|
|
373
378
|
|
|
374
|
-
|
|
375
379
|
from openai.types.completion_create_params import CompletionCreateParamsNonStreaming
|
|
376
380
|
|
|
377
381
|
CreateCompletionOpenAI = create_model_from_typeddict(
|
|
@@ -395,7 +399,6 @@ class CreateChatModel(BaseModel):
|
|
|
395
399
|
# Currently, chat calls generates, so the params share the same one.
|
|
396
400
|
CreateChatCompletionTorch = CreateCompletionTorch
|
|
397
401
|
|
|
398
|
-
|
|
399
402
|
from ._compat import CreateChatCompletionOpenAI
|
|
400
403
|
|
|
401
404
|
|
|
@@ -462,3 +465,103 @@ class PeftModelConfig:
|
|
|
462
465
|
image_lora_load_kwargs=data.get("image_lora_load_kwargs"),
|
|
463
466
|
image_lora_fuse_kwargs=data.get("image_lora_fuse_kwargs"),
|
|
464
467
|
)
|
|
468
|
+
|
|
469
|
+
|
|
470
|
+
# This type is for Anthropic API compatibility
|
|
471
|
+
ANTHROPIC_AVAILABLE = False
|
|
472
|
+
|
|
473
|
+
try:
|
|
474
|
+
from anthropic.types import ContentBlock, Usage
|
|
475
|
+
|
|
476
|
+
ANTHROPIC_AVAILABLE = True
|
|
477
|
+
except ImportError:
|
|
478
|
+
ContentBlock = None
|
|
479
|
+
Usage = None
|
|
480
|
+
|
|
481
|
+
# Use TYPE_CHECKING to avoid runtime issues with mypy
|
|
482
|
+
from typing import TYPE_CHECKING
|
|
483
|
+
|
|
484
|
+
if TYPE_CHECKING:
|
|
485
|
+
# For type checking, define the types as if Anthropic is available
|
|
486
|
+
from anthropic.types import ContentBlock as ContentBlock_
|
|
487
|
+
from anthropic.types import Usage as Usage_
|
|
488
|
+
|
|
489
|
+
class AnthropicMessage(TypedDict):
|
|
490
|
+
id: str
|
|
491
|
+
type: str
|
|
492
|
+
role: str
|
|
493
|
+
content: List[ContentBlock_]
|
|
494
|
+
model: str
|
|
495
|
+
stop_reason: str
|
|
496
|
+
stop_sequence: str
|
|
497
|
+
usage: Usage_
|
|
498
|
+
container: Dict[str, Any]
|
|
499
|
+
|
|
500
|
+
class MessageCreateParams(TypedDict):
|
|
501
|
+
model: str
|
|
502
|
+
messages: List[Dict[str, Any]]
|
|
503
|
+
max_tokens: int
|
|
504
|
+
stream: NotRequired[bool]
|
|
505
|
+
temperature: NotRequired[float]
|
|
506
|
+
top_p: NotRequired[float]
|
|
507
|
+
top_k: NotRequired[int]
|
|
508
|
+
stop_sequences: NotRequired[List[str]]
|
|
509
|
+
metadata: NotRequired[Dict[str, Any]]
|
|
510
|
+
tools: NotRequired[List[Dict[str, Any]]]
|
|
511
|
+
tool_choice: NotRequired[Union[str, Dict[str, Any]]]
|
|
512
|
+
|
|
513
|
+
CreateMessageAnthropic: BaseModel
|
|
514
|
+
|
|
515
|
+
class CreateMessage(
|
|
516
|
+
ModelAndMessages,
|
|
517
|
+
):
|
|
518
|
+
pass
|
|
519
|
+
|
|
520
|
+
else:
|
|
521
|
+
# Runtime definitions
|
|
522
|
+
if ANTHROPIC_AVAILABLE:
|
|
523
|
+
|
|
524
|
+
class AnthropicMessage(TypedDict):
|
|
525
|
+
id: str
|
|
526
|
+
type: str
|
|
527
|
+
role: str
|
|
528
|
+
content: List[ContentBlock]
|
|
529
|
+
model: str
|
|
530
|
+
stop_reason: str
|
|
531
|
+
stop_sequence: str
|
|
532
|
+
usage: Usage
|
|
533
|
+
container: Dict[str, Any]
|
|
534
|
+
|
|
535
|
+
class MessageCreateParams(TypedDict):
|
|
536
|
+
model: str
|
|
537
|
+
messages: List[Dict[str, Any]]
|
|
538
|
+
max_tokens: int
|
|
539
|
+
stream: NotRequired[bool]
|
|
540
|
+
temperature: NotRequired[float]
|
|
541
|
+
top_p: NotRequired[float]
|
|
542
|
+
top_k: NotRequired[int]
|
|
543
|
+
stop_sequences: NotRequired[List[str]]
|
|
544
|
+
metadata: NotRequired[Dict[str, Any]]
|
|
545
|
+
tools: NotRequired[List[Dict[str, Any]]]
|
|
546
|
+
tool_choice: NotRequired[Union[str, Dict[str, Any]]]
|
|
547
|
+
|
|
548
|
+
CreateMessageAnthropic: BaseModel = create_model_from_typeddict(
|
|
549
|
+
MessageCreateParams,
|
|
550
|
+
)
|
|
551
|
+
CreateMessageAnthropic = fix_forward_ref(CreateMessageAnthropic)
|
|
552
|
+
|
|
553
|
+
class CreateMessage(CreateMessageAnthropic):
|
|
554
|
+
pass
|
|
555
|
+
|
|
556
|
+
else:
|
|
557
|
+
# Define dummy types when Anthropic is not available
|
|
558
|
+
class AnthropicMessage:
|
|
559
|
+
pass
|
|
560
|
+
|
|
561
|
+
class MessageCreateParams:
|
|
562
|
+
pass
|
|
563
|
+
|
|
564
|
+
CreateMessageAnthropic = None
|
|
565
|
+
|
|
566
|
+
class CreateMessage:
|
|
567
|
+
pass
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: xinference
|
|
3
|
-
Version: 1.9.1
|
|
3
|
+
Version: 1.10.0
|
|
4
4
|
Summary: Model Serving Made Easy
|
|
5
5
|
Home-page: https://github.com/xorbitsai/inference
|
|
6
6
|
Author: Qin Xuye
|
|
@@ -61,12 +61,14 @@ Requires-Dist: jieba>=0.42.0; extra == "dev"
|
|
|
61
61
|
Requires-Dist: flake8>=3.8.0; extra == "dev"
|
|
62
62
|
Requires-Dist: black; extra == "dev"
|
|
63
63
|
Requires-Dist: openai>=1.40.0; extra == "dev"
|
|
64
|
+
Requires-Dist: anthropic; extra == "dev"
|
|
64
65
|
Requires-Dist: langchain; extra == "dev"
|
|
65
66
|
Requires-Dist: langchain-community; extra == "dev"
|
|
66
67
|
Requires-Dist: orjson; extra == "dev"
|
|
67
68
|
Requires-Dist: sphinx-tabs; extra == "dev"
|
|
68
69
|
Requires-Dist: sphinx-design; extra == "dev"
|
|
69
70
|
Provides-Extra: all
|
|
71
|
+
Requires-Dist: anthropic; extra == "all"
|
|
70
72
|
Requires-Dist: uv; extra == "all"
|
|
71
73
|
Requires-Dist: xllamacpp>=0.2.0; extra == "all"
|
|
72
74
|
Requires-Dist: transformers>=4.46.0; extra == "all"
|
|
@@ -115,7 +117,7 @@ Requires-Dist: torchvision; extra == "all"
|
|
|
115
117
|
Requires-Dist: gguf; extra == "all"
|
|
116
118
|
Requires-Dist: diffusers>=0.32.0; extra == "all"
|
|
117
119
|
Requires-Dist: imageio-ffmpeg; extra == "all"
|
|
118
|
-
Requires-Dist: funasr
|
|
120
|
+
Requires-Dist: funasr==1.2.7; extra == "all"
|
|
119
121
|
Requires-Dist: omegaconf~=2.3.0; extra == "all"
|
|
120
122
|
Requires-Dist: nemo_text_processing<1.1.0; sys_platform == "linux" and extra == "all"
|
|
121
123
|
Requires-Dist: WeTextProcessing<1.0.4; sys_platform == "linux" and extra == "all"
|
|
@@ -230,7 +232,7 @@ Provides-Extra: video
|
|
|
230
232
|
Requires-Dist: diffusers>=0.32.0; extra == "video"
|
|
231
233
|
Requires-Dist: imageio-ffmpeg; extra == "video"
|
|
232
234
|
Provides-Extra: audio
|
|
233
|
-
Requires-Dist: funasr
|
|
235
|
+
Requires-Dist: funasr==1.2.7; extra == "audio"
|
|
234
236
|
Requires-Dist: omegaconf~=2.3.0; extra == "audio"
|
|
235
237
|
Requires-Dist: nemo_text_processing<1.1.0; sys_platform == "linux" and extra == "audio"
|
|
236
238
|
Requires-Dist: WeTextProcessing<1.0.4; sys_platform == "linux" and extra == "audio"
|
|
@@ -292,6 +294,8 @@ Provides-Extra: benchmark
|
|
|
292
294
|
Requires-Dist: psutil; extra == "benchmark"
|
|
293
295
|
Provides-Extra: virtualenv
|
|
294
296
|
Requires-Dist: uv; extra == "virtualenv"
|
|
297
|
+
Provides-Extra: anthropic
|
|
298
|
+
Requires-Dist: anthropic; extra == "anthropic"
|
|
295
299
|
Dynamic: description
|
|
296
300
|
Dynamic: description-content-type
|
|
297
301
|
Dynamic: license-file
|
|
@@ -1,15 +1,15 @@
|
|
|
1
1
|
xinference/__init__.py,sha256=nmTTrYbIpj964ZF6ojtgOM7E85JBOj1EyQbmYjbj1jw,915
|
|
2
2
|
xinference/_compat.py,sha256=YF-lS6tX06zkFi2oFS0yq_LBn4hX_8u0Ft0vKxGALwA,4238
|
|
3
|
-
xinference/_version.py,sha256=
|
|
3
|
+
xinference/_version.py,sha256=_EWji1MNqQ79G4kHRFbbD_UdNhdfHKrUEJFT8lnM8fs,498
|
|
4
4
|
xinference/conftest.py,sha256=vETDpRBVIlWbWi7OTwf7og89U25KyYGyI7yPIB3O8N8,9564
|
|
5
|
-
xinference/constants.py,sha256=
|
|
5
|
+
xinference/constants.py,sha256=643I-3Hd-3BU6DRCMrohsW5HYp990WjYi1cbFwAxCL8,5117
|
|
6
6
|
xinference/device_utils.py,sha256=vt3GpNNfEfuJzXPb49bUnADyM2r4SqgG03ODiJO86sA,4953
|
|
7
7
|
xinference/fields.py,sha256=FaL9-jXDkn6kwupCmo-F6hh2JvMPJJzRWSUB1NKuhKc,5352
|
|
8
8
|
xinference/isolation.py,sha256=gTU1em5fxg1m-7hxieWBMZvVkXZX4GZYmeT7XxXsYrU,2699
|
|
9
|
-
xinference/types.py,sha256=
|
|
9
|
+
xinference/types.py,sha256=JvYmp3k693GhubCwz4nOeLTYMKi0eANjR8e6MwcHSl0,14617
|
|
10
10
|
xinference/utils.py,sha256=xMuOg3LZhTUf7inEhm-HmXCIoly0pHaWtMKMnnf8XGk,2273
|
|
11
11
|
xinference/api/__init__.py,sha256=h_JgzSqV5lP6vQ6XX_17kE4IY4BRnvKta_7VLQAL1ms,581
|
|
12
|
-
xinference/api/restful_api.py,sha256=
|
|
12
|
+
xinference/api/restful_api.py,sha256=I0aZwL6lKNxZDpApiFbxHVOoo24hdj3OswTC7UmsYMk,119876
|
|
13
13
|
xinference/api/oauth2/__init__.py,sha256=h_JgzSqV5lP6vQ6XX_17kE4IY4BRnvKta_7VLQAL1ms,581
|
|
14
14
|
xinference/api/oauth2/auth_service.py,sha256=74JzB42fbbmBu4Q1dW3A9Fp_N7167KgRGB42Z0NHjAM,6119
|
|
15
15
|
xinference/api/oauth2/types.py,sha256=K923sv_XySIUtM2Eozl9IG082IJcDOS5SFLrPZ5ELBg,996
|
|
@@ -28,7 +28,7 @@ xinference/core/model.py,sha256=9go5zbuDZ7MvUvymdp4cgX65K1LgxUw-xggZ04eBSfc,3966
|
|
|
28
28
|
xinference/core/progress_tracker.py,sha256=CNCc1ZVscvp-JJznPTYJDPuis7ya6ZothZUIalDcxDo,6798
|
|
29
29
|
xinference/core/resource.py,sha256=aTV89dmuKxw5JnwQglRkA2Wxu1EBLM5WjmLxITSXYgs,1808
|
|
30
30
|
xinference/core/status_guard.py,sha256=VLhyqpobdclfyzcROqf4bmGDiKpuHllto316X3Z6Hrc,2860
|
|
31
|
-
xinference/core/supervisor.py,sha256=
|
|
31
|
+
xinference/core/supervisor.py,sha256=Gxo1jFtqDc-yuU5Zg3uaXL3NmADlrAIDy_l2DyUDu48,75814
|
|
32
32
|
xinference/core/utils.py,sha256=VgcvxpTr2Q8am3MoHp7JPjC7jLYlKX2kLVdBo2Q_fRo,10430
|
|
33
33
|
xinference/core/worker.py,sha256=_t2T7xd_47-y4A2i62uZkV4pDpYJebVFqE8eu_PrcLQ,62252
|
|
34
34
|
xinference/deploy/__init__.py,sha256=h_JgzSqV5lP6vQ6XX_17kE4IY4BRnvKta_7VLQAL1ms,581
|
|
@@ -46,18 +46,19 @@ xinference/model/custom.py,sha256=byW3aBEUAaWPS9jAyEoabZ0ktRGJixSyyuDb6Dp-OOo,65
|
|
|
46
46
|
xinference/model/utils.py,sha256=pH6yhCJnDoakJMcWXgQ8jL9_59OVJEx90q1Oox-hXyE,20630
|
|
47
47
|
xinference/model/audio/__init__.py,sha256=RPf_feWYEh_BfMmwRkehIOBK5vUx6AadMHXp1d6EAk4,3473
|
|
48
48
|
xinference/model/audio/chattts.py,sha256=LmwD-X1XFKhVwA5ruqEQJ7VOiHIVwMuJrL7cH82poNE,4154
|
|
49
|
-
xinference/model/audio/core.py,sha256=
|
|
49
|
+
xinference/model/audio/core.py,sha256=OBXE7S9HwAP_u7jhE_C8oixW5ZsdH21d-zHpXnGp9Ko,6777
|
|
50
50
|
xinference/model/audio/cosyvoice.py,sha256=opy0EK6ePS966Jy2CjjR1jEB30a4pKbYJbXnqC7jPQ4,7221
|
|
51
51
|
xinference/model/audio/custom.py,sha256=UqiXQ1N9kDfcNOCxUmYnmS_kHOIVrrJvJrpUitAydCw,3107
|
|
52
52
|
xinference/model/audio/f5tts.py,sha256=if2IxLKurIfIbLzSmeOtqFG3xoVEQ_Ax_GK7eYCVl28,6848
|
|
53
53
|
xinference/model/audio/f5tts_mlx.py,sha256=RXtP5MPm8ewMt4mPbpu93QmEPAWecM_dC_aHCz0_uzY,8566
|
|
54
54
|
xinference/model/audio/fish_speech.py,sha256=ljufZldrChWzC6hZj2j222DKqz9HP4aZ8f4XjgzRgEo,6113
|
|
55
55
|
xinference/model/audio/funasr.py,sha256=L-seUq_y-rwC3sadyrYb7VUOF82AUizpdpHYYt8f9Z8,6231
|
|
56
|
-
xinference/model/audio/kokoro.py,sha256=
|
|
56
|
+
xinference/model/audio/kokoro.py,sha256=IF5EEh7-jW3vgeItBCV_nbzf6uBqehX9OrZjfyiuOcI,3785
|
|
57
57
|
xinference/model/audio/kokoro_mlx.py,sha256=9ZkJsz4wvFpVmpMTi8BEn10ICx7lev5ezpoBPLvSQTk,3475
|
|
58
|
+
xinference/model/audio/kokoro_zh.py,sha256=g1zDsOTLWCcgGBkZrDFnJ6E8vPFQMscCs-zi5MigMok,3951
|
|
58
59
|
xinference/model/audio/megatts.py,sha256=K2n-EfJHbyv3qC0tlnhm68Q2zZDVkgHAlQpHrf3s2pU,3408
|
|
59
60
|
xinference/model/audio/melotts.py,sha256=n3jKYKeoXwHlQrocSUdS_Wry6ATVXKwZyXrJpePvJU4,3532
|
|
60
|
-
xinference/model/audio/model_spec.json,sha256=
|
|
61
|
+
xinference/model/audio/model_spec.json,sha256=EEHS0GKs5cOqyBt7ehM5-nP9tr22Sh-j-9WZpdILNr8,22387
|
|
61
62
|
xinference/model/audio/utils.py,sha256=DveA9EW3hZAlaYcGZ00AewacC631bcynwjH9fcfvPJc,4261
|
|
62
63
|
xinference/model/audio/whisper.py,sha256=kgzZOGzGDC8odM_syKY0eEP7f1BvMSxOP2quZsFoBVM,9097
|
|
63
64
|
xinference/model/audio/whisper_mlx.py,sha256=DIOTrBh-LVT_dzySjV7ax-J5lgTXg0-Cqvbq9ctHD7o,7276
|
|
@@ -72,9 +73,9 @@ xinference/model/embedding/flag/core.py,sha256=n84TMXGWZT8TOIbo7DDllDmKWL6qPblPg
|
|
|
72
73
|
xinference/model/embedding/llama_cpp/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
73
74
|
xinference/model/embedding/llama_cpp/core.py,sha256=Hipbs9mFM2iyev2oqf5bQnREYZbbzmp3J7OndQDGz3E,9084
|
|
74
75
|
xinference/model/embedding/sentence_transformers/__init__.py,sha256=CyLLkbImZouAk4lePIgKXT4WQoqyauIEwdqea5IOUVU,581
|
|
75
|
-
xinference/model/embedding/sentence_transformers/core.py,sha256=
|
|
76
|
+
xinference/model/embedding/sentence_transformers/core.py,sha256=huBp54uAWT5VKhAgpF0LK5h5LGZyCijlJ-IgqlKiEMk,18139
|
|
76
77
|
xinference/model/embedding/vllm/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
77
|
-
xinference/model/embedding/vllm/core.py,sha256=
|
|
78
|
+
xinference/model/embedding/vllm/core.py,sha256=tcS2Gc93Fv6NWmbMF9JjuKRDQVkpcoowJVSRaAZLECA,6890
|
|
78
79
|
xinference/model/flexible/__init__.py,sha256=ASs6q89T6X5oTj1uAYmahpRNnUVntC5d5HEuox1U3xw,1887
|
|
79
80
|
xinference/model/flexible/core.py,sha256=DCCnZ3oaZJVFxOVZilBI26yC9rNM7B6te87vbOk_U8o,4031
|
|
80
81
|
xinference/model/flexible/custom.py,sha256=EhZ2voduhM-_M3S4R0SwsuKFzS6FUXyNxS3RkqnQZjQ,2216
|
|
@@ -88,7 +89,7 @@ xinference/model/image/__init__.py,sha256=X43XSNSbQrVlU82jgKxrX965o6uGO-GPMvLvyb
|
|
|
88
89
|
xinference/model/image/cache_manager.py,sha256=Ccc0SRWdq8qiLhrRwh4LYZLiHZ6ywQTEz6VdyFHnE2Y,4700
|
|
89
90
|
xinference/model/image/core.py,sha256=0JD_91jl1Q0yxu3_H7S2dQjR3eHKfM6a6jjzp1LQZME,9515
|
|
90
91
|
xinference/model/image/custom.py,sha256=THn9AZUdPtV0BmMO1tUTpMEXBQkzfle8p5685ZYcqek,1969
|
|
91
|
-
xinference/model/image/model_spec.json,sha256=
|
|
92
|
+
xinference/model/image/model_spec.json,sha256=mjVd_bE3IIP41VpxeYrUx2fdv375dLvNMNHjzuBYabc,22312
|
|
92
93
|
xinference/model/image/sdapi.py,sha256=Xgdtnvw4Xwj1Nc0cBoDo_ogH6E2mFJqLvX0jSxxgdnA,5936
|
|
93
94
|
xinference/model/image/utils.py,sha256=wXqZRHqn11qERJKfYkK4nDSNanjNXsg1xaG2nVAs01Y,2344
|
|
94
95
|
xinference/model/image/ocr/__init__.py,sha256=h_JgzSqV5lP6vQ6XX_17kE4IY4BRnvKta_7VLQAL1ms,581
|
|
@@ -100,20 +101,20 @@ xinference/model/image/stable_diffusion/core.py,sha256=gr39tURTzw5OvrhcygI5YnrXL
|
|
|
100
101
|
xinference/model/image/stable_diffusion/mlx.py,sha256=caWbXNAvGIbg6FvG1M6BFFXzsPUltI2Fhhu-lpMPirY,7487
|
|
101
102
|
xinference/model/llm/__init__.py,sha256=cZ5ckp_dye6ftr5iC_f31rTkKbE3AWEZOCbD0hzy39k,8842
|
|
102
103
|
xinference/model/llm/cache_manager.py,sha256=7Ult1h8JCcwd05g95Kwm3j7qIaaK3phyW9LQNAzrHmY,11253
|
|
103
|
-
xinference/model/llm/core.py,sha256
|
|
104
|
+
xinference/model/llm/core.py,sha256=-gjkSXcytd3W2u-dDiJrQujAKJZXWPf3XGeCyVqYYCc,9221
|
|
104
105
|
xinference/model/llm/custom.py,sha256=uRJGWICXvaAKKnVYM7gyWO9e_x6jzz9dWZWH92UWpAE,2761
|
|
105
106
|
xinference/model/llm/harmony.py,sha256=E1KqpFn2lz9uxegbpnrYqQAL1Gx8BfBVB8gyiblWccg,9900
|
|
106
|
-
xinference/model/llm/llm_family.json,sha256=
|
|
107
|
-
xinference/model/llm/llm_family.py,sha256=
|
|
107
|
+
xinference/model/llm/llm_family.json,sha256=0UMONTTP2Q9tkwmRlXTxKkxM30NI2hAmJjh3_X-gsKo,774530
|
|
108
|
+
xinference/model/llm/llm_family.py,sha256=H92Mtq8NJavwenI3BPyTHVHLrlgfUXcy2LGN1OCA7pE,21381
|
|
108
109
|
xinference/model/llm/memory.py,sha256=y8fBjIGd6zIPkgIxGtjakD7GPLW3VoM4m6x1UBM6IKs,10144
|
|
109
110
|
xinference/model/llm/reasoning_parser.py,sha256=sk5KuteBMGK0A0-ooq3nB9scP1SS8WxWS_b5OYiDD68,17449
|
|
110
|
-
xinference/model/llm/utils.py,sha256=
|
|
111
|
+
xinference/model/llm/utils.py,sha256=j_zRlHoXCpEtOUGExVyuXcW3y6Edmgdz2HaQVFCnbLs,42019
|
|
111
112
|
xinference/model/llm/llama_cpp/__init__.py,sha256=h_JgzSqV5lP6vQ6XX_17kE4IY4BRnvKta_7VLQAL1ms,581
|
|
112
|
-
xinference/model/llm/llama_cpp/core.py,sha256
|
|
113
|
+
xinference/model/llm/llama_cpp/core.py,sha256=-KfD1TUfMhfHCn6jvoLihgTXBszkkMHoVd1nf4w3oPU,14071
|
|
113
114
|
xinference/model/llm/lmdeploy/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
114
115
|
xinference/model/llm/lmdeploy/core.py,sha256=DAUHO1AxPA10C7zovxXQe8Qr8yPF1PqyHKAUkrFbI_k,19895
|
|
115
116
|
xinference/model/llm/mlx/__init__.py,sha256=h_JgzSqV5lP6vQ6XX_17kE4IY4BRnvKta_7VLQAL1ms,581
|
|
116
|
-
xinference/model/llm/mlx/core.py,sha256=
|
|
117
|
+
xinference/model/llm/mlx/core.py,sha256=5nxHxEFI2x6DVDWUln3HBoxf4NfeLN2P3rhV9zKwOMU,35482
|
|
117
118
|
xinference/model/llm/mlx/distributed_models/__init__.py,sha256=h_JgzSqV5lP6vQ6XX_17kE4IY4BRnvKta_7VLQAL1ms,581
|
|
118
119
|
xinference/model/llm/mlx/distributed_models/core.py,sha256=0pYu9SiBwVxTJ04yf_lDzRvjBrbdDQfWobWzJA89HLo,5744
|
|
119
120
|
xinference/model/llm/mlx/distributed_models/deepseek_v3.py,sha256=oH6Yv7rzEL644gnA_rqBgU4hICpppUTaaQtwiODwfig,2441
|
|
@@ -121,10 +122,17 @@ xinference/model/llm/mlx/distributed_models/qwen2.py,sha256=B7YifMQqDujnrxCnjJZb
|
|
|
121
122
|
xinference/model/llm/mlx/distributed_models/qwen3.py,sha256=mconllhlTKOY96UP6Y9G3kBppSbP5kYCcziDeBEdtVY,2586
|
|
122
123
|
xinference/model/llm/mlx/distributed_models/qwen3_moe.py,sha256=_d__HWDYfL1wAUAa-0xWiszLC6AYkGLQ5eTVtsi5Pc4,2380
|
|
123
124
|
xinference/model/llm/sglang/__init__.py,sha256=-sjSIQ4K6w-TEzx49kVaWeWC443fnZqODU91GCQ_JNo,581
|
|
124
|
-
xinference/model/llm/sglang/core.py,sha256=
|
|
125
|
+
xinference/model/llm/sglang/core.py,sha256=t5SoPiKxnRu4BJCaPc0H62S0-HiUnUvJYU3TuOjfeyU,29462
|
|
126
|
+
xinference/model/llm/tool_parsers/__init__.py,sha256=FqS5V2v-HpBy5J9IWaw7ZfZ5_fzAtYeVG0WN-bmL98o,1778
|
|
127
|
+
xinference/model/llm/tool_parsers/abstract_tool_parser.py,sha256=7D2ihK7Ny9LNmHcezcEKYNwe8GIZJHydFZlWDg4xXpE,1312
|
|
128
|
+
xinference/model/llm/tool_parsers/deepseek_r1_tool_parser.py,sha256=anjzpOlEeeFaqm0fRmpvXx585_kyqb-SgdCZhfRjTwM,4942
|
|
129
|
+
xinference/model/llm/tool_parsers/deepseek_v3_tool_parser.py,sha256=T1CPzomvTj8HoGBCHTYm2FqFqd62WNxMqTjhST0b1pk,5146
|
|
130
|
+
xinference/model/llm/tool_parsers/glm4_tool_parser.py,sha256=YBittOVGwQOPYtXHDWdxpO2vGUg5XapYdcfWPH1Kseg,4313
|
|
131
|
+
xinference/model/llm/tool_parsers/llama3_tool_parser.py,sha256=vBD39Ub2ha0CXRCOtGu97i8eNyZ_2cDShT3yqxK8W5o,2787
|
|
132
|
+
xinference/model/llm/tool_parsers/qwen_tool_parser.py,sha256=y6UxvJ70RbvmcyUDgZGkQwn_uTyz-grjlNS1D-_Nv8E,11746
|
|
125
133
|
xinference/model/llm/transformers/__init__.py,sha256=_4hQ7BvHNE4WAyzNcTB0_iY5mBcaPGTkLvQcWiylBoI,1724
|
|
126
134
|
xinference/model/llm/transformers/chatglm.py,sha256=ovDSYZet7bdqloO_WXaH9a6Rv6FyQ_BrY5dkejqvyBc,22953
|
|
127
|
-
xinference/model/llm/transformers/core.py,sha256=
|
|
135
|
+
xinference/model/llm/transformers/core.py,sha256=tV48CxsTVqMfLbqfJgBuGubQe3gzlJMfKWQOZxMJUAs,40086
|
|
128
136
|
xinference/model/llm/transformers/deepseek_v2.py,sha256=4LB_grDfdaXBCdTwduqpWFrYoeKsMnBERWTxcNl7EfA,2624
|
|
129
137
|
xinference/model/llm/transformers/gemma3.py,sha256=oH5SwLM7aX-8zMPO7918x2BKDZGJgeFdZ5FduHiDDQI,5490
|
|
130
138
|
xinference/model/llm/transformers/gpt_oss.py,sha256=uPO0WsDlxxd9KY3mlldyZyQIcogPk-rDxL-LHbIgSuc,3386
|
|
@@ -145,7 +153,7 @@ xinference/model/llm/transformers/multimodal/qwen-omni.py,sha256=tEZZAsnQssinF4s
|
|
|
145
153
|
xinference/model/llm/transformers/multimodal/qwen2_audio.py,sha256=wFzyTyNvSfTKA4opMeYHT4m4SpmAbcUfvkc16Bf4FRA,4680
|
|
146
154
|
xinference/model/llm/transformers/multimodal/qwen2_vl.py,sha256=b_gm_g2-seFpTB68-G3n_k2JKQqBxZa8KOg2STJPB7U,8594
|
|
147
155
|
xinference/model/llm/vllm/__init__.py,sha256=h_JgzSqV5lP6vQ6XX_17kE4IY4BRnvKta_7VLQAL1ms,581
|
|
148
|
-
xinference/model/llm/vllm/core.py,sha256=
|
|
156
|
+
xinference/model/llm/vllm/core.py,sha256=9Wo_EiAeMIsmf9FbRl8X0zKjWqSvur5ddlJBwLBtZNE,59152
|
|
149
157
|
xinference/model/llm/vllm/distributed_executor.py,sha256=8bFU4JSgvbBTrhGZhsANfMUX4DR6es1zw-cljVLkTBw,14125
|
|
150
158
|
xinference/model/llm/vllm/utils.py,sha256=LKOmwfFRrlSecawxT-uE39tC2RQbf1UIiSH9Uz90X6w,1313
|
|
151
159
|
xinference/model/llm/vllm/xavier/__init__.py,sha256=CyLLkbImZouAk4lePIgKXT4WQoqyauIEwdqea5IOUVU,581
|
|
@@ -15804,9 +15812,9 @@ xinference/ui/web/ui/src/locales/en.json,sha256=2K1xlg0dY0Xw208qW0bdJlE7XL2dbouC
|
|
|
15804
15812
|
xinference/ui/web/ui/src/locales/ja.json,sha256=EZmLCN1smdXmvR-tqFLIgelrIFRKGr6zf7x519DUpuA,11952
|
|
15805
15813
|
xinference/ui/web/ui/src/locales/ko.json,sha256=pEVoh1jyaqliaNTLOt2d4wDkeVQGQB_pGMjNllNERA8,10805
|
|
15806
15814
|
xinference/ui/web/ui/src/locales/zh.json,sha256=IY_eaPEE870ggqOMr_p9gjAu8IIoF6-3w_SlAyn-EGY,9859
|
|
15807
|
-
xinference-1.
|
|
15808
|
-
xinference-1.
|
|
15809
|
-
xinference-1.
|
|
15810
|
-
xinference-1.
|
|
15811
|
-
xinference-1.
|
|
15812
|
-
xinference-1.
|
|
15815
|
+
xinference-1.10.0.dist-info/licenses/LICENSE,sha256=QwcOLU5TJoTeUhuIXzhdCEEDDvorGiC6-3YTOl4TecE,11356
|
|
15816
|
+
xinference-1.10.0.dist-info/METADATA,sha256=VtKqtNrNEAlR4Wn_mmPax6ntXIw2vOtxcA8pPfIlIlU,26568
|
|
15817
|
+
xinference-1.10.0.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
15818
|
+
xinference-1.10.0.dist-info/entry_points.txt,sha256=-lDyyzqWMFQF0Rgm7VxBNz0V-bMBMQLRR3pvQ-Y8XTY,226
|
|
15819
|
+
xinference-1.10.0.dist-info/top_level.txt,sha256=L1rQt7pl6m8tmKXpWVHzP-GtmzAxp663rXxGE7qnK00,11
|
|
15820
|
+
xinference-1.10.0.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|