xinference 1.7.1.post1__py3-none-any.whl → 1.8.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of xinference might be problematic. Click here for more details.
- xinference/_version.py +3 -3
- xinference/client/restful/async_restful_client.py +8 -13
- xinference/client/restful/restful_client.py +6 -2
- xinference/core/chat_interface.py +6 -4
- xinference/core/media_interface.py +5 -0
- xinference/core/model.py +1 -5
- xinference/core/supervisor.py +117 -68
- xinference/core/worker.py +49 -37
- xinference/deploy/test/test_cmdline.py +2 -6
- xinference/model/audio/__init__.py +26 -23
- xinference/model/audio/chattts.py +3 -2
- xinference/model/audio/core.py +49 -98
- xinference/model/audio/cosyvoice.py +3 -2
- xinference/model/audio/custom.py +28 -73
- xinference/model/audio/f5tts.py +3 -2
- xinference/model/audio/f5tts_mlx.py +3 -2
- xinference/model/audio/fish_speech.py +3 -2
- xinference/model/audio/funasr.py +17 -4
- xinference/model/audio/kokoro.py +3 -2
- xinference/model/audio/megatts.py +3 -2
- xinference/model/audio/melotts.py +3 -2
- xinference/model/audio/model_spec.json +572 -171
- xinference/model/audio/utils.py +0 -6
- xinference/model/audio/whisper.py +3 -2
- xinference/model/audio/whisper_mlx.py +3 -2
- xinference/model/cache_manager.py +141 -0
- xinference/model/core.py +6 -49
- xinference/model/custom.py +174 -0
- xinference/model/embedding/__init__.py +67 -56
- xinference/model/embedding/cache_manager.py +35 -0
- xinference/model/embedding/core.py +104 -84
- xinference/model/embedding/custom.py +55 -78
- xinference/model/embedding/embed_family.py +80 -31
- xinference/model/embedding/flag/core.py +21 -5
- xinference/model/embedding/llama_cpp/__init__.py +0 -0
- xinference/model/embedding/llama_cpp/core.py +234 -0
- xinference/model/embedding/model_spec.json +968 -103
- xinference/model/embedding/sentence_transformers/core.py +30 -20
- xinference/model/embedding/vllm/core.py +11 -5
- xinference/model/flexible/__init__.py +8 -2
- xinference/model/flexible/core.py +26 -119
- xinference/model/flexible/custom.py +69 -0
- xinference/model/flexible/launchers/image_process_launcher.py +1 -0
- xinference/model/flexible/launchers/modelscope_launcher.py +5 -1
- xinference/model/flexible/launchers/transformers_launcher.py +15 -3
- xinference/model/flexible/launchers/yolo_launcher.py +5 -1
- xinference/model/image/__init__.py +20 -20
- xinference/model/image/cache_manager.py +62 -0
- xinference/model/image/core.py +70 -182
- xinference/model/image/custom.py +28 -72
- xinference/model/image/model_spec.json +402 -119
- xinference/model/image/ocr/got_ocr2.py +3 -2
- xinference/model/image/stable_diffusion/core.py +22 -7
- xinference/model/image/stable_diffusion/mlx.py +6 -6
- xinference/model/image/utils.py +2 -2
- xinference/model/llm/__init__.py +71 -94
- xinference/model/llm/cache_manager.py +292 -0
- xinference/model/llm/core.py +37 -111
- xinference/model/llm/custom.py +88 -0
- xinference/model/llm/llama_cpp/core.py +5 -7
- xinference/model/llm/llm_family.json +16260 -8151
- xinference/model/llm/llm_family.py +138 -839
- xinference/model/llm/lmdeploy/core.py +5 -7
- xinference/model/llm/memory.py +3 -4
- xinference/model/llm/mlx/core.py +6 -8
- xinference/model/llm/reasoning_parser.py +3 -1
- xinference/model/llm/sglang/core.py +32 -14
- xinference/model/llm/transformers/chatglm.py +3 -7
- xinference/model/llm/transformers/core.py +49 -27
- xinference/model/llm/transformers/deepseek_v2.py +2 -2
- xinference/model/llm/transformers/gemma3.py +2 -2
- xinference/model/llm/transformers/multimodal/cogagent.py +2 -2
- xinference/model/llm/transformers/multimodal/deepseek_vl2.py +2 -2
- xinference/model/llm/transformers/multimodal/gemma3.py +2 -2
- xinference/model/llm/transformers/multimodal/glm4_1v.py +167 -0
- xinference/model/llm/transformers/multimodal/glm4v.py +2 -2
- xinference/model/llm/transformers/multimodal/intern_vl.py +2 -2
- xinference/model/llm/transformers/multimodal/minicpmv26.py +3 -3
- xinference/model/llm/transformers/multimodal/ovis2.py +2 -2
- xinference/model/llm/transformers/multimodal/qwen-omni.py +2 -2
- xinference/model/llm/transformers/multimodal/qwen2_audio.py +2 -2
- xinference/model/llm/transformers/multimodal/qwen2_vl.py +2 -2
- xinference/model/llm/transformers/opt.py +3 -7
- xinference/model/llm/utils.py +34 -49
- xinference/model/llm/vllm/core.py +77 -27
- xinference/model/llm/vllm/xavier/engine.py +5 -3
- xinference/model/llm/vllm/xavier/scheduler.py +10 -6
- xinference/model/llm/vllm/xavier/transfer.py +1 -1
- xinference/model/rerank/__init__.py +26 -25
- xinference/model/rerank/core.py +47 -87
- xinference/model/rerank/custom.py +25 -71
- xinference/model/rerank/model_spec.json +158 -33
- xinference/model/rerank/utils.py +2 -2
- xinference/model/utils.py +115 -54
- xinference/model/video/__init__.py +13 -17
- xinference/model/video/core.py +44 -102
- xinference/model/video/diffusers.py +4 -3
- xinference/model/video/model_spec.json +90 -21
- xinference/types.py +5 -3
- xinference/web/ui/build/asset-manifest.json +3 -3
- xinference/web/ui/build/index.html +1 -1
- xinference/web/ui/build/static/js/main.7d24df53.js +3 -0
- xinference/web/ui/build/static/js/main.7d24df53.js.map +1 -0
- xinference/web/ui/node_modules/.cache/babel-loader/2704ff66a5f73ca78b341eb3edec60154369df9d87fbc8c6dd60121abc5e1b0a.json +1 -0
- xinference/web/ui/node_modules/.cache/babel-loader/607dfef23d33e6b594518c0c6434567639f24f356b877c80c60575184ec50ed0.json +1 -0
- xinference/web/ui/node_modules/.cache/babel-loader/9be3d56173aacc3efd0b497bcb13c4f6365de30069176ee9403b40e717542326.json +1 -0
- xinference/web/ui/node_modules/.cache/babel-loader/9f9dd6c32c78a222d07da5987ae902effe16bcf20aac00774acdccc4de3c9ff2.json +1 -0
- xinference/web/ui/node_modules/.cache/babel-loader/b2ab5ee972c60d15eb9abf5845705f8ab7e1d125d324d9a9b1bcae5d6fd7ffb2.json +1 -0
- xinference/web/ui/src/locales/en.json +0 -1
- xinference/web/ui/src/locales/ja.json +0 -1
- xinference/web/ui/src/locales/ko.json +0 -1
- xinference/web/ui/src/locales/zh.json +0 -1
- {xinference-1.7.1.post1.dist-info → xinference-1.8.0.dist-info}/METADATA +9 -11
- {xinference-1.7.1.post1.dist-info → xinference-1.8.0.dist-info}/RECORD +119 -119
- xinference/model/audio/model_spec_modelscope.json +0 -231
- xinference/model/embedding/model_spec_modelscope.json +0 -293
- xinference/model/embedding/utils.py +0 -18
- xinference/model/image/model_spec_modelscope.json +0 -375
- xinference/model/llm/llama_cpp/memory.py +0 -457
- xinference/model/llm/llm_family_csghub.json +0 -56
- xinference/model/llm/llm_family_modelscope.json +0 -8700
- xinference/model/llm/llm_family_openmind_hub.json +0 -1019
- xinference/model/rerank/model_spec_modelscope.json +0 -85
- xinference/model/video/model_spec_modelscope.json +0 -184
- xinference/web/ui/build/static/js/main.9b12b7f9.js +0 -3
- xinference/web/ui/build/static/js/main.9b12b7f9.js.map +0 -1
- xinference/web/ui/node_modules/.cache/babel-loader/1460361af6975e63576708039f1cb732faf9c672d97c494d4055fc6331460be0.json +0 -1
- xinference/web/ui/node_modules/.cache/babel-loader/4efd8dda58fda83ed9546bf2f587df67f8d98e639117bee2d9326a9a1d9bebb2.json +0 -1
- xinference/web/ui/node_modules/.cache/babel-loader/55b9fb40b57fa926e8f05f31c2f96467e76e5ad62f033dca97c03f9e8c4eb4fe.json +0 -1
- xinference/web/ui/node_modules/.cache/babel-loader/5b2dafe5aa9e1105e0244a2b6751807342fa86aa0144b4e84d947a1686102715.json +0 -1
- xinference/web/ui/node_modules/.cache/babel-loader/611fa2c6c53b66039991d06dfb0473b5ab37fc63b4564e0f6e1718523768a045.json +0 -1
- /xinference/web/ui/build/static/js/{main.9b12b7f9.js.LICENSE.txt → main.7d24df53.js.LICENSE.txt} +0 -0
- {xinference-1.7.1.post1.dist-info → xinference-1.8.0.dist-info}/WHEEL +0 -0
- {xinference-1.7.1.post1.dist-info → xinference-1.8.0.dist-info}/entry_points.txt +0 -0
- {xinference-1.7.1.post1.dist-info → xinference-1.8.0.dist-info}/licenses/LICENSE +0 -0
- {xinference-1.7.1.post1.dist-info → xinference-1.8.0.dist-info}/top_level.txt +0 -0
|
@@ -1,85 +0,0 @@
|
|
|
1
|
-
[
|
|
2
|
-
{
|
|
3
|
-
"model_name": "bge-reranker-base",
|
|
4
|
-
"type": "normal",
|
|
5
|
-
"language": ["en", "zh"],
|
|
6
|
-
"max_tokens": 512,
|
|
7
|
-
"model_id": "Xorbits/bge-reranker-base",
|
|
8
|
-
"model_revision": "v0.0.1",
|
|
9
|
-
"model_hub": "modelscope"
|
|
10
|
-
},
|
|
11
|
-
{
|
|
12
|
-
"model_name": "bge-reranker-large",
|
|
13
|
-
"type": "normal",
|
|
14
|
-
"language": ["en", "zh"],
|
|
15
|
-
"max_tokens": 512,
|
|
16
|
-
"model_id": "Xorbits/bge-reranker-large",
|
|
17
|
-
"model_revision": "v0.0.1",
|
|
18
|
-
"model_hub": "modelscope"
|
|
19
|
-
},
|
|
20
|
-
{
|
|
21
|
-
"model_name": "bce-reranker-base_v1",
|
|
22
|
-
"type": "normal",
|
|
23
|
-
"language": ["en", "zh"],
|
|
24
|
-
"max_tokens": 512,
|
|
25
|
-
"model_id": "maidalun/bce-reranker-base_v1",
|
|
26
|
-
"model_revision": "v0.0.1",
|
|
27
|
-
"model_hub": "modelscope"
|
|
28
|
-
},
|
|
29
|
-
{
|
|
30
|
-
"model_name": "bge-reranker-v2-m3",
|
|
31
|
-
"type": "normal",
|
|
32
|
-
"max_tokens": 8192,
|
|
33
|
-
"language": ["en", "zh", "multilingual"],
|
|
34
|
-
"model_id": "AI-ModelScope/bge-reranker-v2-m3",
|
|
35
|
-
"model_hub": "modelscope"
|
|
36
|
-
},
|
|
37
|
-
{
|
|
38
|
-
"model_name": "bge-reranker-v2-gemma",
|
|
39
|
-
"type": "LLM-based",
|
|
40
|
-
"language": ["en", "zh", "multilingual"],
|
|
41
|
-
"max_tokens": 8192,
|
|
42
|
-
"model_id": "AI-ModelScope/bge-reranker-v2-gemma",
|
|
43
|
-
"model_hub": "modelscope"
|
|
44
|
-
},
|
|
45
|
-
{
|
|
46
|
-
"model_name": "bge-reranker-v2-minicpm-layerwise",
|
|
47
|
-
"type": "LLM-based layerwise",
|
|
48
|
-
"language": ["en", "zh", "multilingual"],
|
|
49
|
-
"max_tokens": 2048,
|
|
50
|
-
"model_id": "mirror013/bge-reranker-v2-minicpm-layerwise",
|
|
51
|
-
"model_hub": "modelscope"
|
|
52
|
-
},
|
|
53
|
-
{
|
|
54
|
-
"model_name": "minicpm-reranker",
|
|
55
|
-
"type": "normal",
|
|
56
|
-
"language": ["en", "zh"],
|
|
57
|
-
"max_tokens": 1024,
|
|
58
|
-
"model_id": "OpenBMB/MiniCPM-Reranker",
|
|
59
|
-
"model_hub": "modelscope"
|
|
60
|
-
},
|
|
61
|
-
{
|
|
62
|
-
"model_name": "Qwen3-Reranker-0.6B",
|
|
63
|
-
"type": "normal",
|
|
64
|
-
"language": ["en", "zh"],
|
|
65
|
-
"max_tokens": 32768,
|
|
66
|
-
"model_id": "Qwen/Qwen3-Reranker-0.6B",
|
|
67
|
-
"model_hub": "modelscope"
|
|
68
|
-
},
|
|
69
|
-
{
|
|
70
|
-
"model_name": "Qwen3-Reranker-4B",
|
|
71
|
-
"type": "normal",
|
|
72
|
-
"language": ["en", "zh"],
|
|
73
|
-
"max_tokens": 32768,
|
|
74
|
-
"model_id": "Qwen/Qwen3-Reranker-4B",
|
|
75
|
-
"model_hub": "modelscope"
|
|
76
|
-
},
|
|
77
|
-
{
|
|
78
|
-
"model_name": "Qwen3-Reranker-8B",
|
|
79
|
-
"type": "normal",
|
|
80
|
-
"language": ["en", "zh"],
|
|
81
|
-
"max_tokens": 32768,
|
|
82
|
-
"model_id": "Qwen/Qwen3-Reranker-8B",
|
|
83
|
-
"model_hub": "modelscope"
|
|
84
|
-
}
|
|
85
|
-
]
|
|
@@ -1,184 +0,0 @@
|
|
|
1
|
-
[
|
|
2
|
-
{
|
|
3
|
-
"model_name": "CogVideoX-2b",
|
|
4
|
-
"model_family": "CogVideoX",
|
|
5
|
-
"model_hub": "modelscope",
|
|
6
|
-
"model_id": "ZhipuAI/CogVideoX-2b",
|
|
7
|
-
"model_revision": "master",
|
|
8
|
-
"model_ability": [
|
|
9
|
-
"text2video"
|
|
10
|
-
],
|
|
11
|
-
"default_model_config": {
|
|
12
|
-
"scheduler": "CogVideoXDDIMScheduler",
|
|
13
|
-
"torch_dtype": "float16"
|
|
14
|
-
},
|
|
15
|
-
"default_generate_config": {
|
|
16
|
-
"guidance_scale": 6
|
|
17
|
-
}
|
|
18
|
-
},
|
|
19
|
-
{
|
|
20
|
-
"model_name": "CogVideoX-5b",
|
|
21
|
-
"model_family": "CogVideoX",
|
|
22
|
-
"model_hub": "modelscope",
|
|
23
|
-
"model_id": "ZhipuAI/CogVideoX-5b",
|
|
24
|
-
"model_revision": "master",
|
|
25
|
-
"model_ability": [
|
|
26
|
-
"text2video"
|
|
27
|
-
],
|
|
28
|
-
"default_model_config": {
|
|
29
|
-
"scheduler": "CogVideoXDPMScheduler",
|
|
30
|
-
"torch_dtype": "bfloat16"
|
|
31
|
-
},
|
|
32
|
-
"default_generate_config": {
|
|
33
|
-
"guidance_scale": 7
|
|
34
|
-
}
|
|
35
|
-
},
|
|
36
|
-
{
|
|
37
|
-
"model_name": "HunyuanVideo",
|
|
38
|
-
"model_family": "HunyuanVideo",
|
|
39
|
-
"model_hub": "modelscope",
|
|
40
|
-
"model_id": "Xorbits/HunyuanVideo",
|
|
41
|
-
"model_revision": "master",
|
|
42
|
-
"model_ability": [
|
|
43
|
-
"text2video"
|
|
44
|
-
],
|
|
45
|
-
"default_model_config": {
|
|
46
|
-
"transformer_torch_dtype": "bfloat16",
|
|
47
|
-
"torch_dtype": "float16"
|
|
48
|
-
},
|
|
49
|
-
"default_generate_config": {
|
|
50
|
-
}
|
|
51
|
-
},
|
|
52
|
-
{
|
|
53
|
-
"model_name": "Wan2.1-1.3B",
|
|
54
|
-
"model_family": "Wan",
|
|
55
|
-
"model_hub": "modelscope",
|
|
56
|
-
"model_id": "Wan-AI/Wan2.1-T2V-1.3B-Diffusers",
|
|
57
|
-
"model_revision": "master",
|
|
58
|
-
"model_ability": [
|
|
59
|
-
"text2video"
|
|
60
|
-
],
|
|
61
|
-
"default_model_config": {
|
|
62
|
-
"torch_dtype": "bfloat16"
|
|
63
|
-
},
|
|
64
|
-
"default_generate_config": {
|
|
65
|
-
},
|
|
66
|
-
"virtualenv": {
|
|
67
|
-
"packages": [
|
|
68
|
-
"diffusers>=0.33.0",
|
|
69
|
-
"ftfy",
|
|
70
|
-
"imageio-ffmpeg",
|
|
71
|
-
"imageio",
|
|
72
|
-
"#system_numpy#"
|
|
73
|
-
]
|
|
74
|
-
}
|
|
75
|
-
},
|
|
76
|
-
{
|
|
77
|
-
"model_name": "Wan2.1-14B",
|
|
78
|
-
"model_family": "Wan",
|
|
79
|
-
"model_hub": "modelscope",
|
|
80
|
-
"model_id": "Wan-AI/Wan2.1-T2V-14B-Diffusers",
|
|
81
|
-
"model_revision": "master",
|
|
82
|
-
"model_ability": [
|
|
83
|
-
"text2video"
|
|
84
|
-
],
|
|
85
|
-
"default_model_config": {
|
|
86
|
-
"torch_dtype": "bfloat16"
|
|
87
|
-
},
|
|
88
|
-
"default_generate_config": {
|
|
89
|
-
},
|
|
90
|
-
"virtualenv": {
|
|
91
|
-
"packages": [
|
|
92
|
-
"diffusers>=0.33.0",
|
|
93
|
-
"ftfy",
|
|
94
|
-
"imageio-ffmpeg",
|
|
95
|
-
"imageio",
|
|
96
|
-
"#system_numpy#"
|
|
97
|
-
]
|
|
98
|
-
}
|
|
99
|
-
},
|
|
100
|
-
{
|
|
101
|
-
"model_name": "Wan2.1-i2v-14B-480p",
|
|
102
|
-
"model_family": "Wan",
|
|
103
|
-
"model_hub": "modelscope",
|
|
104
|
-
"model_id": "Wan-AI/Wan2.1-I2V-14B-480P-Diffusers",
|
|
105
|
-
"model_revision": "master",
|
|
106
|
-
"model_ability": [
|
|
107
|
-
"image2video"
|
|
108
|
-
],
|
|
109
|
-
"default_model_config": {
|
|
110
|
-
"torch_dtype": "bfloat16"
|
|
111
|
-
},
|
|
112
|
-
"default_generate_config": {
|
|
113
|
-
"max_area": [
|
|
114
|
-
480,
|
|
115
|
-
832
|
|
116
|
-
]
|
|
117
|
-
},
|
|
118
|
-
"virtualenv": {
|
|
119
|
-
"packages": [
|
|
120
|
-
"diffusers>=0.33.0",
|
|
121
|
-
"ftfy",
|
|
122
|
-
"imageio-ffmpeg",
|
|
123
|
-
"imageio",
|
|
124
|
-
"#system_numpy#"
|
|
125
|
-
]
|
|
126
|
-
}
|
|
127
|
-
},
|
|
128
|
-
{
|
|
129
|
-
"model_name": "Wan2.1-i2v-14B-720p",
|
|
130
|
-
"model_family": "Wan",
|
|
131
|
-
"model_hub": "modelscope",
|
|
132
|
-
"model_id": "Wan-AI/Wan2.1-I2V-14B-720P-Diffusers",
|
|
133
|
-
"model_revision": "master",
|
|
134
|
-
"model_ability": [
|
|
135
|
-
"image2video"
|
|
136
|
-
],
|
|
137
|
-
"default_model_config": {
|
|
138
|
-
"torch_dtype": "bfloat16"
|
|
139
|
-
},
|
|
140
|
-
"default_generate_config": {
|
|
141
|
-
"max_area": [
|
|
142
|
-
720,
|
|
143
|
-
1280
|
|
144
|
-
]
|
|
145
|
-
},
|
|
146
|
-
"virtualenv": {
|
|
147
|
-
"packages": [
|
|
148
|
-
"diffusers>=0.33.0",
|
|
149
|
-
"ftfy",
|
|
150
|
-
"imageio-ffmpeg",
|
|
151
|
-
"imageio",
|
|
152
|
-
"#system_numpy#"
|
|
153
|
-
]
|
|
154
|
-
}
|
|
155
|
-
},
|
|
156
|
-
{
|
|
157
|
-
"model_name": "Wan2.1-flf2v-14B-720p",
|
|
158
|
-
"model_family": "Wan",
|
|
159
|
-
"model_hub": "modelscope",
|
|
160
|
-
"model_id": "Wan-AI/Wan2.1-FLF2V-14B-720P-diffusers",
|
|
161
|
-
"model_revision": "master",
|
|
162
|
-
"model_ability": [
|
|
163
|
-
"firstlastframe2video"
|
|
164
|
-
],
|
|
165
|
-
"default_model_config": {
|
|
166
|
-
"torch_dtype": "bfloat16"
|
|
167
|
-
},
|
|
168
|
-
"default_generate_config": {
|
|
169
|
-
"max_area": [
|
|
170
|
-
720,
|
|
171
|
-
1280
|
|
172
|
-
]
|
|
173
|
-
},
|
|
174
|
-
"virtualenv": {
|
|
175
|
-
"packages": [
|
|
176
|
-
"git+https://github.com/huggingface/diffusers",
|
|
177
|
-
"ftfy",
|
|
178
|
-
"imageio-ffmpeg",
|
|
179
|
-
"imageio",
|
|
180
|
-
"#system_numpy#"
|
|
181
|
-
]
|
|
182
|
-
}
|
|
183
|
-
}
|
|
184
|
-
]
|