xinference 1.11.0.post1__py3-none-any.whl → 1.12.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of xinference might be problematic. Click here for more details.

Files changed (39)
  1. xinference/__init__.py +8 -0
  2. xinference/_version.py +3 -3
  3. xinference/api/oauth2/utils.py +26 -5
  4. xinference/core/model.py +1 -10
  5. xinference/device_utils.py +11 -1
  6. xinference/model/embedding/model_spec.json +70 -0
  7. xinference/model/image/core.py +20 -10
  8. xinference/model/image/model_spec.json +55 -3
  9. xinference/model/image/ocr/__init__.py +5 -0
  10. xinference/model/image/ocr/deepseek_ocr.py +958 -0
  11. xinference/model/llm/core.py +2 -0
  12. xinference/model/llm/llama_cpp/core.py +2 -0
  13. xinference/model/llm/llm_family.json +319 -6
  14. xinference/model/llm/lmdeploy/core.py +2 -0
  15. xinference/model/llm/sglang/core.py +2 -0
  16. xinference/model/llm/transformers/core.py +2 -0
  17. xinference/model/llm/transformers/multimodal/qwen-omni.py +60 -11
  18. xinference/model/llm/transformers/multimodal/qwen2_vl.py +2 -2
  19. xinference/model/llm/vllm/core.py +2 -0
  20. xinference/model/rerank/model_spec.json +368 -252
  21. xinference/model/rerank/sentence_transformers/core.py +10 -2
  22. xinference/thirdparty/indextts/gpt/transformers_generation_utils.py +71 -5
  23. xinference/thirdparty/indextts/gpt/transformers_gpt2.py +51 -1
  24. xinference/ui/gradio/media_interface.py +469 -4
  25. xinference/ui/gradio/utils/__init__.py +19 -0
  26. xinference/ui/gradio/utils/latex.py +342 -0
  27. xinference/ui/web/ui/build/asset-manifest.json +3 -3
  28. xinference/ui/web/ui/build/index.html +1 -1
  29. xinference/ui/web/ui/build/static/js/{main.e4d9a9e1.js → main.87d6859b.js} +3 -3
  30. xinference/ui/web/ui/build/static/js/{main.e4d9a9e1.js.map → main.87d6859b.js.map} +1 -1
  31. xinference/ui/web/ui/node_modules/.cache/babel-loader/412a6b414a8267c7a349d9beda4593cdf218abf32edaaf339e6a230df40397b8.json +1 -0
  32. {xinference-1.11.0.post1.dist-info → xinference-1.12.0.dist-info}/METADATA +10 -11
  33. {xinference-1.11.0.post1.dist-info → xinference-1.12.0.dist-info}/RECORD +38 -35
  34. xinference/ui/web/ui/node_modules/.cache/babel-loader/bb4e8722d2d41d87f1fce3661bc8937bffe9448e231fc5f0462630849e851592.json +0 -1
  35. /xinference/ui/web/ui/build/static/js/{main.e4d9a9e1.js.LICENSE.txt → main.87d6859b.js.LICENSE.txt} +0 -0
  36. {xinference-1.11.0.post1.dist-info → xinference-1.12.0.dist-info}/WHEEL +0 -0
  37. {xinference-1.11.0.post1.dist-info → xinference-1.12.0.dist-info}/entry_points.txt +0 -0
  38. {xinference-1.11.0.post1.dist-info → xinference-1.12.0.dist-info}/licenses/LICENSE +0 -0
  39. {xinference-1.11.0.post1.dist-info → xinference-1.12.0.dist-info}/top_level.txt +0 -0
@@ -1,254 +1,370 @@
1
1
  [
2
- {
3
- "version": 2,
4
- "model_name": "bge-reranker-large",
5
- "type": "normal",
6
- "language": ["en", "zh"],
7
- "max_tokens": 512,
8
- "model_specs": [
9
- {
10
- "model_format": "pytorch",
11
- "model_src": {
12
- "huggingface": {
13
- "model_id": "BAAI/bge-reranker-large",
14
- "model_revision": "27c9168d479987529781de8474dff94d69beca11",
15
- "quantizations": ["none"]
16
- },
17
- "modelscope": {
18
- "model_id": "Xorbits/bge-reranker-large",
19
- "model_revision": "v0.0.1",
20
- "quantizations": ["none"]
21
- }
22
- }
23
- }
24
- ]
25
- },
26
- {
27
- "version": 2,
28
- "model_name": "bge-reranker-base",
29
- "type": "normal",
30
- "language": ["en", "zh"],
31
- "max_tokens": 512,
32
- "model_specs": [
33
- {
34
- "model_format": "pytorch",
35
- "model_src": {
36
- "huggingface": {
37
- "model_id": "BAAI/bge-reranker-base",
38
- "model_revision": "465b4b7ddf2be0a020c8ad6e525b9bb1dbb708ae",
39
- "quantizations": ["none"]
40
- },
41
- "modelscope": {
42
- "model_id": "Xorbits/bge-reranker-base",
43
- "model_revision": "v0.0.1",
44
- "quantizations": ["none"]
45
- }
46
- }
47
- }
48
- ]
49
- },
50
- {
51
- "version": 2,
52
- "model_name": "bce-reranker-base_v1",
53
- "type": "normal",
54
- "language": ["en", "zh"],
55
- "max_tokens": 512,
56
- "model_specs": [
57
- {
58
- "model_format": "pytorch",
59
- "model_src": {
60
- "huggingface": {
61
- "model_id": "maidalun1020/bce-reranker-base_v1",
62
- "model_revision": "eaa31a577a0574e87a08959bd229ca14ce1b5496",
63
- "quantizations": ["none"]
64
- },
65
- "modelscope": {
66
- "model_id": "maidalun/bce-reranker-base_v1",
67
- "model_revision": "v0.0.1",
68
- "quantizations": ["none"]
69
- }
70
- }
71
- }
72
- ]
73
- },
74
- {
75
- "version": 2,
76
- "model_name": "bge-reranker-v2-m3",
77
- "type": "normal",
78
- "language": ["en", "zh", "multilingual"],
79
- "max_tokens": 8192,
80
- "model_specs": [
81
- {
82
- "model_format": "pytorch",
83
- "model_src": {
84
- "huggingface": {
85
- "model_id": "BAAI/bge-reranker-v2-m3",
86
- "model_revision": "12e974610ba9083ed95f3edf08d7e899581f4de4",
87
- "quantizations": ["none"]
88
- },
89
- "modelscope": {
90
- "model_id": "AI-ModelScope/bge-reranker-v2-m3",
91
- "quantizations": ["none"]
92
- }
93
- }
94
- }
95
- ]
96
- },
97
- {
98
- "version": 2,
99
- "model_name": "bge-reranker-v2-gemma",
100
- "type": "LLM-based",
101
- "language": ["en", "zh", "multilingual"],
102
- "max_tokens": 8192,
103
- "model_specs": [
104
- {
105
- "model_format": "pytorch",
106
- "model_src": {
107
- "huggingface": {
108
- "model_id": "BAAI/bge-reranker-v2-gemma",
109
- "model_revision": "1787044f8b6fb740a9de4557c3a12377f84d9e17",
110
- "quantizations": ["none"]
111
- },
112
- "modelscope": {
113
- "model_id": "AI-ModelScope/bge-reranker-v2-gemma",
114
- "quantizations": ["none"]
115
- }
116
- }
117
- }
118
- ]
119
- },
120
- {
121
- "version": 2,
122
- "model_name": "bge-reranker-v2-minicpm-layerwise",
123
- "type": "LLM-based layerwise",
124
- "language": ["en", "zh", "multilingual"],
125
- "max_tokens": 2048,
126
- "model_specs": [
127
- {
128
- "model_format": "pytorch",
129
- "model_src": {
130
- "huggingface": {
131
- "model_id": "BAAI/bge-reranker-v2-minicpm-layerwise",
132
- "model_revision": "47b5332b296c4d8cb6ee2c60502cc62a0d708881",
133
- "quantizations": ["none"]
134
- },
135
- "modelscope": {
136
- "model_id": "mirror013/bge-reranker-v2-minicpm-layerwise",
137
- "quantizations": ["none"]
138
- }
139
- }
140
- }
141
- ]
142
- },
143
- {
144
- "version": 2,
145
- "model_name": "jina-reranker-v2",
146
- "type": "normal",
147
- "language": ["en", "zh", "multilingual"],
148
- "max_tokens": 1024,
149
- "model_specs": [
150
- {
151
- "model_format": "pytorch",
152
- "model_src": {
153
- "huggingface": {
154
- "model_id": "jinaai/jina-reranker-v2-base-multilingual",
155
- "model_revision": "298e48cada4a9318650d7fbd795f63827f884087",
156
- "quantizations": ["none"]
157
- }
158
- }
159
- }
160
- ]
161
- },
162
- {
163
- "version": 2,
164
- "model_name": "minicpm-reranker",
165
- "type": "normal",
166
- "language": ["en", "zh"],
167
- "max_tokens": 1024,
168
- "model_specs": [
169
- {
170
- "model_format": "pytorch",
171
- "model_src": {
172
- "huggingface": {
173
- "model_id": "openbmb/MiniCPM-Reranker",
174
- "model_revision": "5d2fd7345b6444c89d4c0fa59c92272888f3f2d0",
175
- "quantizations": ["none"]
176
- },
177
- "modelscope": {
178
- "model_id": "OpenBMB/MiniCPM-Reranker",
179
- "quantizations": ["none"]
180
- }
181
- }
182
- }
183
- ]
184
- },
185
- {
186
- "version": 2,
187
- "model_name": "Qwen3-Reranker-0.6B",
188
- "type": "normal",
189
- "language": ["en", "zh"],
190
- "max_tokens": 32768,
191
- "model_specs": [
192
- {
193
- "model_format": "pytorch",
194
- "model_src": {
195
- "huggingface": {
196
- "model_id": "Qwen/Qwen3-Reranker-0.6B",
197
- "model_revision": "6e9e69830b95c52b5fd889b7690dda3329508de3",
198
- "quantizations": ["none"]
199
- },
200
- "modelscope": {
201
- "model_id": "Qwen/Qwen3-Reranker-0.6B",
202
- "quantizations": ["none"]
203
- }
204
- }
205
- }
206
- ]
207
- },
208
- {
209
- "version": 2,
210
- "model_name": "Qwen3-Reranker-4B",
211
- "type": "normal",
212
- "language": ["en", "zh"],
213
- "max_tokens": 32768,
214
- "model_specs": [
215
- {
216
- "model_format": "pytorch",
217
- "model_src": {
218
- "huggingface": {
219
- "model_id": "Qwen/Qwen3-Reranker-4B",
220
- "model_revision": "f16fc5d5d2b9b1d0db8280929242745d79794ef5",
221
- "quantizations": ["none"]
222
- },
223
- "modelscope": {
224
- "model_id": "Qwen/Qwen3-Reranker-4B",
225
- "quantizations": ["none"]
226
- }
227
- }
228
- }
229
- ]
230
- },
231
- {
232
- "version": 2,
233
- "model_name": "Qwen3-Reranker-8B",
234
- "type": "normal",
235
- "language": ["en", "zh"],
236
- "max_tokens": 32768,
237
- "model_specs": [
238
- {
239
- "model_format": "pytorch",
240
- "model_src": {
241
- "huggingface": {
242
- "model_id": "Qwen/Qwen3-Reranker-8B",
243
- "model_revision": "5fa94080caafeaa45a15d11f969d7978e087a3db",
244
- "quantizations": ["none"]
245
- },
246
- "modelscope": {
247
- "model_id": "Qwen/Qwen3-Reranker-8B",
248
- "quantizations": ["none"]
249
- }
250
- }
251
- }
252
- ]
253
- }
2
+ {
3
+ "version": 2,
4
+ "model_name": "bge-reranker-large",
5
+ "type": "normal",
6
+ "language": [
7
+ "en",
8
+ "zh"
9
+ ],
10
+ "max_tokens": 512,
11
+ "model_specs": [
12
+ {
13
+ "model_format": "pytorch",
14
+ "model_src": {
15
+ "huggingface": {
16
+ "model_id": "BAAI/bge-reranker-large",
17
+ "model_revision": "27c9168d479987529781de8474dff94d69beca11",
18
+ "quantizations": [
19
+ "none"
20
+ ]
21
+ },
22
+ "modelscope": {
23
+ "model_id": "Xorbits/bge-reranker-large",
24
+ "model_revision": "v0.0.1",
25
+ "quantizations": [
26
+ "none"
27
+ ]
28
+ }
29
+ }
30
+ }
31
+ ]
32
+ },
33
+ {
34
+ "version": 2,
35
+ "model_name": "bge-reranker-base",
36
+ "type": "normal",
37
+ "language": [
38
+ "en",
39
+ "zh"
40
+ ],
41
+ "max_tokens": 512,
42
+ "model_specs": [
43
+ {
44
+ "model_format": "pytorch",
45
+ "model_src": {
46
+ "huggingface": {
47
+ "model_id": "BAAI/bge-reranker-base",
48
+ "model_revision": "465b4b7ddf2be0a020c8ad6e525b9bb1dbb708ae",
49
+ "quantizations": [
50
+ "none"
51
+ ]
52
+ },
53
+ "modelscope": {
54
+ "model_id": "Xorbits/bge-reranker-base",
55
+ "model_revision": "v0.0.1",
56
+ "quantizations": [
57
+ "none"
58
+ ]
59
+ }
60
+ }
61
+ }
62
+ ]
63
+ },
64
+ {
65
+ "version": 2,
66
+ "model_name": "bce-reranker-base_v1",
67
+ "type": "normal",
68
+ "language": [
69
+ "en",
70
+ "zh"
71
+ ],
72
+ "max_tokens": 512,
73
+ "model_specs": [
74
+ {
75
+ "model_format": "pytorch",
76
+ "model_src": {
77
+ "huggingface": {
78
+ "model_id": "maidalun1020/bce-reranker-base_v1",
79
+ "model_revision": "eaa31a577a0574e87a08959bd229ca14ce1b5496",
80
+ "quantizations": [
81
+ "none"
82
+ ]
83
+ },
84
+ "modelscope": {
85
+ "model_id": "maidalun/bce-reranker-base_v1",
86
+ "model_revision": "v0.0.1",
87
+ "quantizations": [
88
+ "none"
89
+ ]
90
+ }
91
+ }
92
+ }
93
+ ]
94
+ },
95
+ {
96
+ "version": 2,
97
+ "model_name": "bge-reranker-v2-m3",
98
+ "type": "normal",
99
+ "language": [
100
+ "en",
101
+ "zh",
102
+ "multilingual"
103
+ ],
104
+ "max_tokens": 8192,
105
+ "model_specs": [
106
+ {
107
+ "model_format": "pytorch",
108
+ "model_src": {
109
+ "huggingface": {
110
+ "model_id": "BAAI/bge-reranker-v2-m3",
111
+ "model_revision": "12e974610ba9083ed95f3edf08d7e899581f4de4",
112
+ "quantizations": [
113
+ "none"
114
+ ]
115
+ },
116
+ "modelscope": {
117
+ "model_id": "AI-ModelScope/bge-reranker-v2-m3",
118
+ "quantizations": [
119
+ "none"
120
+ ]
121
+ }
122
+ }
123
+ }
124
+ ]
125
+ },
126
+ {
127
+ "version": 2,
128
+ "model_name": "bge-reranker-v2-gemma",
129
+ "type": "LLM-based",
130
+ "language": [
131
+ "en",
132
+ "zh",
133
+ "multilingual"
134
+ ],
135
+ "max_tokens": 8192,
136
+ "model_specs": [
137
+ {
138
+ "model_format": "pytorch",
139
+ "model_src": {
140
+ "huggingface": {
141
+ "model_id": "BAAI/bge-reranker-v2-gemma",
142
+ "model_revision": "1787044f8b6fb740a9de4557c3a12377f84d9e17",
143
+ "quantizations": [
144
+ "none"
145
+ ]
146
+ },
147
+ "modelscope": {
148
+ "model_id": "AI-ModelScope/bge-reranker-v2-gemma",
149
+ "quantizations": [
150
+ "none"
151
+ ]
152
+ }
153
+ }
154
+ }
155
+ ]
156
+ },
157
+ {
158
+ "version": 2,
159
+ "model_name": "bge-reranker-v2-minicpm-layerwise",
160
+ "type": "LLM-based layerwise",
161
+ "language": [
162
+ "en",
163
+ "zh",
164
+ "multilingual"
165
+ ],
166
+ "max_tokens": 2048,
167
+ "model_specs": [
168
+ {
169
+ "model_format": "pytorch",
170
+ "model_src": {
171
+ "huggingface": {
172
+ "model_id": "BAAI/bge-reranker-v2-minicpm-layerwise",
173
+ "model_revision": "47b5332b296c4d8cb6ee2c60502cc62a0d708881",
174
+ "quantizations": [
175
+ "none"
176
+ ]
177
+ },
178
+ "modelscope": {
179
+ "model_id": "mirror013/bge-reranker-v2-minicpm-layerwise",
180
+ "quantizations": [
181
+ "none"
182
+ ]
183
+ }
184
+ }
185
+ }
186
+ ]
187
+ },
188
+ {
189
+ "version": 2,
190
+ "model_name": "jina-reranker-v2",
191
+ "type": "normal",
192
+ "language": [
193
+ "en",
194
+ "zh",
195
+ "multilingual"
196
+ ],
197
+ "max_tokens": 1024,
198
+ "model_specs": [
199
+ {
200
+ "model_format": "pytorch",
201
+ "model_src": {
202
+ "huggingface": {
203
+ "model_id": "jinaai/jina-reranker-v2-base-multilingual",
204
+ "model_revision": "298e48cada4a9318650d7fbd795f63827f884087",
205
+ "quantizations": [
206
+ "none"
207
+ ]
208
+ },
209
+ "modelscope": {
210
+ "model_id": "jinaai/jina-reranker-v2-base-multilingual",
211
+ "quantizations": [
212
+ "none"
213
+ ]
214
+ }
215
+ }
216
+ }
217
+ ]
218
+ },
219
+ {
220
+ "version": 2,
221
+ "model_name": "minicpm-reranker",
222
+ "type": "normal",
223
+ "language": [
224
+ "en",
225
+ "zh"
226
+ ],
227
+ "max_tokens": 1024,
228
+ "model_specs": [
229
+ {
230
+ "model_format": "pytorch",
231
+ "model_src": {
232
+ "huggingface": {
233
+ "model_id": "openbmb/MiniCPM-Reranker",
234
+ "model_revision": "5d2fd7345b6444c89d4c0fa59c92272888f3f2d0",
235
+ "quantizations": [
236
+ "none"
237
+ ]
238
+ },
239
+ "modelscope": {
240
+ "model_id": "OpenBMB/MiniCPM-Reranker",
241
+ "quantizations": [
242
+ "none"
243
+ ]
244
+ }
245
+ }
246
+ }
247
+ ]
248
+ },
249
+ {
250
+ "version": 2,
251
+ "model_name": "Qwen3-Reranker-0.6B",
252
+ "type": "normal",
253
+ "language": [
254
+ "en",
255
+ "zh"
256
+ ],
257
+ "max_tokens": 32768,
258
+ "model_specs": [
259
+ {
260
+ "model_format": "pytorch",
261
+ "model_src": {
262
+ "huggingface": {
263
+ "model_id": "Qwen/Qwen3-Reranker-0.6B",
264
+ "model_revision": "6e9e69830b95c52b5fd889b7690dda3329508de3",
265
+ "quantizations": [
266
+ "none"
267
+ ]
268
+ },
269
+ "modelscope": {
270
+ "model_id": "Qwen/Qwen3-Reranker-0.6B",
271
+ "quantizations": [
272
+ "none"
273
+ ]
274
+ }
275
+ }
276
+ }
277
+ ]
278
+ },
279
+ {
280
+ "version": 2,
281
+ "model_name": "Qwen3-Reranker-4B",
282
+ "type": "normal",
283
+ "language": [
284
+ "en",
285
+ "zh"
286
+ ],
287
+ "max_tokens": 32768,
288
+ "model_specs": [
289
+ {
290
+ "model_format": "pytorch",
291
+ "model_src": {
292
+ "huggingface": {
293
+ "model_id": "Qwen/Qwen3-Reranker-4B",
294
+ "model_revision": "f16fc5d5d2b9b1d0db8280929242745d79794ef5",
295
+ "quantizations": [
296
+ "none"
297
+ ]
298
+ },
299
+ "modelscope": {
300
+ "model_id": "Qwen/Qwen3-Reranker-4B",
301
+ "quantizations": [
302
+ "none"
303
+ ]
304
+ }
305
+ }
306
+ }
307
+ ]
308
+ },
309
+ {
310
+ "version": 2,
311
+ "model_name": "Qwen3-Reranker-8B",
312
+ "type": "normal",
313
+ "language": [
314
+ "en",
315
+ "zh"
316
+ ],
317
+ "max_tokens": 32768,
318
+ "model_specs": [
319
+ {
320
+ "model_format": "pytorch",
321
+ "model_src": {
322
+ "huggingface": {
323
+ "model_id": "Qwen/Qwen3-Reranker-8B",
324
+ "model_revision": "5fa94080caafeaa45a15d11f969d7978e087a3db",
325
+ "quantizations": [
326
+ "none"
327
+ ]
328
+ },
329
+ "modelscope": {
330
+ "model_id": "Qwen/Qwen3-Reranker-8B",
331
+ "quantizations": [
332
+ "none"
333
+ ]
334
+ }
335
+ }
336
+ }
337
+ ]
338
+ },
339
+ {
340
+ "version": 2,
341
+ "model_name": "jina-reranker-v3",
342
+ "type": "normal",
343
+ "language": [
344
+ "en",
345
+ "zh",
346
+ "multilingual"
347
+ ],
348
+ "max_tokens": 131072,
349
+ "model_specs": [
350
+ {
351
+ "model_format": "pytorch",
352
+ "model_src": {
353
+ "huggingface": {
354
+ "model_id": "jinaai/jina-reranker-v3",
355
+ "model_revision": "7fa51ea4da62cb1b13ac263a1a41e20962a36c81",
356
+ "quantizations": [
357
+ "none"
358
+ ]
359
+ },
360
+ "modelscope": {
361
+ "model_id": "jinaai/jina-reranker-v3",
362
+ "quantizations": [
363
+ "none"
364
+ ]
365
+ }
366
+ }
367
+ }
368
+ ]
369
+ }
254
370
  ]