xinference 1.7.1__py3-none-any.whl → 1.8.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of xinference might be problematic. Click here for more details.

Files changed (136) hide show
  1. xinference/_version.py +3 -3
  2. xinference/client/restful/async_restful_client.py +8 -13
  3. xinference/client/restful/restful_client.py +6 -2
  4. xinference/core/chat_interface.py +6 -4
  5. xinference/core/media_interface.py +5 -0
  6. xinference/core/model.py +1 -5
  7. xinference/core/supervisor.py +117 -68
  8. xinference/core/worker.py +49 -37
  9. xinference/deploy/test/test_cmdline.py +2 -6
  10. xinference/model/audio/__init__.py +26 -23
  11. xinference/model/audio/chattts.py +3 -2
  12. xinference/model/audio/core.py +49 -98
  13. xinference/model/audio/cosyvoice.py +3 -2
  14. xinference/model/audio/custom.py +28 -73
  15. xinference/model/audio/f5tts.py +3 -2
  16. xinference/model/audio/f5tts_mlx.py +3 -2
  17. xinference/model/audio/fish_speech.py +3 -2
  18. xinference/model/audio/funasr.py +17 -4
  19. xinference/model/audio/kokoro.py +3 -2
  20. xinference/model/audio/megatts.py +3 -2
  21. xinference/model/audio/melotts.py +3 -2
  22. xinference/model/audio/model_spec.json +572 -171
  23. xinference/model/audio/utils.py +0 -6
  24. xinference/model/audio/whisper.py +3 -2
  25. xinference/model/audio/whisper_mlx.py +3 -2
  26. xinference/model/cache_manager.py +141 -0
  27. xinference/model/core.py +6 -49
  28. xinference/model/custom.py +174 -0
  29. xinference/model/embedding/__init__.py +67 -56
  30. xinference/model/embedding/cache_manager.py +35 -0
  31. xinference/model/embedding/core.py +104 -84
  32. xinference/model/embedding/custom.py +55 -78
  33. xinference/model/embedding/embed_family.py +80 -31
  34. xinference/model/embedding/flag/core.py +21 -5
  35. xinference/model/embedding/llama_cpp/__init__.py +0 -0
  36. xinference/model/embedding/llama_cpp/core.py +234 -0
  37. xinference/model/embedding/model_spec.json +968 -103
  38. xinference/model/embedding/sentence_transformers/core.py +30 -20
  39. xinference/model/embedding/vllm/core.py +11 -5
  40. xinference/model/flexible/__init__.py +8 -2
  41. xinference/model/flexible/core.py +26 -119
  42. xinference/model/flexible/custom.py +69 -0
  43. xinference/model/flexible/launchers/image_process_launcher.py +1 -0
  44. xinference/model/flexible/launchers/modelscope_launcher.py +5 -1
  45. xinference/model/flexible/launchers/transformers_launcher.py +15 -3
  46. xinference/model/flexible/launchers/yolo_launcher.py +5 -1
  47. xinference/model/image/__init__.py +20 -20
  48. xinference/model/image/cache_manager.py +62 -0
  49. xinference/model/image/core.py +70 -182
  50. xinference/model/image/custom.py +28 -72
  51. xinference/model/image/model_spec.json +402 -119
  52. xinference/model/image/ocr/got_ocr2.py +3 -2
  53. xinference/model/image/stable_diffusion/core.py +22 -7
  54. xinference/model/image/stable_diffusion/mlx.py +6 -6
  55. xinference/model/image/utils.py +2 -2
  56. xinference/model/llm/__init__.py +71 -94
  57. xinference/model/llm/cache_manager.py +292 -0
  58. xinference/model/llm/core.py +37 -111
  59. xinference/model/llm/custom.py +88 -0
  60. xinference/model/llm/llama_cpp/core.py +5 -7
  61. xinference/model/llm/llm_family.json +16260 -8151
  62. xinference/model/llm/llm_family.py +138 -839
  63. xinference/model/llm/lmdeploy/core.py +5 -7
  64. xinference/model/llm/memory.py +3 -4
  65. xinference/model/llm/mlx/core.py +6 -8
  66. xinference/model/llm/reasoning_parser.py +3 -1
  67. xinference/model/llm/sglang/core.py +32 -14
  68. xinference/model/llm/transformers/chatglm.py +3 -7
  69. xinference/model/llm/transformers/core.py +49 -27
  70. xinference/model/llm/transformers/deepseek_v2.py +2 -2
  71. xinference/model/llm/transformers/gemma3.py +2 -2
  72. xinference/model/llm/transformers/multimodal/cogagent.py +2 -2
  73. xinference/model/llm/transformers/multimodal/deepseek_vl2.py +2 -2
  74. xinference/model/llm/transformers/multimodal/gemma3.py +2 -2
  75. xinference/model/llm/transformers/multimodal/glm4_1v.py +167 -0
  76. xinference/model/llm/transformers/multimodal/glm4v.py +2 -2
  77. xinference/model/llm/transformers/multimodal/intern_vl.py +2 -2
  78. xinference/model/llm/transformers/multimodal/minicpmv26.py +3 -3
  79. xinference/model/llm/transformers/multimodal/ovis2.py +2 -2
  80. xinference/model/llm/transformers/multimodal/qwen-omni.py +2 -2
  81. xinference/model/llm/transformers/multimodal/qwen2_audio.py +2 -2
  82. xinference/model/llm/transformers/multimodal/qwen2_vl.py +2 -2
  83. xinference/model/llm/transformers/opt.py +3 -7
  84. xinference/model/llm/utils.py +34 -49
  85. xinference/model/llm/vllm/core.py +77 -27
  86. xinference/model/llm/vllm/xavier/engine.py +5 -3
  87. xinference/model/llm/vllm/xavier/scheduler.py +10 -6
  88. xinference/model/llm/vllm/xavier/transfer.py +1 -1
  89. xinference/model/rerank/__init__.py +26 -25
  90. xinference/model/rerank/core.py +47 -87
  91. xinference/model/rerank/custom.py +25 -71
  92. xinference/model/rerank/model_spec.json +158 -33
  93. xinference/model/rerank/utils.py +2 -2
  94. xinference/model/utils.py +115 -54
  95. xinference/model/video/__init__.py +13 -17
  96. xinference/model/video/core.py +44 -102
  97. xinference/model/video/diffusers.py +4 -3
  98. xinference/model/video/model_spec.json +90 -21
  99. xinference/types.py +5 -3
  100. xinference/web/ui/build/asset-manifest.json +3 -3
  101. xinference/web/ui/build/index.html +1 -1
  102. xinference/web/ui/build/static/js/main.7d24df53.js +3 -0
  103. xinference/web/ui/build/static/js/main.7d24df53.js.map +1 -0
  104. xinference/web/ui/node_modules/.cache/babel-loader/2704ff66a5f73ca78b341eb3edec60154369df9d87fbc8c6dd60121abc5e1b0a.json +1 -0
  105. xinference/web/ui/node_modules/.cache/babel-loader/607dfef23d33e6b594518c0c6434567639f24f356b877c80c60575184ec50ed0.json +1 -0
  106. xinference/web/ui/node_modules/.cache/babel-loader/9be3d56173aacc3efd0b497bcb13c4f6365de30069176ee9403b40e717542326.json +1 -0
  107. xinference/web/ui/node_modules/.cache/babel-loader/9f9dd6c32c78a222d07da5987ae902effe16bcf20aac00774acdccc4de3c9ff2.json +1 -0
  108. xinference/web/ui/node_modules/.cache/babel-loader/b2ab5ee972c60d15eb9abf5845705f8ab7e1d125d324d9a9b1bcae5d6fd7ffb2.json +1 -0
  109. xinference/web/ui/src/locales/en.json +0 -1
  110. xinference/web/ui/src/locales/ja.json +0 -1
  111. xinference/web/ui/src/locales/ko.json +0 -1
  112. xinference/web/ui/src/locales/zh.json +0 -1
  113. {xinference-1.7.1.dist-info → xinference-1.8.0.dist-info}/METADATA +9 -11
  114. {xinference-1.7.1.dist-info → xinference-1.8.0.dist-info}/RECORD +119 -119
  115. xinference/model/audio/model_spec_modelscope.json +0 -231
  116. xinference/model/embedding/model_spec_modelscope.json +0 -293
  117. xinference/model/embedding/utils.py +0 -18
  118. xinference/model/image/model_spec_modelscope.json +0 -375
  119. xinference/model/llm/llama_cpp/memory.py +0 -457
  120. xinference/model/llm/llm_family_csghub.json +0 -56
  121. xinference/model/llm/llm_family_modelscope.json +0 -8700
  122. xinference/model/llm/llm_family_openmind_hub.json +0 -1019
  123. xinference/model/rerank/model_spec_modelscope.json +0 -85
  124. xinference/model/video/model_spec_modelscope.json +0 -184
  125. xinference/web/ui/build/static/js/main.9b12b7f9.js +0 -3
  126. xinference/web/ui/build/static/js/main.9b12b7f9.js.map +0 -1
  127. xinference/web/ui/node_modules/.cache/babel-loader/1460361af6975e63576708039f1cb732faf9c672d97c494d4055fc6331460be0.json +0 -1
  128. xinference/web/ui/node_modules/.cache/babel-loader/4efd8dda58fda83ed9546bf2f587df67f8d98e639117bee2d9326a9a1d9bebb2.json +0 -1
  129. xinference/web/ui/node_modules/.cache/babel-loader/55b9fb40b57fa926e8f05f31c2f96467e76e5ad62f033dca97c03f9e8c4eb4fe.json +0 -1
  130. xinference/web/ui/node_modules/.cache/babel-loader/5b2dafe5aa9e1105e0244a2b6751807342fa86aa0144b4e84d947a1686102715.json +0 -1
  131. xinference/web/ui/node_modules/.cache/babel-loader/611fa2c6c53b66039991d06dfb0473b5ab37fc63b4564e0f6e1718523768a045.json +0 -1
  132. /xinference/web/ui/build/static/js/{main.9b12b7f9.js.LICENSE.txt → main.7d24df53.js.LICENSE.txt} +0 -0
  133. {xinference-1.7.1.dist-info → xinference-1.8.0.dist-info}/WHEEL +0 -0
  134. {xinference-1.7.1.dist-info → xinference-1.8.0.dist-info}/entry_points.txt +0 -0
  135. {xinference-1.7.1.dist-info → xinference-1.8.0.dist-info}/licenses/LICENSE +0 -0
  136. {xinference-1.7.1.dist-info → xinference-1.8.0.dist-info}/top_level.txt +0 -0
@@ -1,281 +1,1109 @@
1
1
  [
2
2
  {
3
+ "version": 2,
3
4
  "model_name": "bge-large-en",
4
5
  "dimensions": 1024,
5
6
  "max_tokens": 512,
6
- "language": ["en"],
7
- "model_id": "BAAI/bge-large-en",
8
- "model_revision": "d57a0d82f0d0884de76bbce093f201364d9b720e"
7
+ "language": [
8
+ "en"
9
+ ],
10
+ "model_specs": [
11
+ {
12
+ "model_format": "pytorch",
13
+ "model_src": {
14
+ "huggingface": {
15
+ "model_id": "BAAI/bge-large-en",
16
+ "model_revision": "d57a0d82f0d0884de76bbce093f201364d9b720e",
17
+ "quantizations": [
18
+ "none"
19
+ ]
20
+ },
21
+ "modelscope": {
22
+ "model_id": "Xorbits/bge-large-en",
23
+ "model_revision": "v0.0.1",
24
+ "quantizations": [
25
+ "none"
26
+ ]
27
+ }
28
+ }
29
+ }
30
+ ]
9
31
  },
10
32
  {
33
+ "version": 2,
11
34
  "model_name": "bge-base-en",
12
35
  "dimensions": 768,
13
36
  "max_tokens": 512,
14
- "language": ["en"],
15
- "model_id": "BAAI/bge-base-en",
16
- "model_revision": "90e113f4f9cd0c83220c873b94ca7bc37f85de97"
37
+ "language": [
38
+ "en"
39
+ ],
40
+ "model_specs": [
41
+ {
42
+ "model_format": "pytorch",
43
+ "model_src": {
44
+ "huggingface": {
45
+ "model_id": "BAAI/bge-base-en",
46
+ "model_revision": "90e113f4f9cd0c83220c873b94ca7bc37f85de97",
47
+ "quantizations": [
48
+ "none"
49
+ ]
50
+ },
51
+ "modelscope": {
52
+ "model_id": "Xorbits/bge-base-en",
53
+ "model_revision": "v0.0.1",
54
+ "quantizations": [
55
+ "none"
56
+ ]
57
+ }
58
+ }
59
+ }
60
+ ]
17
61
  },
18
62
  {
63
+ "version": 2,
19
64
  "model_name": "gte-large",
20
65
  "dimensions": 1024,
21
66
  "max_tokens": 512,
22
- "language": ["en"],
23
- "model_id": "thenlper/gte-large",
24
- "model_revision": "2b5163b62ed28492dc70eb19a882b71c81dbc7c8"
67
+ "language": [
68
+ "en"
69
+ ],
70
+ "model_specs": [
71
+ {
72
+ "model_format": "pytorch",
73
+ "model_src": {
74
+ "huggingface": {
75
+ "model_id": "thenlper/gte-large",
76
+ "model_revision": "2b5163b62ed28492dc70eb19a882b71c81dbc7c8",
77
+ "quantizations": [
78
+ "none"
79
+ ]
80
+ },
81
+ "modelscope": {
82
+ "model_id": "Xorbits/gte-large",
83
+ "model_revision": "v0.0.1",
84
+ "quantizations": [
85
+ "none"
86
+ ]
87
+ }
88
+ }
89
+ }
90
+ ]
25
91
  },
26
92
  {
93
+ "version": 2,
27
94
  "model_name": "gte-base",
28
95
  "dimensions": 768,
29
96
  "max_tokens": 512,
30
- "language": ["en"],
31
- "model_id": "thenlper/gte-base",
32
- "model_revision": "792749e8178be77f479b26788a0e1adb4ec9c8a9"
97
+ "language": [
98
+ "en"
99
+ ],
100
+ "model_specs": [
101
+ {
102
+ "model_format": "pytorch",
103
+ "model_src": {
104
+ "huggingface": {
105
+ "model_id": "thenlper/gte-base",
106
+ "model_revision": "792749e8178be77f479b26788a0e1adb4ec9c8a9",
107
+ "quantizations": [
108
+ "none"
109
+ ]
110
+ },
111
+ "modelscope": {
112
+ "model_id": "Xorbits/gte-base",
113
+ "model_revision": "v0.0.1",
114
+ "quantizations": [
115
+ "none"
116
+ ]
117
+ }
118
+ }
119
+ }
120
+ ]
33
121
  },
34
122
  {
123
+ "version": 2,
35
124
  "model_name": "e5-large-v2",
36
125
  "dimensions": 1024,
37
126
  "max_tokens": 512,
38
- "language": ["en"],
39
- "model_id": "intfloat/e5-large-v2",
40
- "model_revision": "b322e09026e4ea05f42beadf4d661fb4e101d311"
127
+ "language": [
128
+ "en"
129
+ ],
130
+ "model_specs": [
131
+ {
132
+ "model_format": "pytorch",
133
+ "model_src": {
134
+ "huggingface": {
135
+ "model_id": "intfloat/e5-large-v2",
136
+ "model_revision": "b322e09026e4ea05f42beadf4d661fb4e101d311",
137
+ "quantizations": [
138
+ "none"
139
+ ]
140
+ },
141
+ "modelscope": {
142
+ "model_id": "Xorbits/e5-large-v2",
143
+ "model_revision": "v0.0.1",
144
+ "quantizations": [
145
+ "none"
146
+ ]
147
+ }
148
+ }
149
+ }
150
+ ]
41
151
  },
42
152
  {
153
+ "version": 2,
43
154
  "model_name": "bge-large-zh",
44
155
  "dimensions": 1024,
45
156
  "max_tokens": 512,
46
- "language": ["zh"],
47
- "model_id": "BAAI/bge-large-zh",
48
- "model_revision": "1b543b301eb63dd32914b56d939db2a972df15d5"
157
+ "language": [
158
+ "zh"
159
+ ],
160
+ "model_specs": [
161
+ {
162
+ "model_format": "pytorch",
163
+ "model_src": {
164
+ "huggingface": {
165
+ "model_id": "BAAI/bge-large-zh",
166
+ "model_revision": "1b543b301eb63dd32914b56d939db2a972df15d5",
167
+ "quantizations": [
168
+ "none"
169
+ ]
170
+ },
171
+ "modelscope": {
172
+ "model_id": "Xorbits/bge-large-zh",
173
+ "model_revision": "v0.0.1",
174
+ "quantizations": [
175
+ "none"
176
+ ]
177
+ }
178
+ }
179
+ }
180
+ ]
49
181
  },
50
182
  {
183
+ "version": 2,
51
184
  "model_name": "bge-large-zh-noinstruct",
52
185
  "dimensions": 1024,
53
186
  "max_tokens": 512,
54
- "language": ["zh"],
55
- "model_id": "BAAI/bge-large-zh-noinstruct",
56
- "model_revision": "d971248454d6267756fab9caa431c2c2fc5f0f35"
187
+ "language": [
188
+ "zh"
189
+ ],
190
+ "model_specs": [
191
+ {
192
+ "model_format": "pytorch",
193
+ "model_src": {
194
+ "huggingface": {
195
+ "model_id": "BAAI/bge-large-zh-noinstruct",
196
+ "model_revision": "d971248454d6267756fab9caa431c2c2fc5f0f35",
197
+ "quantizations": [
198
+ "none"
199
+ ]
200
+ },
201
+ "modelscope": {
202
+ "model_id": "Xorbits/bge-large-zh-noinstruct",
203
+ "model_revision": "v0.0.1",
204
+ "quantizations": [
205
+ "none"
206
+ ]
207
+ }
208
+ }
209
+ }
210
+ ]
57
211
  },
58
212
  {
213
+ "version": 2,
59
214
  "model_name": "bge-base-zh",
60
215
  "dimensions": 768,
61
216
  "max_tokens": 512,
62
- "language": ["zh"],
63
- "model_id": "BAAI/bge-base-zh",
64
- "model_revision": "faefe5952238b3d28bc35d1c8fe63eb269d8cee0"
217
+ "language": [
218
+ "zh"
219
+ ],
220
+ "model_specs": [
221
+ {
222
+ "model_format": "pytorch",
223
+ "model_src": {
224
+ "huggingface": {
225
+ "model_id": "BAAI/bge-base-zh",
226
+ "model_revision": "faefe5952238b3d28bc35d1c8fe63eb269d8cee0",
227
+ "quantizations": [
228
+ "none"
229
+ ]
230
+ },
231
+ "modelscope": {
232
+ "model_id": "Xorbits/bge-base-zh",
233
+ "model_revision": "v0.0.2",
234
+ "quantizations": [
235
+ "none"
236
+ ]
237
+ }
238
+ }
239
+ }
240
+ ]
65
241
  },
66
242
  {
243
+ "version": 2,
67
244
  "model_name": "multilingual-e5-large",
68
245
  "dimensions": 1024,
69
246
  "max_tokens": 514,
70
- "language": ["zh"],
71
- "model_id": "intfloat/multilingual-e5-large",
72
- "model_revision": "c505dce3578a12ec54e47bdc72bef5cd0eacb085"
247
+ "language": [
248
+ "zh"
249
+ ],
250
+ "model_specs": [
251
+ {
252
+ "model_format": "pytorch",
253
+ "model_src": {
254
+ "huggingface": {
255
+ "model_id": "intfloat/multilingual-e5-large",
256
+ "model_revision": "c505dce3578a12ec54e47bdc72bef5cd0eacb085",
257
+ "quantizations": [
258
+ "none"
259
+ ]
260
+ },
261
+ "modelscope": {
262
+ "model_id": "Xorbits/multilingual-e5-large",
263
+ "model_revision": "v0.0.1",
264
+ "quantizations": [
265
+ "none"
266
+ ]
267
+ }
268
+ }
269
+ }
270
+ ]
73
271
  },
74
272
  {
273
+ "version": 2,
75
274
  "model_name": "bge-small-zh",
76
275
  "dimensions": 512,
77
276
  "max_tokens": 512,
78
- "language": ["zh"],
79
- "model_id": "BAAI/bge-small-zh",
80
- "model_revision": "52185a5f4aa5bb1fe80c0671b7303161880a2d79"
277
+ "language": [
278
+ "zh"
279
+ ],
280
+ "model_specs": [
281
+ {
282
+ "model_format": "pytorch",
283
+ "model_src": {
284
+ "huggingface": {
285
+ "model_id": "BAAI/bge-small-zh",
286
+ "model_revision": "52185a5f4aa5bb1fe80c0671b7303161880a2d79",
287
+ "quantizations": [
288
+ "none"
289
+ ]
290
+ },
291
+ "modelscope": {
292
+ "model_id": "Xorbits/bge-small-zh",
293
+ "model_revision": "v0.0.1",
294
+ "quantizations": [
295
+ "none"
296
+ ]
297
+ }
298
+ }
299
+ }
300
+ ]
81
301
  },
82
302
  {
303
+ "version": 2,
83
304
  "model_name": "bge-small-zh-v1.5",
84
305
  "dimensions": 512,
85
306
  "max_tokens": 512,
86
- "language": ["zh"],
87
- "model_id": "BAAI/bge-small-zh-v1.5",
88
- "model_revision": "a7ec18349c42fc774b0e86af26215e38a10fbe9d"
307
+ "language": [
308
+ "zh"
309
+ ],
310
+ "model_specs": [
311
+ {
312
+ "model_format": "pytorch",
313
+ "model_src": {
314
+ "huggingface": {
315
+ "model_id": "BAAI/bge-small-zh-v1.5",
316
+ "model_revision": "a7ec18349c42fc774b0e86af26215e38a10fbe9d",
317
+ "quantizations": [
318
+ "none"
319
+ ]
320
+ },
321
+ "modelscope": {
322
+ "model_id": "Xorbits/bge-small-zh-v1.5",
323
+ "model_revision": "v0.0.2",
324
+ "quantizations": [
325
+ "none"
326
+ ]
327
+ }
328
+ }
329
+ }
330
+ ]
89
331
  },
90
332
  {
333
+ "version": 2,
91
334
  "model_name": "bge-base-zh-v1.5",
92
335
  "dimensions": 768,
93
336
  "max_tokens": 512,
94
- "language": ["zh"],
95
- "model_id": "BAAI/bge-base-zh-v1.5",
96
- "model_revision": "fcd022c36ff982da395e71ae930a5ad0d4b9330f"
337
+ "language": [
338
+ "zh"
339
+ ],
340
+ "model_specs": [
341
+ {
342
+ "model_format": "pytorch",
343
+ "model_src": {
344
+ "huggingface": {
345
+ "model_id": "BAAI/bge-base-zh-v1.5",
346
+ "model_revision": "fcd022c36ff982da395e71ae930a5ad0d4b9330f",
347
+ "quantizations": [
348
+ "none"
349
+ ]
350
+ },
351
+ "modelscope": {
352
+ "model_id": "Xorbits/bge-base-zh-v1.5",
353
+ "model_revision": "v0.0.1",
354
+ "quantizations": [
355
+ "none"
356
+ ]
357
+ }
358
+ }
359
+ }
360
+ ]
97
361
  },
98
362
  {
363
+ "version": 2,
99
364
  "model_name": "bge-large-zh-v1.5",
100
365
  "dimensions": 1024,
101
366
  "max_tokens": 512,
102
- "language": ["zh"],
103
- "model_id": "BAAI/bge-large-zh-v1.5",
104
- "model_revision": "029c4bfff6b0c5cfcd20b40c17ed52ec55202748"
367
+ "language": [
368
+ "zh"
369
+ ],
370
+ "model_specs": [
371
+ {
372
+ "model_format": "pytorch",
373
+ "model_src": {
374
+ "huggingface": {
375
+ "model_id": "BAAI/bge-large-zh-v1.5",
376
+ "model_revision": "029c4bfff6b0c5cfcd20b40c17ed52ec55202748",
377
+ "quantizations": [
378
+ "none"
379
+ ]
380
+ },
381
+ "modelscope": {
382
+ "model_id": "Xorbits/bge-large-zh-v1.5",
383
+ "model_revision": "v0.0.1",
384
+ "quantizations": [
385
+ "none"
386
+ ]
387
+ }
388
+ }
389
+ }
390
+ ]
105
391
  },
106
392
  {
393
+ "version": 2,
107
394
  "model_name": "bge-small-en-v1.5",
108
395
  "dimensions": 384,
109
396
  "max_tokens": 512,
110
- "language": ["en"],
111
- "model_id": "BAAI/bge-small-en-v1.5",
112
- "model_revision": "88885630388d6249d876a3ab145b78b34665b79a"
397
+ "language": [
398
+ "en"
399
+ ],
400
+ "model_specs": [
401
+ {
402
+ "model_format": "pytorch",
403
+ "model_src": {
404
+ "huggingface": {
405
+ "model_id": "BAAI/bge-small-en-v1.5",
406
+ "model_revision": "88885630388d6249d876a3ab145b78b34665b79a",
407
+ "quantizations": [
408
+ "none"
409
+ ]
410
+ },
411
+ "modelscope": {
412
+ "model_id": "Xorbits/bge-small-en-v1.5",
413
+ "model_revision": "v0.0.2",
414
+ "quantizations": [
415
+ "none"
416
+ ]
417
+ }
418
+ }
419
+ }
420
+ ]
113
421
  },
114
422
  {
423
+ "version": 2,
115
424
  "model_name": "bge-base-en-v1.5",
116
425
  "dimensions": 768,
117
426
  "max_tokens": 512,
118
- "language": ["en"],
119
- "model_id": "BAAI/bge-base-en-v1.5",
120
- "model_revision": "1dafa38af496bee39ad5e0d11447fac46d0714e1"
427
+ "language": [
428
+ "en"
429
+ ],
430
+ "model_specs": [
431
+ {
432
+ "model_format": "pytorch",
433
+ "model_src": {
434
+ "huggingface": {
435
+ "model_id": "BAAI/bge-base-en-v1.5",
436
+ "model_revision": "1dafa38af496bee39ad5e0d11447fac46d0714e1",
437
+ "quantizations": [
438
+ "none"
439
+ ]
440
+ },
441
+ "modelscope": {
442
+ "model_id": "Xorbits/bge-base-en-v1.5",
443
+ "model_revision": "v0.0.1",
444
+ "quantizations": [
445
+ "none"
446
+ ]
447
+ }
448
+ }
449
+ }
450
+ ]
121
451
  },
122
452
  {
453
+ "version": 2,
123
454
  "model_name": "bge-large-en-v1.5",
124
455
  "dimensions": 1024,
125
456
  "max_tokens": 512,
126
- "language": ["en"],
127
- "model_id": "BAAI/bge-large-en-v1.5",
128
- "model_revision": "5888da4a3a013e65d33dd6f612ecd4625eb87a7d"
457
+ "language": [
458
+ "en"
459
+ ],
460
+ "model_specs": [
461
+ {
462
+ "model_format": "pytorch",
463
+ "model_src": {
464
+ "huggingface": {
465
+ "model_id": "BAAI/bge-large-en-v1.5",
466
+ "model_revision": "5888da4a3a013e65d33dd6f612ecd4625eb87a7d",
467
+ "quantizations": [
468
+ "none"
469
+ ]
470
+ },
471
+ "modelscope": {
472
+ "model_id": "Xorbits/bge-large-en-v1.5",
473
+ "model_revision": "v0.0.1",
474
+ "quantizations": [
475
+ "none"
476
+ ]
477
+ }
478
+ }
479
+ }
480
+ ]
129
481
  },
130
482
  {
483
+ "version": 2,
131
484
  "model_name": "jina-embeddings-v2-small-en",
132
485
  "dimensions": 512,
133
486
  "max_tokens": 8192,
134
- "language": ["en"],
135
- "model_id": "jinaai/jina-embeddings-v2-small-en",
136
- "model_revision": "b811f03af3d4d7ea72a7c25c802b21fc675a5d99"
487
+ "language": [
488
+ "en"
489
+ ],
490
+ "model_specs": [
491
+ {
492
+ "model_format": "pytorch",
493
+ "model_src": {
494
+ "huggingface": {
495
+ "model_id": "jinaai/jina-embeddings-v2-small-en",
496
+ "model_revision": "b811f03af3d4d7ea72a7c25c802b21fc675a5d99",
497
+ "quantizations": [
498
+ "none"
499
+ ]
500
+ },
501
+ "modelscope": {
502
+ "model_id": "Xorbits/jina-embeddings-v2-small-en",
503
+ "model_revision": "v0.0.1",
504
+ "quantizations": [
505
+ "none"
506
+ ]
507
+ }
508
+ }
509
+ }
510
+ ]
137
511
  },
138
512
  {
513
+ "version": 2,
139
514
  "model_name": "jina-embeddings-v2-base-en",
140
515
  "dimensions": 512,
141
516
  "max_tokens": 8192,
142
- "language": ["en"],
143
- "model_id": "jinaai/jina-embeddings-v2-base-en",
144
- "model_revision": "7302ac470bed880590f9344bfeee32ff8722d0e5"
517
+ "language": [
518
+ "en"
519
+ ],
520
+ "model_specs": [
521
+ {
522
+ "model_format": "pytorch",
523
+ "model_src": {
524
+ "huggingface": {
525
+ "model_id": "jinaai/jina-embeddings-v2-base-en",
526
+ "model_revision": "7302ac470bed880590f9344bfeee32ff8722d0e5",
527
+ "quantizations": [
528
+ "none"
529
+ ]
530
+ },
531
+ "modelscope": {
532
+ "model_id": "Xorbits/jina-embeddings-v2-base-en",
533
+ "model_revision": "v0.0.1",
534
+ "quantizations": [
535
+ "none"
536
+ ]
537
+ }
538
+ }
539
+ }
540
+ ]
145
541
  },
146
542
  {
543
+ "version": 2,
147
544
  "model_name": "jina-embeddings-v2-base-zh",
148
545
  "dimensions": 768,
149
546
  "max_tokens": 8192,
150
- "language": ["zh", "en"],
151
- "model_id": "jinaai/jina-embeddings-v2-base-zh",
152
- "model_revision": "67974cbef5cf50562eadd745de8afc661c52c96f"
547
+ "language": [
548
+ "zh",
549
+ "en"
550
+ ],
551
+ "model_specs": [
552
+ {
553
+ "model_format": "pytorch",
554
+ "model_src": {
555
+ "huggingface": {
556
+ "model_id": "jinaai/jina-embeddings-v2-base-zh",
557
+ "model_revision": "67974cbef5cf50562eadd745de8afc661c52c96f",
558
+ "quantizations": [
559
+ "none"
560
+ ]
561
+ },
562
+ "modelscope": {
563
+ "model_id": "jinaai/jina-embeddings-v2-base-zh",
564
+ "quantizations": [
565
+ "none"
566
+ ]
567
+ }
568
+ }
569
+ }
570
+ ]
153
571
  },
154
572
  {
573
+ "version": 2,
155
574
  "model_name": "text2vec-large-chinese",
156
575
  "dimensions": 1024,
157
576
  "max_tokens": 256,
158
- "language": ["zh"],
159
- "model_id": "shibing624/text2vec-bge-large-chinese",
160
- "model_revision": "f5027ca48ea8316d63ee26d2b9bd27a061de33a3"
577
+ "language": [
578
+ "zh"
579
+ ],
580
+ "model_specs": [
581
+ {
582
+ "model_format": "pytorch",
583
+ "model_src": {
584
+ "huggingface": {
585
+ "model_id": "shibing624/text2vec-bge-large-chinese",
586
+ "model_revision": "f5027ca48ea8316d63ee26d2b9bd27a061de33a3",
587
+ "quantizations": [
588
+ "none"
589
+ ]
590
+ },
591
+ "modelscope": {
592
+ "model_id": "Jerry0/text2vec-large-chinese",
593
+ "quantizations": [
594
+ "none"
595
+ ]
596
+ }
597
+ }
598
+ }
599
+ ]
161
600
  },
162
601
  {
602
+ "version": 2,
163
603
  "model_name": "text2vec-base-chinese",
164
604
  "dimensions": 768,
165
605
  "max_tokens": 128,
166
- "language": ["zh"],
167
- "model_id": "shibing624/text2vec-base-chinese",
168
- "model_revision": "8acc1289891d75f6b665ad623359798b55f86adb"
606
+ "language": [
607
+ "zh"
608
+ ],
609
+ "model_specs": [
610
+ {
611
+ "model_format": "pytorch",
612
+ "model_src": {
613
+ "huggingface": {
614
+ "model_id": "shibing624/text2vec-base-chinese",
615
+ "model_revision": "8acc1289891d75f6b665ad623359798b55f86adb",
616
+ "quantizations": [
617
+ "none"
618
+ ]
619
+ },
620
+ "modelscope": {
621
+ "model_id": "Jerry0/text2vec-base-chinese",
622
+ "quantizations": [
623
+ "none"
624
+ ]
625
+ }
626
+ }
627
+ }
628
+ ]
169
629
  },
170
630
  {
631
+ "version": 2,
171
632
  "model_name": "text2vec-base-chinese-paraphrase",
172
633
  "dimensions": 768,
173
634
  "max_tokens": 256,
174
- "language": ["zh"],
175
- "model_id": "shibing624/text2vec-base-chinese-paraphrase",
176
- "model_revision": "beaf10481a5d9ca3b0daa9f0df6831ec956bf739"
635
+ "language": [
636
+ "zh"
637
+ ],
638
+ "model_specs": [
639
+ {
640
+ "model_format": "pytorch",
641
+ "model_src": {
642
+ "huggingface": {
643
+ "model_id": "shibing624/text2vec-base-chinese-paraphrase",
644
+ "model_revision": "beaf10481a5d9ca3b0daa9f0df6831ec956bf739",
645
+ "quantizations": [
646
+ "none"
647
+ ]
648
+ },
649
+ "modelscope": {
650
+ "model_id": "mwei23/text2vec-base-chinese-paraphrase",
651
+ "quantizations": [
652
+ "none"
653
+ ]
654
+ }
655
+ }
656
+ }
657
+ ]
177
658
  },
178
659
  {
660
+ "version": 2,
179
661
  "model_name": "text2vec-base-chinese-sentence",
180
662
  "dimensions": 768,
181
663
  "max_tokens": 256,
182
- "language": ["zh"],
183
- "model_id": "shibing624/text2vec-base-chinese-sentence",
184
- "model_revision": "e73a94e821f22c6163166bfab9408d03933a5525"
664
+ "language": [
665
+ "zh"
666
+ ],
667
+ "model_specs": [
668
+ {
669
+ "model_format": "pytorch",
670
+ "model_src": {
671
+ "huggingface": {
672
+ "model_id": "shibing624/text2vec-base-chinese-sentence",
673
+ "model_revision": "e73a94e821f22c6163166bfab9408d03933a5525",
674
+ "quantizations": [
675
+ "none"
676
+ ]
677
+ }
678
+ }
679
+ }
680
+ ]
185
681
  },
186
682
  {
683
+ "version": 2,
187
684
  "model_name": "text2vec-base-multilingual",
188
685
  "dimensions": 384,
189
686
  "max_tokens": 256,
190
- "language": ["zh"],
191
- "model_id": "shibing624/text2vec-base-multilingual",
192
- "model_revision": "f241877385fa56ebcc75f04d1850e1579cfa661d"
687
+ "language": [
688
+ "zh"
689
+ ],
690
+ "model_specs": [
691
+ {
692
+ "model_format": "pytorch",
693
+ "model_src": {
694
+ "huggingface": {
695
+ "model_id": "shibing624/text2vec-base-multilingual",
696
+ "model_revision": "f241877385fa56ebcc75f04d1850e1579cfa661d",
697
+ "quantizations": [
698
+ "none"
699
+ ]
700
+ }
701
+ }
702
+ }
703
+ ]
193
704
  },
194
705
  {
706
+ "version": 2,
195
707
  "model_name": "bge-m3",
196
708
  "dimensions": 1024,
197
709
  "max_tokens": 8192,
198
- "language": ["zh", "en"],
199
- "model_id": "BAAI/bge-m3",
200
- "model_revision": "73a15ad29ab604f3bdc31601849a9defe86d563f"
710
+ "language": [
711
+ "zh",
712
+ "en"
713
+ ],
714
+ "model_specs": [
715
+ {
716
+ "model_format": "pytorch",
717
+ "model_src": {
718
+ "huggingface": {
719
+ "model_id": "BAAI/bge-m3",
720
+ "model_revision": "73a15ad29ab604f3bdc31601849a9defe86d563f",
721
+ "quantizations": [
722
+ "none"
723
+ ]
724
+ },
725
+ "modelscope": {
726
+ "model_id": "Xorbits/bge-m3",
727
+ "quantizations": [
728
+ "none"
729
+ ]
730
+ }
731
+ }
732
+ }
733
+ ]
201
734
  },
202
735
  {
736
+ "version": 2,
203
737
  "model_name": "bce-embedding-base_v1",
204
738
  "dimensions": 768,
205
739
  "max_tokens": 512,
206
- "language": ["zh", "en"],
207
- "model_id": "maidalun1020/bce-embedding-base_v1",
208
- "model_revision": "236d9024fc1b4046f03848723f934521a66a9323"
740
+ "language": [
741
+ "zh",
742
+ "en"
743
+ ],
744
+ "model_specs": [
745
+ {
746
+ "model_format": "pytorch",
747
+ "model_src": {
748
+ "huggingface": {
749
+ "model_id": "maidalun1020/bce-embedding-base_v1",
750
+ "model_revision": "236d9024fc1b4046f03848723f934521a66a9323",
751
+ "quantizations": [
752
+ "none"
753
+ ]
754
+ },
755
+ "modelscope": {
756
+ "model_id": "maidalun/bce-embedding-base_v1",
757
+ "quantizations": [
758
+ "none"
759
+ ]
760
+ }
761
+ }
762
+ }
763
+ ]
209
764
  },
210
765
  {
766
+ "version": 2,
211
767
  "model_name": "m3e-small",
212
768
  "dimensions": 512,
213
769
  "max_tokens": 512,
214
- "language": ["zh", "en"],
215
- "model_id": "moka-ai/m3e-small",
216
- "model_revision": "44c696631b2a8c200220aaaad5f987f096e986df"
770
+ "language": [
771
+ "zh",
772
+ "en"
773
+ ],
774
+ "model_specs": [
775
+ {
776
+ "model_format": "pytorch",
777
+ "model_src": {
778
+ "huggingface": {
779
+ "model_id": "moka-ai/m3e-small",
780
+ "model_revision": "44c696631b2a8c200220aaaad5f987f096e986df",
781
+ "quantizations": [
782
+ "none"
783
+ ]
784
+ },
785
+ "modelscope": {
786
+ "model_id": "AI-ModelScope/m3e-small",
787
+ "quantizations": [
788
+ "none"
789
+ ]
790
+ }
791
+ }
792
+ }
793
+ ]
217
794
  },
218
795
  {
796
+ "version": 2,
219
797
  "model_name": "m3e-base",
220
798
  "dimensions": 768,
221
799
  "max_tokens": 512,
222
- "language": ["zh", "en"],
223
- "model_id": "moka-ai/m3e-base",
224
- "model_revision": "764b537a0e50e5c7d64db883f2d2e051cbe3c64c"
800
+ "language": [
801
+ "zh",
802
+ "en"
803
+ ],
804
+ "model_specs": [
805
+ {
806
+ "model_format": "pytorch",
807
+ "model_src": {
808
+ "huggingface": {
809
+ "model_id": "moka-ai/m3e-base",
810
+ "model_revision": "764b537a0e50e5c7d64db883f2d2e051cbe3c64c",
811
+ "quantizations": [
812
+ "none"
813
+ ]
814
+ },
815
+ "modelscope": {
816
+ "model_id": "AI-ModelScope/m3e-base",
817
+ "quantizations": [
818
+ "none"
819
+ ]
820
+ }
821
+ }
822
+ }
823
+ ]
225
824
  },
226
825
  {
826
+ "version": 2,
227
827
  "model_name": "m3e-large",
228
828
  "dimensions": 1024,
229
829
  "max_tokens": 512,
230
- "language": ["zh", "en"],
231
- "model_id": "moka-ai/m3e-large",
232
- "model_revision": "12900375086c37ba5d83d1e417b21dc7d1d1f388"
830
+ "language": [
831
+ "zh",
832
+ "en"
833
+ ],
834
+ "model_specs": [
835
+ {
836
+ "model_format": "pytorch",
837
+ "model_src": {
838
+ "huggingface": {
839
+ "model_id": "moka-ai/m3e-large",
840
+ "model_revision": "12900375086c37ba5d83d1e417b21dc7d1d1f388",
841
+ "quantizations": [
842
+ "none"
843
+ ]
844
+ },
845
+ "modelscope": {
846
+ "model_id": "AI-ModelScope/m3e-large",
847
+ "quantizations": [
848
+ "none"
849
+ ]
850
+ }
851
+ }
852
+ }
853
+ ]
233
854
  },
234
855
  {
856
+ "version": 2,
235
857
  "model_name": "gte-Qwen2",
236
858
  "dimensions": 3584,
237
859
  "max_tokens": 32000,
238
- "language": ["zh", "en"],
239
- "model_id": "Alibaba-NLP/gte-Qwen2-7B-instruct",
240
- "model_revision": "e26182b2122f4435e8b3ebecbf363990f409b45b"
860
+ "language": [
861
+ "zh",
862
+ "en"
863
+ ],
864
+ "model_specs": [
865
+ {
866
+ "model_format": "pytorch",
867
+ "model_src": {
868
+ "huggingface": {
869
+ "model_id": "Alibaba-NLP/gte-Qwen2-7B-instruct",
870
+ "model_revision": "e26182b2122f4435e8b3ebecbf363990f409b45b",
871
+ "quantizations": [
872
+ "none"
873
+ ]
874
+ },
875
+ "modelscope": {
876
+ "model_id": "iic/gte_Qwen2-7B-instruct",
877
+ "quantizations": [
878
+ "none"
879
+ ]
880
+ }
881
+ }
882
+ }
883
+ ]
241
884
  },
242
885
  {
886
+ "version": 2,
243
887
  "model_name": "Qwen3-Embedding-0.6B",
244
888
  "dimensions": 1024,
245
889
  "max_tokens": 32768,
246
- "language": ["zh", "en"],
247
- "model_id": "Qwen/Qwen3-Embedding-0.6B",
248
- "model_revision": "744169034862c8eec56628663995004342e4e449"
890
+ "language": [
891
+ "zh",
892
+ "en"
893
+ ],
894
+ "model_specs": [
895
+ {
896
+ "model_format": "pytorch",
897
+ "model_src": {
898
+ "huggingface": {
899
+ "model_id": "Qwen/Qwen3-Embedding-0.6B",
900
+ "model_revision": "744169034862c8eec56628663995004342e4e449",
901
+ "quantizations": [
902
+ "none"
903
+ ]
904
+ },
905
+ "modelscope": {
906
+ "model_id": "Qwen/Qwen3-Embedding-0.6B",
907
+ "quantizations": [
908
+ "none"
909
+ ]
910
+ }
911
+ }
912
+ },
913
+ {
914
+ "model_format": "ggufv2",
915
+ "model_src": {
916
+ "huggingface": {
917
+ "model_id": "Qwen/Qwen3-Embedding-0.6B-GGUF",
918
+ "model_revision": "48f36f50b4a081a6f56dd4a227f9b66668e1399f",
919
+ "quantizations": [
920
+ "Q8_0"
921
+ ],
922
+ "model_file_name_template": "Qwen3-Embedding-0.6B-{quantization}.gguf"
923
+ },
924
+ "modelscope": {
925
+ "model_id": "Qwen/Qwen3-Embedding-0.6B-GGUF",
926
+ "quantizations": [
927
+ "Q8_0"
928
+ ],
929
+ "model_file_name_template": "Qwen3-Embedding-0.6B-{quantization}.gguf"
930
+ }
931
+ }
932
+ }
933
+ ]
249
934
  },
250
935
  {
936
+ "version": 2,
251
937
  "model_name": "Qwen3-Embedding-4B",
252
938
  "dimensions": 2560,
253
939
  "max_tokens": 32768,
254
- "language": ["zh", "en"],
255
- "model_id": "Qwen/Qwen3-Embedding-4B",
256
- "model_revision": "408b81b7fab742073065d5b3661fa74c1b3ee0a1"
940
+ "language": [
941
+ "zh",
942
+ "en"
943
+ ],
944
+ "model_specs": [
945
+ {
946
+ "model_format": "pytorch",
947
+ "model_src": {
948
+ "huggingface": {
949
+ "model_id": "Qwen/Qwen3-Embedding-4B",
950
+ "model_revision": "408b81b7fab742073065d5b3661fa74c1b3ee0a1",
951
+ "quantizations": [
952
+ "none"
953
+ ]
954
+ },
955
+ "modelscope": {
956
+ "model_id": "Qwen/Qwen3-Embedding-4B",
957
+ "quantizations": [
958
+ "none"
959
+ ]
960
+ }
961
+ }
962
+ },
963
+ {
964
+ "model_format": "ggufv2",
965
+ "model_src": {
966
+ "huggingface": {
967
+ "model_id": "Qwen/Qwen3-Embedding-4B-GGUF",
968
+ "model_revision": "e85059c9a23c106d40df0da29d27a6b7c528265b",
969
+ "quantizations": [
970
+ "Q4_K_M",
971
+ "Q5_0",
972
+ "Q5_K_M",
973
+ "Q6_K",
974
+ "Q8_0"
975
+ ],
976
+ "model_file_name_template": "Qwen3-Embedding-4B-{quantization}.gguf"
977
+ },
978
+ "modelscope": {
979
+ "model_id": "Qwen/Qwen3-Embedding-4B-GGUF",
980
+ "quantizations": [
981
+ "Q4_K_M",
982
+ "Q5_0",
983
+ "Q5_K_M",
984
+ "Q6_K",
985
+ "Q8_0"
986
+ ],
987
+ "model_file_name_template": "Qwen3-Embedding-4B-{quantization}.gguf"
988
+ }
989
+ }
990
+ }
991
+ ]
257
992
  },
258
993
  {
994
+ "version": 2,
259
995
  "model_name": "Qwen3-Embedding-8B",
260
996
  "dimensions": 4096,
261
997
  "max_tokens": 32768,
262
- "language": ["zh", "en"],
263
- "model_id": "Qwen/Qwen3-Embedding-8B",
264
- "model_revision": "a3d38e32b9c835d5b3d0d0a3ef3c133bbea92539"
998
+ "language": [
999
+ "zh",
1000
+ "en"
1001
+ ],
1002
+ "model_specs": [
1003
+ {
1004
+ "model_format": "pytorch",
1005
+ "model_src": {
1006
+ "huggingface": {
1007
+ "model_id": "Qwen/Qwen3-Embedding-8B",
1008
+ "model_revision": "a3d38e32b9c835d5b3d0d0a3ef3c133bbea92539",
1009
+ "quantizations": [
1010
+ "none"
1011
+ ]
1012
+ },
1013
+ "modelscope": {
1014
+ "model_id": "Qwen/Qwen3-Embedding-8B",
1015
+ "quantizations": [
1016
+ "none"
1017
+ ]
1018
+ }
1019
+ }
1020
+ },
1021
+ {
1022
+ "model_format": "ggufv2",
1023
+ "model_src": {
1024
+ "huggingface": {
1025
+ "model_id": "Qwen/Qwen3-Embedding-8B-GGUF",
1026
+ "model_revision": "e7cad3531ff6c346352edc899d1cf5f63e616b05",
1027
+ "quantizations": [
1028
+ "Q4_K_M",
1029
+ "Q5_0",
1030
+ "Q5_K_M",
1031
+ "Q6_K",
1032
+ "Q8_0"
1033
+ ],
1034
+ "model_file_name_template": "Qwen3-Embedding-8B-{quantization}.gguf"
1035
+ },
1036
+ "modelscope": {
1037
+ "model_id": "Qwen/Qwen3-Embedding-8B-GGUF",
1038
+ "quantizations": [
1039
+ "Q4_K_M",
1040
+ "Q5_0",
1041
+ "Q5_K_M",
1042
+ "Q6_K",
1043
+ "Q8_0"
1044
+ ],
1045
+ "model_file_name_template": "Qwen3-Embedding-8B-{quantization}.gguf"
1046
+ }
1047
+ }
1048
+ }
1049
+ ]
265
1050
  },
266
1051
  {
1052
+ "version": 2,
267
1053
  "model_name": "jina-embeddings-v3",
268
1054
  "dimensions": 1024,
269
1055
  "max_tokens": 8192,
270
- "language": ["zh", "en"],
271
- "model_id": "jinaai/jina-embeddings-v3"
1056
+ "language": [
1057
+ "zh",
1058
+ "en"
1059
+ ],
1060
+ "model_specs": [
1061
+ {
1062
+ "model_format": "pytorch",
1063
+ "model_src": {
1064
+ "huggingface": {
1065
+ "model_id": "jinaai/jina-embeddings-v3",
1066
+ "quantizations": [
1067
+ "none"
1068
+ ]
1069
+ },
1070
+ "modelscope": {
1071
+ "model_id": "jinaai/jina-embeddings-v3",
1072
+ "quantizations": [
1073
+ "none"
1074
+ ]
1075
+ }
1076
+ }
1077
+ }
1078
+ ]
272
1079
  },
273
1080
  {
1081
+ "version": 2,
274
1082
  "model_name": "jina-clip-v2",
275
1083
  "dimensions": 1024,
276
1084
  "max_tokens": 8192,
277
- "language": ["89 languages supported"],
278
- "model_id": "jinaai/jina-clip-v2",
1085
+ "language": [
1086
+ "89 languages supported"
1087
+ ],
1088
+ "model_specs": [
1089
+ {
1090
+ "model_format": "pytorch",
1091
+ "model_src": {
1092
+ "huggingface": {
1093
+ "model_id": "jinaai/jina-clip-v2",
1094
+ "quantizations": [
1095
+ "none"
1096
+ ]
1097
+ },
1098
+ "modelscope": {
1099
+ "model_id": "jinaai/jina-clip-v2",
1100
+ "quantizations": [
1101
+ "none"
1102
+ ]
1103
+ }
1104
+ }
1105
+ }
1106
+ ],
279
1107
  "virtualenv": {
280
1108
  "packages": [
281
1109
  "sentence_transformers",
@@ -285,5 +1113,42 @@
285
1113
  ],
286
1114
  "no_build_isolation": true
287
1115
  }
1116
+ },
1117
+ {
1118
+ "version": 2,
1119
+ "model_name": "jina-embeddings-v4",
1120
+ "dimensions": 2048,
1121
+ "max_tokens": 32768,
1122
+ "language": [
1123
+ "30+ languages supported"
1124
+ ],
1125
+ "model_specs": [
1126
+ {
1127
+ "model_format": "pytorch",
1128
+ "model_src": {
1129
+ "huggingface": {
1130
+ "model_id": "jinaai/jina-embeddings-v4",
1131
+ "quantizations": [
1132
+ "none"
1133
+ ]
1134
+ },
1135
+ "modelscope": {
1136
+ "model_id": "jinaai/jina-embeddings-v4",
1137
+ "quantizations": [
1138
+ "none"
1139
+ ]
1140
+ }
1141
+ }
1142
+ }
1143
+ ],
1144
+ "virtualenv": {
1145
+ "packages": [
1146
+ "sentence_transformers",
1147
+ "transformers==4.52.0",
1148
+ "xformers",
1149
+ "flash_attn==2.7.4 ; sys_platform=='linux'"
1150
+ ],
1151
+ "no_build_isolation": true
1152
+ }
288
1153
  }
289
1154
  ]