mteb-2.7.3-py3-none-any.whl → mteb-2.7.4-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (157)
  1. mteb/abstasks/retrieval.py +1 -1
  2. mteb/benchmarks/benchmarks/__init__.py +2 -0
  3. mteb/benchmarks/benchmarks/benchmarks.py +41 -2
  4. mteb/descriptive_stats/Retrieval/BrightAopsRetrieval.json +35 -0
  5. mteb/descriptive_stats/Retrieval/BrightBiologyLongRetrieval.json +35 -0
  6. mteb/descriptive_stats/Retrieval/BrightBiologyRetrieval.json +35 -0
  7. mteb/descriptive_stats/Retrieval/BrightEarthScienceLongRetrieval.json +35 -0
  8. mteb/descriptive_stats/Retrieval/BrightEarthScienceRetrieval.json +35 -0
  9. mteb/descriptive_stats/Retrieval/BrightEconomicsLongRetrieval.json +35 -0
  10. mteb/descriptive_stats/Retrieval/BrightEconomicsRetrieval.json +35 -0
  11. mteb/descriptive_stats/Retrieval/BrightLeetcodeRetrieval.json +35 -0
  12. mteb/descriptive_stats/Retrieval/BrightPonyLongRetrieval.json +35 -0
  13. mteb/descriptive_stats/Retrieval/BrightPonyRetrieval.json +35 -0
  14. mteb/descriptive_stats/Retrieval/BrightPsychologyLongRetrieval.json +35 -0
  15. mteb/descriptive_stats/Retrieval/BrightPsychologyRetrieval.json +35 -0
  16. mteb/descriptive_stats/Retrieval/BrightRoboticsLongRetrieval.json +35 -0
  17. mteb/descriptive_stats/Retrieval/BrightRoboticsRetrieval.json +35 -0
  18. mteb/descriptive_stats/Retrieval/BrightStackoverflowLongRetrieval.json +35 -0
  19. mteb/descriptive_stats/Retrieval/BrightStackoverflowRetrieval.json +35 -0
  20. mteb/descriptive_stats/Retrieval/BrightSustainableLivingLongRetrieval.json +35 -0
  21. mteb/descriptive_stats/Retrieval/BrightSustainableLivingRetrieval.json +35 -0
  22. mteb/descriptive_stats/Retrieval/BrightTheoremQAQuestionsRetrieval.json +35 -0
  23. mteb/descriptive_stats/Retrieval/BrightTheoremQATheoremsRetrieval.json +35 -0
  24. mteb/models/model_implementations/align_models.py +1 -0
  25. mteb/models/model_implementations/amazon_models.py +1 -0
  26. mteb/models/model_implementations/andersborges.py +2 -0
  27. mteb/models/model_implementations/ara_models.py +1 -0
  28. mteb/models/model_implementations/arctic_models.py +8 -0
  29. mteb/models/model_implementations/b1ade_models.py +1 -0
  30. mteb/models/model_implementations/bedrock_models.py +4 -0
  31. mteb/models/model_implementations/bge_models.py +40 -1
  32. mteb/models/model_implementations/bica_model.py +1 -0
  33. mteb/models/model_implementations/blip2_models.py +2 -0
  34. mteb/models/model_implementations/blip_models.py +8 -0
  35. mteb/models/model_implementations/bm25.py +8 -5
  36. mteb/models/model_implementations/bmretriever_models.py +4 -0
  37. mteb/models/model_implementations/cadet_models.py +1 -0
  38. mteb/models/model_implementations/cde_models.py +2 -0
  39. mteb/models/model_implementations/clip_models.py +3 -0
  40. mteb/models/model_implementations/clips_models.py +3 -0
  41. mteb/models/model_implementations/codefuse_models.py +5 -0
  42. mteb/models/model_implementations/codesage_models.py +3 -0
  43. mteb/models/model_implementations/cohere_models.py +4 -0
  44. mteb/models/model_implementations/cohere_v.py +5 -0
  45. mteb/models/model_implementations/colpali_models.py +3 -0
  46. mteb/models/model_implementations/colqwen_models.py +7 -0
  47. mteb/models/model_implementations/colsmol_models.py +2 -0
  48. mteb/models/model_implementations/conan_models.py +1 -0
  49. mteb/models/model_implementations/dino_models.py +19 -0
  50. mteb/models/model_implementations/e5_instruct.py +4 -0
  51. mteb/models/model_implementations/e5_models.py +9 -0
  52. mteb/models/model_implementations/e5_v.py +1 -0
  53. mteb/models/model_implementations/eagerworks_models.py +1 -0
  54. mteb/models/model_implementations/emillykkejensen_models.py +3 -0
  55. mteb/models/model_implementations/en_code_retriever.py +1 -0
  56. mteb/models/model_implementations/euler_models.py +1 -0
  57. mteb/models/model_implementations/evaclip_models.py +4 -0
  58. mteb/models/model_implementations/fa_models.py +9 -0
  59. mteb/models/model_implementations/facebookai.py +2 -0
  60. mteb/models/model_implementations/geogpt_models.py +1 -0
  61. mteb/models/model_implementations/gme_v_models.py +2 -0
  62. mteb/models/model_implementations/google_models.py +5 -0
  63. mteb/models/model_implementations/granite_vision_embedding_models.py +1 -0
  64. mteb/models/model_implementations/gritlm_models.py +2 -0
  65. mteb/models/model_implementations/gte_models.py +9 -0
  66. mteb/models/model_implementations/hinvec_models.py +1 -0
  67. mteb/models/model_implementations/human.py +1 -0
  68. mteb/models/model_implementations/ibm_granite_models.py +6 -0
  69. mteb/models/model_implementations/inf_models.py +2 -0
  70. mteb/models/model_implementations/jasper_models.py +2 -0
  71. mteb/models/model_implementations/jina_clip.py +1 -0
  72. mteb/models/model_implementations/jina_models.py +7 -0
  73. mteb/models/model_implementations/kalm_models.py +6 -0
  74. mteb/models/model_implementations/kblab.py +1 -0
  75. mteb/models/model_implementations/kennethenevoldsen_models.py +2 -0
  76. mteb/models/model_implementations/kfst.py +1 -0
  77. mteb/models/model_implementations/kowshik24_models.py +1 -0
  78. mteb/models/model_implementations/lens_models.py +2 -0
  79. mteb/models/model_implementations/lgai_embedding_models.py +1 -0
  80. mteb/models/model_implementations/linq_models.py +1 -0
  81. mteb/models/model_implementations/listconranker.py +1 -0
  82. mteb/models/model_implementations/llm2clip_models.py +3 -0
  83. mteb/models/model_implementations/llm2vec_models.py +8 -0
  84. mteb/models/model_implementations/mcinext_models.py +3 -0
  85. mteb/models/model_implementations/mdbr_models.py +2 -0
  86. mteb/models/model_implementations/misc_models.py +63 -0
  87. mteb/models/model_implementations/mixedbread_ai_models.py +3 -0
  88. mteb/models/model_implementations/mme5_models.py +2 -1
  89. mteb/models/model_implementations/moco_models.py +2 -0
  90. mteb/models/model_implementations/mod_models.py +1 -0
  91. mteb/models/model_implementations/model2vec_models.py +13 -0
  92. mteb/models/model_implementations/moka_models.py +3 -0
  93. mteb/models/model_implementations/nbailab.py +3 -0
  94. mteb/models/model_implementations/no_instruct_sentence_models.py +1 -0
  95. mteb/models/model_implementations/nomic_models.py +6 -0
  96. mteb/models/model_implementations/nomic_models_vision.py +1 -0
  97. mteb/models/model_implementations/nvidia_llama_nemoretriever_colemb.py +2 -0
  98. mteb/models/model_implementations/nvidia_models.py +3 -0
  99. mteb/models/model_implementations/octen_models.py +2 -0
  100. mteb/models/model_implementations/openai_models.py +5 -0
  101. mteb/models/model_implementations/openclip_models.py +8 -0
  102. mteb/models/model_implementations/opensearch_neural_sparse_models.py +5 -0
  103. mteb/models/model_implementations/ops_moa_models.py +2 -0
  104. mteb/models/model_implementations/ordalietech_solon_embeddings_mini_beta_1_1.py +1 -0
  105. mteb/models/model_implementations/pawan_models.py +1 -0
  106. mteb/models/model_implementations/piccolo_models.py +2 -0
  107. mteb/models/model_implementations/promptriever_models.py +4 -0
  108. mteb/models/model_implementations/pylate_models.py +3 -0
  109. mteb/models/model_implementations/qodo_models.py +2 -0
  110. mteb/models/model_implementations/qtack_models.py +1 -0
  111. mteb/models/model_implementations/qwen3_models.py +3 -0
  112. mteb/models/model_implementations/qzhou_models.py +2 -0
  113. mteb/models/model_implementations/rasgaard_models.py +1 -0
  114. mteb/models/model_implementations/reasonir_model.py +65 -0
  115. mteb/models/model_implementations/repllama_models.py +2 -0
  116. mteb/models/model_implementations/rerankers_custom.py +3 -0
  117. mteb/models/model_implementations/rerankers_monot5_based.py +14 -0
  118. mteb/models/model_implementations/richinfoai_models.py +1 -0
  119. mteb/models/model_implementations/ru_sentence_models.py +20 -0
  120. mteb/models/model_implementations/ruri_models.py +10 -0
  121. mteb/models/model_implementations/salesforce_models.py +3 -0
  122. mteb/models/model_implementations/samilpwc_models.py +1 -0
  123. mteb/models/model_implementations/sarashina_embedding_models.py +2 -0
  124. mteb/models/model_implementations/searchmap_models.py +1 -0
  125. mteb/models/model_implementations/seed_1_6_embedding_models.py +1 -0
  126. mteb/models/model_implementations/seed_1_6_embedding_models_1215.py +1 -0
  127. mteb/models/model_implementations/seed_models.py +1 -0
  128. mteb/models/model_implementations/sentence_transformers_models.py +18 -0
  129. mteb/models/model_implementations/shuu_model.py +1 -0
  130. mteb/models/model_implementations/siglip_models.py +10 -0
  131. mteb/models/model_implementations/sonar_models.py +2 -1
  132. mteb/models/model_implementations/spartan8806_atles_champion.py +1 -0
  133. mteb/models/model_implementations/stella_models.py +6 -0
  134. mteb/models/model_implementations/tarka_models.py +2 -0
  135. mteb/models/model_implementations/text2vec_models.py +3 -0
  136. mteb/models/model_implementations/ua_sentence_models.py +1 -0
  137. mteb/models/model_implementations/uae_models.py +1 -0
  138. mteb/models/model_implementations/vdr_models.py +1 -0
  139. mteb/models/model_implementations/vi_vn_models.py +6 -0
  140. mteb/models/model_implementations/vista_models.py +2 -0
  141. mteb/models/model_implementations/vlm2vec_models.py +2 -0
  142. mteb/models/model_implementations/voyage_models.py +15 -0
  143. mteb/models/model_implementations/voyage_v.py +1 -0
  144. mteb/models/model_implementations/xyz_models.py +1 -0
  145. mteb/models/model_implementations/youtu_models.py +1 -0
  146. mteb/models/model_implementations/yuan_models.py +1 -0
  147. mteb/models/model_implementations/yuan_models_en.py +1 -0
  148. mteb/models/model_meta.py +35 -2
  149. mteb/tasks/retrieval/eng/__init__.py +42 -0
  150. mteb/tasks/retrieval/eng/bright_retrieval.py +9 -1
  151. mteb/tasks/retrieval/eng/bright_v1_1_retrieval.py +968 -0
  152. {mteb-2.7.3.dist-info → mteb-2.7.4.dist-info}/METADATA +1 -1
  153. {mteb-2.7.3.dist-info → mteb-2.7.4.dist-info}/RECORD +157 -136
  154. {mteb-2.7.3.dist-info → mteb-2.7.4.dist-info}/WHEEL +0 -0
  155. {mteb-2.7.3.dist-info → mteb-2.7.4.dist-info}/entry_points.txt +0 -0
  156. {mteb-2.7.3.dist-info → mteb-2.7.4.dist-info}/licenses/LICENSE +0 -0
  157. {mteb-2.7.3.dist-info → mteb-2.7.4.dist-info}/top_level.txt +0 -0
@@ -20,6 +20,7 @@ geoembedding = ModelMeta(
20
20
  ),
21
21
  release_date="2025-04-22",
22
22
  n_parameters=7241732096,
23
+ n_embedding_parameters=131_072_000,
23
24
  memory_usage_mb=27625,
24
25
  embed_dim=4096,
25
26
  license="apache-2.0",
@@ -356,6 +356,7 @@ gme_qwen2vl_2b = ModelMeta(
356
356
  release_date="2024-12-24",
357
357
  modalities=["image", "text"],
358
358
  n_parameters=2_210_000_000,
359
+ n_embedding_parameters=233_373_696,
359
360
  memory_usage_mb=8427,
360
361
  embed_dim=1536,
361
362
  license="apache-2.0",
@@ -380,6 +381,7 @@ gme_qwen2vl_7b = ModelMeta(
380
381
  release_date="2024-12-24",
381
382
  modalities=["image", "text"],
382
383
  n_parameters=8_290_000_000,
384
+ n_embedding_parameters=544_997_376,
383
385
  memory_usage_mb=31629,
384
386
  embed_dim=3584,
385
387
  license="apache-2.0",
@@ -162,6 +162,7 @@ google_text_emb_004 = ModelMeta(
162
162
  revision="1", # revision is intended for implementation
163
163
  release_date="2024-05-14",
164
164
  n_parameters=None,
165
+ n_embedding_parameters=None,
165
166
  memory_usage_mb=None,
166
167
  max_tokens=2048,
167
168
  embed_dim=768,
@@ -187,6 +188,7 @@ google_text_emb_005 = ModelMeta(
187
188
  revision="1", # revision is intended for implementation
188
189
  release_date="2024-11-18",
189
190
  n_parameters=None,
191
+ n_embedding_parameters=None,
190
192
  memory_usage_mb=None,
191
193
  max_tokens=2048,
192
194
  embed_dim=768,
@@ -212,6 +214,7 @@ google_text_multilingual_emb_002 = ModelMeta(
212
214
  revision="1",
213
215
  release_date="2024-05-14",
214
216
  n_parameters=None,
217
+ n_embedding_parameters=None,
215
218
  memory_usage_mb=None,
216
219
  max_tokens=2048,
217
220
  embed_dim=768,
@@ -237,6 +240,7 @@ google_gemini_embedding_001 = ModelMeta(
237
240
  revision="1",
238
241
  release_date="2025-03-07",
239
242
  n_parameters=None,
243
+ n_embedding_parameters=None,
240
244
  memory_usage_mb=None,
241
245
  max_tokens=2048,
242
246
  embed_dim=3072,
@@ -272,6 +276,7 @@ embedding_gemma_300m = ModelMeta(
272
276
  revision="64614b0b8b64f0c6c1e52b07e4e9a4e8fe4d2da2",
273
277
  release_date="2025-09-04",
274
278
  n_parameters=307_581_696,
279
+ n_embedding_parameters=201_326_592,
275
280
  embed_dim=768,
276
281
  max_tokens=2048,
277
282
  license="gemma",
@@ -173,6 +173,7 @@ granite_vision_embedding = ModelMeta(
173
173
  release_date="2025-06-11",
174
174
  modalities=["image", "text"],
175
175
  n_parameters=2_980_000_000,
176
+ n_embedding_parameters=None,
176
177
  memory_usage_mb=11351,
177
178
  max_tokens=128000,
178
179
  embed_dim=128,
@@ -44,6 +44,7 @@ gritlm7b = ModelMeta(
44
44
  revision="13f00a0e36500c80ce12870ea513846a066004af",
45
45
  release_date="2024-02-15",
46
46
  n_parameters=7_240_000_000,
47
+ n_embedding_parameters=131_072_000,
47
48
  memory_usage_mb=13813,
48
49
  embed_dim=4096,
49
50
  license="apache-2.0",
@@ -73,6 +74,7 @@ gritlm8x7b = ModelMeta(
73
74
  revision="7f089b13e3345510281733ca1e6ff871b5b4bc76",
74
75
  release_date="2024-02-15",
75
76
  n_parameters=57_920_000_000,
77
+ n_embedding_parameters=None,
76
78
  memory_usage_mb=89079,
77
79
  embed_dim=32768,
78
80
  license="apache-2.0",
@@ -48,6 +48,7 @@ gte_qwen2_7b_instruct = ModelMeta(
48
48
  revision="e26182b2122f4435e8b3ebecbf363990f409b45b",
49
49
  release_date="2024-06-15", # initial commit of hf model.
50
50
  n_parameters=7_613_000_000,
51
+ n_embedding_parameters=543_499_264,
51
52
  memory_usage_mb=29040,
52
53
  embed_dim=3584,
53
54
  license="apache-2.0",
@@ -80,6 +81,7 @@ gte_qwen1_5_7b_instruct = ModelMeta(
80
81
  revision="07d27e5226328010336563bc1b564a5e3436a298",
81
82
  release_date="2024-04-20", # initial commit of hf model.
82
83
  n_parameters=7_720_000_000,
84
+ n_embedding_parameters=None,
83
85
  memory_usage_mb=29449,
84
86
  embed_dim=4096,
85
87
  license="apache-2.0",
@@ -117,6 +119,7 @@ gte_qwen2_1_5b_instruct = ModelMeta(
117
119
  revision="c6c1b92f4a3e1b92b326ad29dd3c8433457df8dd",
118
120
  release_date="2024-07-29", # initial commit of hf model.
119
121
  n_parameters=1_780_000_000,
122
+ n_embedding_parameters=232_928_256,
120
123
  memory_usage_mb=6776,
121
124
  embed_dim=8960,
122
125
  license="apache-2.0",
@@ -145,6 +148,7 @@ gte_small_zh = ModelMeta(
145
148
  revision="af7bd46fbb00b3a6963c8dd7f1786ddfbfbe973a",
146
149
  release_date="2023-11-08", # initial commit of hf model.
147
150
  n_parameters=int(30.3 * 1e6),
151
+ n_embedding_parameters=10_817_536,
148
152
  memory_usage_mb=58,
149
153
  embed_dim=1024,
150
154
  license="mit",
@@ -173,6 +177,7 @@ gte_base_zh = ModelMeta(
173
177
  revision="71ab7947d6fac5b64aa299e6e40e6c2b2e85976c",
174
178
  release_date="2023-11-08", # initial commit of hf model.
175
179
  n_parameters=int(102 * 1e6),
180
+ n_embedding_parameters=16_226_304,
176
181
  memory_usage_mb=195,
177
182
  embed_dim=1024,
178
183
  license="mit",
@@ -201,6 +206,7 @@ gte_large_zh = ModelMeta(
201
206
  revision="64c364e579de308104a9b2c170ca009502f4f545",
202
207
  release_date="2023-11-08", # initial commit of hf model.
203
208
  n_parameters=int(326 * 1e6),
209
+ n_embedding_parameters=21_635_072,
204
210
  memory_usage_mb=621,
205
211
  embed_dim=1024,
206
212
  license="mit",
@@ -330,6 +336,7 @@ gte_multilingual_base = ModelMeta(
330
336
  revision="ca1791e0bcc104f6db161f27de1340241b13c5a4",
331
337
  release_date="2024-07-20", # initial commit of hf model.
332
338
  n_parameters=int(305 * 1e6),
339
+ n_embedding_parameters=192_036_864,
333
340
  memory_usage_mb=582,
334
341
  embed_dim=768,
335
342
  license="apache-2.0",
@@ -359,6 +366,7 @@ gte_modernbert_base = ModelMeta(
359
366
  revision="7ca8b4ca700621b67618669f5378fe5f5820b8e4",
360
367
  release_date="2025-01-21", # initial commit of hf model.
361
368
  n_parameters=int(149 * 1e6),
369
+ n_embedding_parameters=None,
362
370
  memory_usage_mb=284,
363
371
  embed_dim=768,
364
372
  license="apache-2.0",
@@ -402,6 +410,7 @@ gte_base_en_v15 = ModelMeta(
402
410
  revision="a829fd0e060bb84554da0dfd354d0de0f7712b7f", # can be any
403
411
  release_date="2024-06-20", # initial commit of hf model
404
412
  n_parameters=137_000_000,
413
+ n_embedding_parameters=23_445_504,
405
414
  memory_usage_mb=None,
406
415
  embed_dim=768,
407
416
  license="apache-2.0",
@@ -47,6 +47,7 @@ Hinvec_bidir = ModelMeta(
47
47
  revision="d4fc678720cc1b8c5d18599ce2d9a4d6090c8b6b",
48
48
  release_date="2025-06-19",
49
49
  n_parameters=939_591_680,
50
+ n_embedding_parameters=None,
50
51
  memory_usage_mb=3715,
51
52
  embed_dim=2048,
52
53
  license="cc-by-nc-4.0",
@@ -9,6 +9,7 @@ human = ModelMeta(
9
9
  revision="2025_09_25",
10
10
  release_date=None,
11
11
  n_parameters=None,
12
+ n_embedding_parameters=None,
12
13
  memory_usage_mb=None,
13
14
  embed_dim=None,
14
15
  license=None,
@@ -100,6 +100,7 @@ granite_107m_multilingual = ModelMeta(
100
100
  revision="47db56afe692f731540413c67dd818ff492277e7",
101
101
  release_date="2024-12-18",
102
102
  n_parameters=107_000_000,
103
+ n_embedding_parameters=96_000_768,
103
104
  memory_usage_mb=204,
104
105
  embed_dim=384,
105
106
  license="apache-2.0",
@@ -131,6 +132,7 @@ granite_278m_multilingual = ModelMeta(
131
132
  revision="84e3546b88b0cb69f8078608a1df558020bcbf1f",
132
133
  release_date="2024-12-18",
133
134
  n_parameters=278_000_000,
135
+ n_embedding_parameters=192_001_536,
134
136
  memory_usage_mb=530,
135
137
  embed_dim=768,
136
138
  license="apache-2.0",
@@ -162,6 +164,7 @@ granite_30m_english = ModelMeta(
162
164
  revision="eddbb57470f896b5f8e2bfcb823d8f0e2d2024a5",
163
165
  release_date="2024-12-18",
164
166
  n_parameters=30_000_000,
167
+ n_embedding_parameters=19_301_760,
165
168
  memory_usage_mb=58,
166
169
  embed_dim=384,
167
170
  license="apache-2.0",
@@ -193,6 +196,7 @@ granite_125m_english = ModelMeta(
193
196
  revision="e48d3a5b47eaa18e3fe07d4676e187fd80f32730",
194
197
  release_date="2024-12-18",
195
198
  n_parameters=125_000_000,
199
+ n_embedding_parameters=38_603_520,
196
200
  memory_usage_mb=238,
197
201
  embed_dim=768,
198
202
  license="apache-2.0",
@@ -225,6 +229,7 @@ granite_english_r2 = ModelMeta(
225
229
  revision="6e7b8ce0e76270394ac4669ba4bbd7133b60b7f9",
226
230
  release_date="2025-08-15",
227
231
  n_parameters=149_000_000,
232
+ n_embedding_parameters=None,
228
233
  memory_usage_mb=284,
229
234
  embed_dim=768,
230
235
  license="apache-2.0",
@@ -250,6 +255,7 @@ granite_small_english_r2 = ModelMeta(
250
255
  revision="54a8d2616a0844355a5164432d3f6dafb37b17a3",
251
256
  release_date="2025-08-15",
252
257
  n_parameters=47_000_000,
258
+ n_embedding_parameters=None,
253
259
  memory_usage_mb=91,
254
260
  embed_dim=384,
255
261
  license="apache-2.0",
@@ -56,6 +56,7 @@ inf_retriever_v1 = ModelMeta(
56
56
  revision="cb70ca7c31dfa866b2eff2dad229c144d8ddfd91",
57
57
  release_date="2024-12-24", # initial commit of hf model.
58
58
  n_parameters=7_069_121_024,
59
+ n_embedding_parameters=None,
59
60
  memory_usage_mb=13483,
60
61
  embed_dim=3584,
61
62
  license="apache-2.0",
@@ -83,6 +84,7 @@ inf_retriever_v1_1_5b = ModelMeta(
83
84
  revision="c9c05c2dd50707a486966ba81703021ae2094a06",
84
85
  release_date="2025-02-08", # initial commit of hf model.
85
86
  n_parameters=1_543_268_864,
87
+ n_embedding_parameters=232_928_256,
86
88
  memory_usage_mb=2944,
87
89
  embed_dim=1536,
88
90
  license="apache-2.0",
@@ -299,6 +299,7 @@ jasper_en_v1 = ModelMeta(
299
299
  revision="d6330ce98f8a0d741e781df845904c9484f00efa",
300
300
  release_date="2024-12-11", # first commit
301
301
  n_parameters=1_999_000_000,
302
+ n_embedding_parameters=232_932_864,
302
303
  memory_usage_mb=3802,
303
304
  max_tokens=131072,
304
305
  embed_dim=8960,
@@ -346,6 +347,7 @@ Jasper_Token_Compression_600M = ModelMeta(
346
347
  revision="06a100f753a5a96d9e583b3af79c6fcdfacc4719",
347
348
  release_date="2025-11-14",
348
349
  n_parameters=595776512,
350
+ n_embedding_parameters=None,
349
351
  memory_usage_mb=2272,
350
352
  embed_dim=2048,
351
353
  license="mit",
@@ -144,6 +144,7 @@ jina_clip_v1 = ModelMeta(
144
144
  release_date="2024-05-30",
145
145
  modalities=["image", "text"],
146
146
  n_parameters=223_000_000,
147
+ n_embedding_parameters=None,
147
148
  memory_usage_mb=849,
148
149
  max_tokens=8192,
149
150
  embed_dim=768,
@@ -733,6 +733,7 @@ jina_reranker_v3 = ModelMeta(
733
733
  release_date="2025-09-18", # official release date
734
734
  modalities=["text"],
735
735
  n_parameters=int(0.6 * 1e9),
736
+ n_embedding_parameters=None,
736
737
  memory_usage_mb=1138,
737
738
  max_tokens=131072,
738
739
  embed_dim=None,
@@ -776,6 +777,7 @@ jina_embeddings_v4 = ModelMeta(
776
777
  release_date="2025-06-24", # official release date
777
778
  modalities=["image", "text"],
778
779
  n_parameters=int(3.8 * 1e9),
780
+ n_embedding_parameters=None,
779
781
  memory_usage_mb=7500,
780
782
  max_tokens=32768,
781
783
  embed_dim=2048,
@@ -824,6 +826,7 @@ jina_embeddings_v3 = ModelMeta(
824
826
  revision="215a6e121fa0183376388ac6b1ae230326bfeaed",
825
827
  release_date="2024-09-18", # official release date
826
828
  n_parameters=int(572 * 1e6),
829
+ n_embedding_parameters=None,
827
830
  memory_usage_mb=1092,
828
831
  max_tokens=8194,
829
832
  embed_dim=1024,
@@ -884,6 +887,7 @@ jina_embeddings_v2_base_en = ModelMeta(
884
887
  revision="6e85f575bc273f1fd840a658067d0157933c83f0",
885
888
  release_date="2023-09-27",
886
889
  n_parameters=137_000_000,
890
+ n_embedding_parameters=23_445_504,
887
891
  memory_usage_mb=262,
888
892
  embed_dim=768,
889
893
  license="apache-2.0",
@@ -948,6 +952,7 @@ jina_embeddings_v2_small_en = ModelMeta(
948
952
  revision="44e7d1d6caec8c883c2d4b207588504d519788d0",
949
953
  release_date="2023-09-27",
950
954
  n_parameters=32_700_000,
955
+ n_embedding_parameters=15_630_336,
951
956
  memory_usage_mb=62,
952
957
  embed_dim=512,
953
958
  license="apache-2.0",
@@ -1009,6 +1014,7 @@ jina_embedding_b_en_v1 = ModelMeta(
1009
1014
  revision="32aa658e5ceb90793454d22a57d8e3a14e699516",
1010
1015
  release_date="2023-07-07",
1011
1016
  n_parameters=110_000_000,
1017
+ n_embedding_parameters=24_674_304,
1012
1018
  memory_usage_mb=420,
1013
1019
  embed_dim=768,
1014
1020
  license="apache-2.0",
@@ -1066,6 +1072,7 @@ jina_embedding_s_en_v1 = ModelMeta(
1066
1072
  revision="5ac6cd473e2324c6d5f9e558a6a9f65abb57143e",
1067
1073
  release_date="2023-07-07",
1068
1074
  n_parameters=35_000_000,
1075
+ n_embedding_parameters=16_449_536,
1069
1076
  memory_usage_mb=134,
1070
1077
  embed_dim=512,
1071
1078
  license="apache-2.0",
@@ -780,6 +780,7 @@ HIT_TMG__KaLM_embedding_multilingual_mini_instruct_v1 = ModelMeta(
780
780
  release_date="2024-10-23",
781
781
  languages=["eng-Latn", "zho-Hans"],
782
782
  n_parameters=494032768,
783
+ n_embedding_parameters=136_134_656,
783
784
  memory_usage_mb=1885,
784
785
  max_tokens=512,
785
786
  embed_dim=896,
@@ -805,6 +806,7 @@ HIT_TMG__KaLM_embedding_multilingual_mini_v1 = ModelMeta(
805
806
  release_date="2024-08-27",
806
807
  languages=["eng-Latn", "zho-Hans"],
807
808
  n_parameters=494032768,
809
+ n_embedding_parameters=136_134_656,
808
810
  memory_usage_mb=1885,
809
811
  max_tokens=512,
810
812
  embed_dim=896,
@@ -836,6 +838,7 @@ HIT_TMG__KaLM_embedding_multilingual_mini_instruct_v1_5 = ModelMeta(
836
838
  release_date="2024-12-26",
837
839
  languages=["eng-Latn", "zho-Hans"],
838
840
  n_parameters=494032768,
841
+ n_embedding_parameters=136_134_656,
839
842
  memory_usage_mb=1885,
840
843
  max_tokens=512,
841
844
  embed_dim=896,
@@ -867,6 +870,7 @@ HIT_TMG__KaLM_embedding_multilingual_mini_instruct_v2 = ModelMeta(
867
870
  release_date="2025-06-25",
868
871
  languages=["eng-Latn", "zho-Hans"],
869
872
  n_parameters=494032768,
873
+ n_embedding_parameters=136_134_656,
870
874
  memory_usage_mb=942,
871
875
  max_tokens=512,
872
876
  embed_dim=896,
@@ -898,6 +902,7 @@ KaLM_Embedding_KaLM_embedding_multilingual_mini_instruct_v2_5 = ModelMeta(
898
902
  release_date="2025-09-30",
899
903
  languages=["eng-Latn", "zho-Hans"],
900
904
  n_parameters=494032768,
905
+ n_embedding_parameters=136_134_656,
901
906
  memory_usage_mb=1885,
902
907
  max_tokens=512,
903
908
  embed_dim=896,
@@ -948,6 +953,7 @@ KaLM_Embedding_gemma_3_12b_2511 = ModelMeta(
948
953
  open_weights=True,
949
954
  release_date="2025-11-06",
950
955
  n_parameters=11.76 * 1e9,
956
+ n_embedding_parameters=None,
951
957
  memory_usage_mb=44884,
952
958
  max_tokens=32768,
953
959
  embed_dim=3840,
@@ -10,6 +10,7 @@ sbert_swedish = ModelMeta(
10
10
  revision="6b5e83cd29c03729cfdc33d13b1423399b0efb5c",
11
11
  release_date="2023-01-11",
12
12
  n_parameters=124690944,
13
+ n_embedding_parameters=38_649_600,
13
14
  memory_usage_mb=476,
14
15
  embed_dim=768,
15
16
  license="apache-2.0",
@@ -12,6 +12,7 @@ dfm_enc_large = ModelMeta(
12
12
  revision="132c53391e7a780dc6a2f9a03724d0158fe7122c",
13
13
  release_date="2023-07-12",
14
14
  n_parameters=355087360,
15
+ n_embedding_parameters=51_200_000,
15
16
  memory_usage_mb=1554,
16
17
  embed_dim=1024,
17
18
  license="mit",
@@ -47,6 +48,7 @@ dfm_enc_med = ModelMeta(
47
48
  revision="701bce95d499fa97610d57e8823c54fd1fb79930",
48
49
  release_date="2023-07-12",
49
50
  n_parameters=124445952,
51
+ n_embedding_parameters=38_403_840,
50
52
  memory_usage_mb=475,
51
53
  embed_dim=768,
52
54
  license="mit",
@@ -10,6 +10,7 @@ xlmr_scandi = ModelMeta(
10
10
  revision="d40c10ca7b1e68b5a8372f2d112dac9eb3279df1",
11
11
  release_date="2022-02-22",
12
12
  n_parameters=278043648,
13
+ n_embedding_parameters=192_001_536,
13
14
  memory_usage_mb=1061,
14
15
  embed_dim=768,
15
16
  license="not specified",
@@ -9,6 +9,7 @@ kowshik24_bangla_embedding_model = ModelMeta(
9
9
  revision="6689c21e69be5950596bad084457cbaa138728d8",
10
10
  release_date="2025-11-10",
11
11
  n_parameters=278_000_000,
12
+ n_embedding_parameters=192_001_536,
12
13
  memory_usage_mb=1061,
13
14
  embed_dim=768,
14
15
  license="apache-2.0",
@@ -18,6 +18,7 @@ lens_d4000 = ModelMeta(
18
18
  revision="e473b33364e6c48a324796fd1411d3b93670c6fe",
19
19
  release_date="2025-01-17",
20
20
  n_parameters=int(7.11 * 1e9),
21
+ n_embedding_parameters=131_084_288,
21
22
  memory_usage_mb=27125,
22
23
  embed_dim=4000,
23
24
  license="apache-2.0",
@@ -41,6 +42,7 @@ lens_d8000 = ModelMeta(
41
42
  revision="a0b87bd91cb27b6f2f0b0fe22c28026da1d464ef",
42
43
  release_date="2025-01-17",
43
44
  n_parameters=int(7.11 * 1e9),
45
+ n_embedding_parameters=131_084_288,
44
46
  memory_usage_mb=27125,
45
47
  embed_dim=8000,
46
48
  license="apache-2.0",
@@ -52,6 +52,7 @@ lgai_embedding_en = ModelMeta(
52
52
  revision="5e0b2316acc8c2e2941ded6b9cb200b1cb313e65",
53
53
  release_date="2025-06-11",
54
54
  n_parameters=7_110_000_000,
55
+ n_embedding_parameters=131_084_288,
55
56
  memory_usage_mb=27125,
56
57
  embed_dim=4096,
57
58
  license="apache-2.0",
@@ -43,6 +43,7 @@ Linq_Embed_Mistral = ModelMeta(
43
43
  revision="0c1a0b0589177079acc552433cad51d7c9132379",
44
44
  release_date="2024-05-29", # initial commit of hf model.
45
45
  n_parameters=7_110_000_000,
46
+ n_embedding_parameters=None,
46
47
  memory_usage_mb=13563,
47
48
  embed_dim=4096,
48
49
  license="cc-by-nc-4.0",
@@ -123,6 +123,7 @@ listconranker = ModelMeta(
123
123
  revision="95ae6a5f422a916bc36520f0f3e198e7d91520a0",
124
124
  release_date="2024-12-11",
125
125
  n_parameters=401_000_000,
126
+ n_embedding_parameters=None,
126
127
  memory_usage_mb=1242,
127
128
  similarity_fn_name="cosine",
128
129
  training_datasets=listconranker_training_datasets,
@@ -194,6 +194,7 @@ llm2clip_openai_l_14_336 = ModelMeta(
194
194
  release_date="2024-11-07",
195
195
  modalities=["image", "text"],
196
196
  n_parameters=579_000_000,
197
+ n_embedding_parameters=None,
197
198
  memory_usage_mb=None,
198
199
  max_tokens=None,
199
200
  embed_dim=1280,
@@ -219,6 +220,7 @@ llm2clip_openai_l_14_224 = ModelMeta(
219
220
  release_date="2024-11-07",
220
221
  modalities=["image", "text"],
221
222
  n_parameters=578_000_000,
223
+ n_embedding_parameters=None,
222
224
  memory_usage_mb=None,
223
225
  max_tokens=None,
224
226
  embed_dim=1280,
@@ -243,6 +245,7 @@ llm2clip_openai_b_16 = ModelMeta(
243
245
  release_date="2024-11-07",
244
246
  modalities=["image", "text"],
245
247
  n_parameters=361_000_000,
248
+ n_embedding_parameters=None,
246
249
  memory_usage_mb=None,
247
250
  max_tokens=None,
248
251
  embed_dim=1280,
@@ -145,6 +145,7 @@ llm2vec_llama3_8b_supervised = ModelMeta(
145
145
  # TODO: Not sure what to put here as a model is made of two peft repos, each with a different revision
146
146
  release_date="2024-04-09",
147
147
  n_parameters=7_505_000_000,
148
+ n_embedding_parameters=None,
148
149
  memory_usage_mb=28629,
149
150
  max_tokens=8192,
150
151
  embed_dim=4096,
@@ -174,6 +175,7 @@ llm2vec_llama3_8b_unsupervised = ModelMeta(
174
175
  revision="1cb7b735326d13a8541db8f57f35da5373f5e9c6",
175
176
  release_date="2024-04-09",
176
177
  n_parameters=7_505_000_000,
178
+ n_embedding_parameters=None,
177
179
  memory_usage_mb=28629,
178
180
  max_tokens=8192,
179
181
  embed_dim=4096,
@@ -203,6 +205,7 @@ llm2vec_mistral7b_supervised = ModelMeta(
203
205
  revision="0ae69bdd5816105778b971c3138e8f8a18eaa3ae",
204
206
  release_date="2024-04-09",
205
207
  n_parameters=7_111_000_000,
208
+ n_embedding_parameters=131_072_000,
206
209
  memory_usage_mb=27126,
207
210
  max_tokens=32768,
208
211
  embed_dim=4096,
@@ -232,6 +235,7 @@ llm2vec_mistral7b_unsupervised = ModelMeta(
232
235
  revision="2c055a5d77126c0d3dc6cd8ffa30e2908f4f45f8",
233
236
  release_date="2024-04-09",
234
237
  n_parameters=7_111_000_000,
238
+ n_embedding_parameters=131_072_000,
235
239
  memory_usage_mb=27126,
236
240
  max_tokens=32768,
237
241
  embed_dim=4096,
@@ -261,6 +265,7 @@ llm2vec_llama2_7b_supervised = ModelMeta(
261
265
  revision="2c055a5d77126c0d3dc6cd8ffa30e2908f4f45f8",
262
266
  release_date="2024-04-09",
263
267
  n_parameters=7_111_000_000,
268
+ n_embedding_parameters=None,
264
269
  memory_usage_mb=27126,
265
270
  max_tokens=32768,
266
271
  embed_dim=4096,
@@ -290,6 +295,7 @@ llm2vec_llama2_7b_unsupervised = ModelMeta(
290
295
  revision="a76944871d169ebe7c97eb921764cd063afed785",
291
296
  release_date="2024-04-09",
292
297
  n_parameters=7_111_000_000,
298
+ n_embedding_parameters=None,
293
299
  memory_usage_mb=27126,
294
300
  max_tokens=32768,
295
301
  embed_dim=4096,
@@ -319,6 +325,7 @@ llm2vec_sheared_llama_supervised = ModelMeta(
319
325
  revision="a5943d406c6b016fef3f07906aac183cf1a0b47d",
320
326
  release_date="2024-04-09",
321
327
  n_parameters=7_111_000_000,
328
+ n_embedding_parameters=65_536_000,
322
329
  memory_usage_mb=27126,
323
330
  max_tokens=32768,
324
331
  embed_dim=4096,
@@ -348,6 +355,7 @@ llm2vec_sheared_llama_unsupervised = ModelMeta(
348
355
  revision="a5943d406c6b016fef3f07906aac183cf1a0b47d",
349
356
  release_date="2024-04-09",
350
357
  n_parameters=7_111_000_000,
358
+ n_embedding_parameters=65_536_000,
351
359
  memory_usage_mb=27126,
352
360
  max_tokens=32768,
353
361
  embed_dim=4096,
@@ -358,6 +358,7 @@ hakim = ModelMeta(
358
358
  revision="1",
359
359
  release_date="2025-05-10",
360
360
  n_parameters=124_441_344,
361
+ n_embedding_parameters=None,
361
362
  memory_usage_mb=475,
362
363
  embed_dim=768,
363
364
  license="not specified",
@@ -426,6 +427,7 @@ hakim_small = ModelMeta(
426
427
  revision="1",
427
428
  release_date="2025-05-10",
428
429
  n_parameters=38_736_384,
430
+ n_embedding_parameters=None,
429
431
  memory_usage_mb=148,
430
432
  embed_dim=512,
431
433
  license="not specified",
@@ -493,6 +495,7 @@ hakim_unsup = ModelMeta(
493
495
  revision="1",
494
496
  release_date="2025-05-10",
495
497
  n_parameters=124_441_344,
498
+ n_embedding_parameters=None,
496
499
  memory_usage_mb=475,
497
500
  embed_dim=768,
498
501
  license="not specified",
@@ -45,6 +45,7 @@ mdbr_leaf_ir = ModelMeta(
45
45
  "Transformers",
46
46
  ],
47
47
  n_parameters=22_861_056,
48
+ n_embedding_parameters=11_720_448,
48
49
  memory_usage_mb=86,
49
50
  max_tokens=512,
50
51
  embed_dim=768,
@@ -79,6 +80,7 @@ mdbr_leaf_mt = ModelMeta(
79
80
  "Transformers",
80
81
  ],
81
82
  n_parameters=22_958_592,
83
+ n_embedding_parameters=11_720_448,
82
84
  memory_usage_mb=86,
83
85
  max_tokens=512,
84
86
  embed_dim=1024,