mteb 2.7.3__py3-none-any.whl → 2.7.4__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- mteb/abstasks/retrieval.py +1 -1
- mteb/benchmarks/benchmarks/__init__.py +2 -0
- mteb/benchmarks/benchmarks/benchmarks.py +41 -2
- mteb/descriptive_stats/Retrieval/BrightAopsRetrieval.json +35 -0
- mteb/descriptive_stats/Retrieval/BrightBiologyLongRetrieval.json +35 -0
- mteb/descriptive_stats/Retrieval/BrightBiologyRetrieval.json +35 -0
- mteb/descriptive_stats/Retrieval/BrightEarthScienceLongRetrieval.json +35 -0
- mteb/descriptive_stats/Retrieval/BrightEarthScienceRetrieval.json +35 -0
- mteb/descriptive_stats/Retrieval/BrightEconomicsLongRetrieval.json +35 -0
- mteb/descriptive_stats/Retrieval/BrightEconomicsRetrieval.json +35 -0
- mteb/descriptive_stats/Retrieval/BrightLeetcodeRetrieval.json +35 -0
- mteb/descriptive_stats/Retrieval/BrightPonyLongRetrieval.json +35 -0
- mteb/descriptive_stats/Retrieval/BrightPonyRetrieval.json +35 -0
- mteb/descriptive_stats/Retrieval/BrightPsychologyLongRetrieval.json +35 -0
- mteb/descriptive_stats/Retrieval/BrightPsychologyRetrieval.json +35 -0
- mteb/descriptive_stats/Retrieval/BrightRoboticsLongRetrieval.json +35 -0
- mteb/descriptive_stats/Retrieval/BrightRoboticsRetrieval.json +35 -0
- mteb/descriptive_stats/Retrieval/BrightStackoverflowLongRetrieval.json +35 -0
- mteb/descriptive_stats/Retrieval/BrightStackoverflowRetrieval.json +35 -0
- mteb/descriptive_stats/Retrieval/BrightSustainableLivingLongRetrieval.json +35 -0
- mteb/descriptive_stats/Retrieval/BrightSustainableLivingRetrieval.json +35 -0
- mteb/descriptive_stats/Retrieval/BrightTheoremQAQuestionsRetrieval.json +35 -0
- mteb/descriptive_stats/Retrieval/BrightTheoremQATheoremsRetrieval.json +35 -0
- mteb/models/model_implementations/align_models.py +1 -0
- mteb/models/model_implementations/amazon_models.py +1 -0
- mteb/models/model_implementations/andersborges.py +2 -0
- mteb/models/model_implementations/ara_models.py +1 -0
- mteb/models/model_implementations/arctic_models.py +8 -0
- mteb/models/model_implementations/b1ade_models.py +1 -0
- mteb/models/model_implementations/bedrock_models.py +4 -0
- mteb/models/model_implementations/bge_models.py +40 -1
- mteb/models/model_implementations/bica_model.py +1 -0
- mteb/models/model_implementations/blip2_models.py +2 -0
- mteb/models/model_implementations/blip_models.py +8 -0
- mteb/models/model_implementations/bm25.py +8 -5
- mteb/models/model_implementations/bmretriever_models.py +4 -0
- mteb/models/model_implementations/cadet_models.py +1 -0
- mteb/models/model_implementations/cde_models.py +2 -0
- mteb/models/model_implementations/clip_models.py +3 -0
- mteb/models/model_implementations/clips_models.py +3 -0
- mteb/models/model_implementations/codefuse_models.py +5 -0
- mteb/models/model_implementations/codesage_models.py +3 -0
- mteb/models/model_implementations/cohere_models.py +4 -0
- mteb/models/model_implementations/cohere_v.py +5 -0
- mteb/models/model_implementations/colpali_models.py +3 -0
- mteb/models/model_implementations/colqwen_models.py +7 -0
- mteb/models/model_implementations/colsmol_models.py +2 -0
- mteb/models/model_implementations/conan_models.py +1 -0
- mteb/models/model_implementations/dino_models.py +19 -0
- mteb/models/model_implementations/e5_instruct.py +4 -0
- mteb/models/model_implementations/e5_models.py +9 -0
- mteb/models/model_implementations/e5_v.py +1 -0
- mteb/models/model_implementations/eagerworks_models.py +1 -0
- mteb/models/model_implementations/emillykkejensen_models.py +3 -0
- mteb/models/model_implementations/en_code_retriever.py +1 -0
- mteb/models/model_implementations/euler_models.py +1 -0
- mteb/models/model_implementations/evaclip_models.py +4 -0
- mteb/models/model_implementations/fa_models.py +9 -0
- mteb/models/model_implementations/facebookai.py +2 -0
- mteb/models/model_implementations/geogpt_models.py +1 -0
- mteb/models/model_implementations/gme_v_models.py +2 -0
- mteb/models/model_implementations/google_models.py +5 -0
- mteb/models/model_implementations/granite_vision_embedding_models.py +1 -0
- mteb/models/model_implementations/gritlm_models.py +2 -0
- mteb/models/model_implementations/gte_models.py +9 -0
- mteb/models/model_implementations/hinvec_models.py +1 -0
- mteb/models/model_implementations/human.py +1 -0
- mteb/models/model_implementations/ibm_granite_models.py +6 -0
- mteb/models/model_implementations/inf_models.py +2 -0
- mteb/models/model_implementations/jasper_models.py +2 -0
- mteb/models/model_implementations/jina_clip.py +1 -0
- mteb/models/model_implementations/jina_models.py +7 -0
- mteb/models/model_implementations/kalm_models.py +6 -0
- mteb/models/model_implementations/kblab.py +1 -0
- mteb/models/model_implementations/kennethenevoldsen_models.py +2 -0
- mteb/models/model_implementations/kfst.py +1 -0
- mteb/models/model_implementations/kowshik24_models.py +1 -0
- mteb/models/model_implementations/lens_models.py +2 -0
- mteb/models/model_implementations/lgai_embedding_models.py +1 -0
- mteb/models/model_implementations/linq_models.py +1 -0
- mteb/models/model_implementations/listconranker.py +1 -0
- mteb/models/model_implementations/llm2clip_models.py +3 -0
- mteb/models/model_implementations/llm2vec_models.py +8 -0
- mteb/models/model_implementations/mcinext_models.py +3 -0
- mteb/models/model_implementations/mdbr_models.py +2 -0
- mteb/models/model_implementations/misc_models.py +63 -0
- mteb/models/model_implementations/mixedbread_ai_models.py +3 -0
- mteb/models/model_implementations/mme5_models.py +2 -1
- mteb/models/model_implementations/moco_models.py +2 -0
- mteb/models/model_implementations/mod_models.py +1 -0
- mteb/models/model_implementations/model2vec_models.py +13 -0
- mteb/models/model_implementations/moka_models.py +3 -0
- mteb/models/model_implementations/nbailab.py +3 -0
- mteb/models/model_implementations/no_instruct_sentence_models.py +1 -0
- mteb/models/model_implementations/nomic_models.py +6 -0
- mteb/models/model_implementations/nomic_models_vision.py +1 -0
- mteb/models/model_implementations/nvidia_llama_nemoretriever_colemb.py +2 -0
- mteb/models/model_implementations/nvidia_models.py +3 -0
- mteb/models/model_implementations/octen_models.py +2 -0
- mteb/models/model_implementations/openai_models.py +5 -0
- mteb/models/model_implementations/openclip_models.py +8 -0
- mteb/models/model_implementations/opensearch_neural_sparse_models.py +5 -0
- mteb/models/model_implementations/ops_moa_models.py +2 -0
- mteb/models/model_implementations/ordalietech_solon_embeddings_mini_beta_1_1.py +1 -0
- mteb/models/model_implementations/pawan_models.py +1 -0
- mteb/models/model_implementations/piccolo_models.py +2 -0
- mteb/models/model_implementations/promptriever_models.py +4 -0
- mteb/models/model_implementations/pylate_models.py +3 -0
- mteb/models/model_implementations/qodo_models.py +2 -0
- mteb/models/model_implementations/qtack_models.py +1 -0
- mteb/models/model_implementations/qwen3_models.py +3 -0
- mteb/models/model_implementations/qzhou_models.py +2 -0
- mteb/models/model_implementations/rasgaard_models.py +1 -0
- mteb/models/model_implementations/reasonir_model.py +65 -0
- mteb/models/model_implementations/repllama_models.py +2 -0
- mteb/models/model_implementations/rerankers_custom.py +3 -0
- mteb/models/model_implementations/rerankers_monot5_based.py +14 -0
- mteb/models/model_implementations/richinfoai_models.py +1 -0
- mteb/models/model_implementations/ru_sentence_models.py +20 -0
- mteb/models/model_implementations/ruri_models.py +10 -0
- mteb/models/model_implementations/salesforce_models.py +3 -0
- mteb/models/model_implementations/samilpwc_models.py +1 -0
- mteb/models/model_implementations/sarashina_embedding_models.py +2 -0
- mteb/models/model_implementations/searchmap_models.py +1 -0
- mteb/models/model_implementations/seed_1_6_embedding_models.py +1 -0
- mteb/models/model_implementations/seed_1_6_embedding_models_1215.py +1 -0
- mteb/models/model_implementations/seed_models.py +1 -0
- mteb/models/model_implementations/sentence_transformers_models.py +18 -0
- mteb/models/model_implementations/shuu_model.py +1 -0
- mteb/models/model_implementations/siglip_models.py +10 -0
- mteb/models/model_implementations/sonar_models.py +2 -1
- mteb/models/model_implementations/spartan8806_atles_champion.py +1 -0
- mteb/models/model_implementations/stella_models.py +6 -0
- mteb/models/model_implementations/tarka_models.py +2 -0
- mteb/models/model_implementations/text2vec_models.py +3 -0
- mteb/models/model_implementations/ua_sentence_models.py +1 -0
- mteb/models/model_implementations/uae_models.py +1 -0
- mteb/models/model_implementations/vdr_models.py +1 -0
- mteb/models/model_implementations/vi_vn_models.py +6 -0
- mteb/models/model_implementations/vista_models.py +2 -0
- mteb/models/model_implementations/vlm2vec_models.py +2 -0
- mteb/models/model_implementations/voyage_models.py +15 -0
- mteb/models/model_implementations/voyage_v.py +1 -0
- mteb/models/model_implementations/xyz_models.py +1 -0
- mteb/models/model_implementations/youtu_models.py +1 -0
- mteb/models/model_implementations/yuan_models.py +1 -0
- mteb/models/model_implementations/yuan_models_en.py +1 -0
- mteb/models/model_meta.py +35 -2
- mteb/tasks/retrieval/eng/__init__.py +42 -0
- mteb/tasks/retrieval/eng/bright_retrieval.py +9 -1
- mteb/tasks/retrieval/eng/bright_v1_1_retrieval.py +968 -0
- {mteb-2.7.3.dist-info → mteb-2.7.4.dist-info}/METADATA +1 -1
- {mteb-2.7.3.dist-info → mteb-2.7.4.dist-info}/RECORD +157 -136
- {mteb-2.7.3.dist-info → mteb-2.7.4.dist-info}/WHEEL +0 -0
- {mteb-2.7.3.dist-info → mteb-2.7.4.dist-info}/entry_points.txt +0 -0
- {mteb-2.7.3.dist-info → mteb-2.7.4.dist-info}/licenses/LICENSE +0 -0
- {mteb-2.7.3.dist-info → mteb-2.7.4.dist-info}/top_level.txt +0 -0
|
@@ -356,6 +356,7 @@ gme_qwen2vl_2b = ModelMeta(
|
|
|
356
356
|
release_date="2024-12-24",
|
|
357
357
|
modalities=["image", "text"],
|
|
358
358
|
n_parameters=2_210_000_000,
|
|
359
|
+
n_embedding_parameters=233_373_696,
|
|
359
360
|
memory_usage_mb=8427,
|
|
360
361
|
embed_dim=1536,
|
|
361
362
|
license="apache-2.0",
|
|
@@ -380,6 +381,7 @@ gme_qwen2vl_7b = ModelMeta(
|
|
|
380
381
|
release_date="2024-12-24",
|
|
381
382
|
modalities=["image", "text"],
|
|
382
383
|
n_parameters=8_290_000_000,
|
|
384
|
+
n_embedding_parameters=544_997_376,
|
|
383
385
|
memory_usage_mb=31629,
|
|
384
386
|
embed_dim=3584,
|
|
385
387
|
license="apache-2.0",
|
|
@@ -162,6 +162,7 @@ google_text_emb_004 = ModelMeta(
|
|
|
162
162
|
revision="1", # revision is intended for implementation
|
|
163
163
|
release_date="2024-05-14",
|
|
164
164
|
n_parameters=None,
|
|
165
|
+
n_embedding_parameters=None,
|
|
165
166
|
memory_usage_mb=None,
|
|
166
167
|
max_tokens=2048,
|
|
167
168
|
embed_dim=768,
|
|
@@ -187,6 +188,7 @@ google_text_emb_005 = ModelMeta(
|
|
|
187
188
|
revision="1", # revision is intended for implementation
|
|
188
189
|
release_date="2024-11-18",
|
|
189
190
|
n_parameters=None,
|
|
191
|
+
n_embedding_parameters=None,
|
|
190
192
|
memory_usage_mb=None,
|
|
191
193
|
max_tokens=2048,
|
|
192
194
|
embed_dim=768,
|
|
@@ -212,6 +214,7 @@ google_text_multilingual_emb_002 = ModelMeta(
|
|
|
212
214
|
revision="1",
|
|
213
215
|
release_date="2024-05-14",
|
|
214
216
|
n_parameters=None,
|
|
217
|
+
n_embedding_parameters=None,
|
|
215
218
|
memory_usage_mb=None,
|
|
216
219
|
max_tokens=2048,
|
|
217
220
|
embed_dim=768,
|
|
@@ -237,6 +240,7 @@ google_gemini_embedding_001 = ModelMeta(
|
|
|
237
240
|
revision="1",
|
|
238
241
|
release_date="2025-03-07",
|
|
239
242
|
n_parameters=None,
|
|
243
|
+
n_embedding_parameters=None,
|
|
240
244
|
memory_usage_mb=None,
|
|
241
245
|
max_tokens=2048,
|
|
242
246
|
embed_dim=3072,
|
|
@@ -272,6 +276,7 @@ embedding_gemma_300m = ModelMeta(
|
|
|
272
276
|
revision="64614b0b8b64f0c6c1e52b07e4e9a4e8fe4d2da2",
|
|
273
277
|
release_date="2025-09-04",
|
|
274
278
|
n_parameters=307_581_696,
|
|
279
|
+
n_embedding_parameters=201_326_592,
|
|
275
280
|
embed_dim=768,
|
|
276
281
|
max_tokens=2048,
|
|
277
282
|
license="gemma",
|
|
@@ -44,6 +44,7 @@ gritlm7b = ModelMeta(
|
|
|
44
44
|
revision="13f00a0e36500c80ce12870ea513846a066004af",
|
|
45
45
|
release_date="2024-02-15",
|
|
46
46
|
n_parameters=7_240_000_000,
|
|
47
|
+
n_embedding_parameters=131_072_000,
|
|
47
48
|
memory_usage_mb=13813,
|
|
48
49
|
embed_dim=4096,
|
|
49
50
|
license="apache-2.0",
|
|
@@ -73,6 +74,7 @@ gritlm8x7b = ModelMeta(
|
|
|
73
74
|
revision="7f089b13e3345510281733ca1e6ff871b5b4bc76",
|
|
74
75
|
release_date="2024-02-15",
|
|
75
76
|
n_parameters=57_920_000_000,
|
|
77
|
+
n_embedding_parameters=None,
|
|
76
78
|
memory_usage_mb=89079,
|
|
77
79
|
embed_dim=32768,
|
|
78
80
|
license="apache-2.0",
|
|
@@ -48,6 +48,7 @@ gte_qwen2_7b_instruct = ModelMeta(
|
|
|
48
48
|
revision="e26182b2122f4435e8b3ebecbf363990f409b45b",
|
|
49
49
|
release_date="2024-06-15", # initial commit of hf model.
|
|
50
50
|
n_parameters=7_613_000_000,
|
|
51
|
+
n_embedding_parameters=543_499_264,
|
|
51
52
|
memory_usage_mb=29040,
|
|
52
53
|
embed_dim=3584,
|
|
53
54
|
license="apache-2.0",
|
|
@@ -80,6 +81,7 @@ gte_qwen1_5_7b_instruct = ModelMeta(
|
|
|
80
81
|
revision="07d27e5226328010336563bc1b564a5e3436a298",
|
|
81
82
|
release_date="2024-04-20", # initial commit of hf model.
|
|
82
83
|
n_parameters=7_720_000_000,
|
|
84
|
+
n_embedding_parameters=None,
|
|
83
85
|
memory_usage_mb=29449,
|
|
84
86
|
embed_dim=4096,
|
|
85
87
|
license="apache-2.0",
|
|
@@ -117,6 +119,7 @@ gte_qwen2_1_5b_instruct = ModelMeta(
|
|
|
117
119
|
revision="c6c1b92f4a3e1b92b326ad29dd3c8433457df8dd",
|
|
118
120
|
release_date="2024-07-29", # initial commit of hf model.
|
|
119
121
|
n_parameters=1_780_000_000,
|
|
122
|
+
n_embedding_parameters=232_928_256,
|
|
120
123
|
memory_usage_mb=6776,
|
|
121
124
|
embed_dim=8960,
|
|
122
125
|
license="apache-2.0",
|
|
@@ -145,6 +148,7 @@ gte_small_zh = ModelMeta(
|
|
|
145
148
|
revision="af7bd46fbb00b3a6963c8dd7f1786ddfbfbe973a",
|
|
146
149
|
release_date="2023-11-08", # initial commit of hf model.
|
|
147
150
|
n_parameters=int(30.3 * 1e6),
|
|
151
|
+
n_embedding_parameters=10_817_536,
|
|
148
152
|
memory_usage_mb=58,
|
|
149
153
|
embed_dim=1024,
|
|
150
154
|
license="mit",
|
|
@@ -173,6 +177,7 @@ gte_base_zh = ModelMeta(
|
|
|
173
177
|
revision="71ab7947d6fac5b64aa299e6e40e6c2b2e85976c",
|
|
174
178
|
release_date="2023-11-08", # initial commit of hf model.
|
|
175
179
|
n_parameters=int(102 * 1e6),
|
|
180
|
+
n_embedding_parameters=16_226_304,
|
|
176
181
|
memory_usage_mb=195,
|
|
177
182
|
embed_dim=1024,
|
|
178
183
|
license="mit",
|
|
@@ -201,6 +206,7 @@ gte_large_zh = ModelMeta(
|
|
|
201
206
|
revision="64c364e579de308104a9b2c170ca009502f4f545",
|
|
202
207
|
release_date="2023-11-08", # initial commit of hf model.
|
|
203
208
|
n_parameters=int(326 * 1e6),
|
|
209
|
+
n_embedding_parameters=21_635_072,
|
|
204
210
|
memory_usage_mb=621,
|
|
205
211
|
embed_dim=1024,
|
|
206
212
|
license="mit",
|
|
@@ -330,6 +336,7 @@ gte_multilingual_base = ModelMeta(
|
|
|
330
336
|
revision="ca1791e0bcc104f6db161f27de1340241b13c5a4",
|
|
331
337
|
release_date="2024-07-20", # initial commit of hf model.
|
|
332
338
|
n_parameters=int(305 * 1e6),
|
|
339
|
+
n_embedding_parameters=192_036_864,
|
|
333
340
|
memory_usage_mb=582,
|
|
334
341
|
embed_dim=768,
|
|
335
342
|
license="apache-2.0",
|
|
@@ -359,6 +366,7 @@ gte_modernbert_base = ModelMeta(
|
|
|
359
366
|
revision="7ca8b4ca700621b67618669f5378fe5f5820b8e4",
|
|
360
367
|
release_date="2025-01-21", # initial commit of hf model.
|
|
361
368
|
n_parameters=int(149 * 1e6),
|
|
369
|
+
n_embedding_parameters=None,
|
|
362
370
|
memory_usage_mb=284,
|
|
363
371
|
embed_dim=768,
|
|
364
372
|
license="apache-2.0",
|
|
@@ -402,6 +410,7 @@ gte_base_en_v15 = ModelMeta(
|
|
|
402
410
|
revision="a829fd0e060bb84554da0dfd354d0de0f7712b7f", # can be any
|
|
403
411
|
release_date="2024-06-20", # initial commit of hf model
|
|
404
412
|
n_parameters=137_000_000,
|
|
413
|
+
n_embedding_parameters=23_445_504,
|
|
405
414
|
memory_usage_mb=None,
|
|
406
415
|
embed_dim=768,
|
|
407
416
|
license="apache-2.0",
|
|
@@ -100,6 +100,7 @@ granite_107m_multilingual = ModelMeta(
|
|
|
100
100
|
revision="47db56afe692f731540413c67dd818ff492277e7",
|
|
101
101
|
release_date="2024-12-18",
|
|
102
102
|
n_parameters=107_000_000,
|
|
103
|
+
n_embedding_parameters=96_000_768,
|
|
103
104
|
memory_usage_mb=204,
|
|
104
105
|
embed_dim=384,
|
|
105
106
|
license="apache-2.0",
|
|
@@ -131,6 +132,7 @@ granite_278m_multilingual = ModelMeta(
|
|
|
131
132
|
revision="84e3546b88b0cb69f8078608a1df558020bcbf1f",
|
|
132
133
|
release_date="2024-12-18",
|
|
133
134
|
n_parameters=278_000_000,
|
|
135
|
+
n_embedding_parameters=192_001_536,
|
|
134
136
|
memory_usage_mb=530,
|
|
135
137
|
embed_dim=768,
|
|
136
138
|
license="apache-2.0",
|
|
@@ -162,6 +164,7 @@ granite_30m_english = ModelMeta(
|
|
|
162
164
|
revision="eddbb57470f896b5f8e2bfcb823d8f0e2d2024a5",
|
|
163
165
|
release_date="2024-12-18",
|
|
164
166
|
n_parameters=30_000_000,
|
|
167
|
+
n_embedding_parameters=19_301_760,
|
|
165
168
|
memory_usage_mb=58,
|
|
166
169
|
embed_dim=384,
|
|
167
170
|
license="apache-2.0",
|
|
@@ -193,6 +196,7 @@ granite_125m_english = ModelMeta(
|
|
|
193
196
|
revision="e48d3a5b47eaa18e3fe07d4676e187fd80f32730",
|
|
194
197
|
release_date="2024-12-18",
|
|
195
198
|
n_parameters=125_000_000,
|
|
199
|
+
n_embedding_parameters=38_603_520,
|
|
196
200
|
memory_usage_mb=238,
|
|
197
201
|
embed_dim=768,
|
|
198
202
|
license="apache-2.0",
|
|
@@ -225,6 +229,7 @@ granite_english_r2 = ModelMeta(
|
|
|
225
229
|
revision="6e7b8ce0e76270394ac4669ba4bbd7133b60b7f9",
|
|
226
230
|
release_date="2025-08-15",
|
|
227
231
|
n_parameters=149_000_000,
|
|
232
|
+
n_embedding_parameters=None,
|
|
228
233
|
memory_usage_mb=284,
|
|
229
234
|
embed_dim=768,
|
|
230
235
|
license="apache-2.0",
|
|
@@ -250,6 +255,7 @@ granite_small_english_r2 = ModelMeta(
|
|
|
250
255
|
revision="54a8d2616a0844355a5164432d3f6dafb37b17a3",
|
|
251
256
|
release_date="2025-08-15",
|
|
252
257
|
n_parameters=47_000_000,
|
|
258
|
+
n_embedding_parameters=None,
|
|
253
259
|
memory_usage_mb=91,
|
|
254
260
|
embed_dim=384,
|
|
255
261
|
license="apache-2.0",
|
|
@@ -56,6 +56,7 @@ inf_retriever_v1 = ModelMeta(
|
|
|
56
56
|
revision="cb70ca7c31dfa866b2eff2dad229c144d8ddfd91",
|
|
57
57
|
release_date="2024-12-24", # initial commit of hf model.
|
|
58
58
|
n_parameters=7_069_121_024,
|
|
59
|
+
n_embedding_parameters=None,
|
|
59
60
|
memory_usage_mb=13483,
|
|
60
61
|
embed_dim=3584,
|
|
61
62
|
license="apache-2.0",
|
|
@@ -83,6 +84,7 @@ inf_retriever_v1_1_5b = ModelMeta(
|
|
|
83
84
|
revision="c9c05c2dd50707a486966ba81703021ae2094a06",
|
|
84
85
|
release_date="2025-02-08", # initial commit of hf model.
|
|
85
86
|
n_parameters=1_543_268_864,
|
|
87
|
+
n_embedding_parameters=232_928_256,
|
|
86
88
|
memory_usage_mb=2944,
|
|
87
89
|
embed_dim=1536,
|
|
88
90
|
license="apache-2.0",
|
|
@@ -299,6 +299,7 @@ jasper_en_v1 = ModelMeta(
|
|
|
299
299
|
revision="d6330ce98f8a0d741e781df845904c9484f00efa",
|
|
300
300
|
release_date="2024-12-11", # first commit
|
|
301
301
|
n_parameters=1_999_000_000,
|
|
302
|
+
n_embedding_parameters=232_932_864,
|
|
302
303
|
memory_usage_mb=3802,
|
|
303
304
|
max_tokens=131072,
|
|
304
305
|
embed_dim=8960,
|
|
@@ -346,6 +347,7 @@ Jasper_Token_Compression_600M = ModelMeta(
|
|
|
346
347
|
revision="06a100f753a5a96d9e583b3af79c6fcdfacc4719",
|
|
347
348
|
release_date="2025-11-14",
|
|
348
349
|
n_parameters=595776512,
|
|
350
|
+
n_embedding_parameters=None,
|
|
349
351
|
memory_usage_mb=2272,
|
|
350
352
|
embed_dim=2048,
|
|
351
353
|
license="mit",
|
|
@@ -733,6 +733,7 @@ jina_reranker_v3 = ModelMeta(
|
|
|
733
733
|
release_date="2025-09-18", # official release date
|
|
734
734
|
modalities=["text"],
|
|
735
735
|
n_parameters=int(0.6 * 1e9),
|
|
736
|
+
n_embedding_parameters=None,
|
|
736
737
|
memory_usage_mb=1138,
|
|
737
738
|
max_tokens=131072,
|
|
738
739
|
embed_dim=None,
|
|
@@ -776,6 +777,7 @@ jina_embeddings_v4 = ModelMeta(
|
|
|
776
777
|
release_date="2025-06-24", # official release date
|
|
777
778
|
modalities=["image", "text"],
|
|
778
779
|
n_parameters=int(3.8 * 1e9),
|
|
780
|
+
n_embedding_parameters=None,
|
|
779
781
|
memory_usage_mb=7500,
|
|
780
782
|
max_tokens=32768,
|
|
781
783
|
embed_dim=2048,
|
|
@@ -824,6 +826,7 @@ jina_embeddings_v3 = ModelMeta(
|
|
|
824
826
|
revision="215a6e121fa0183376388ac6b1ae230326bfeaed",
|
|
825
827
|
release_date="2024-09-18", # official release date
|
|
826
828
|
n_parameters=int(572 * 1e6),
|
|
829
|
+
n_embedding_parameters=None,
|
|
827
830
|
memory_usage_mb=1092,
|
|
828
831
|
max_tokens=8194,
|
|
829
832
|
embed_dim=1024,
|
|
@@ -884,6 +887,7 @@ jina_embeddings_v2_base_en = ModelMeta(
|
|
|
884
887
|
revision="6e85f575bc273f1fd840a658067d0157933c83f0",
|
|
885
888
|
release_date="2023-09-27",
|
|
886
889
|
n_parameters=137_000_000,
|
|
890
|
+
n_embedding_parameters=23_445_504,
|
|
887
891
|
memory_usage_mb=262,
|
|
888
892
|
embed_dim=768,
|
|
889
893
|
license="apache-2.0",
|
|
@@ -948,6 +952,7 @@ jina_embeddings_v2_small_en = ModelMeta(
|
|
|
948
952
|
revision="44e7d1d6caec8c883c2d4b207588504d519788d0",
|
|
949
953
|
release_date="2023-09-27",
|
|
950
954
|
n_parameters=32_700_000,
|
|
955
|
+
n_embedding_parameters=15_630_336,
|
|
951
956
|
memory_usage_mb=62,
|
|
952
957
|
embed_dim=512,
|
|
953
958
|
license="apache-2.0",
|
|
@@ -1009,6 +1014,7 @@ jina_embedding_b_en_v1 = ModelMeta(
|
|
|
1009
1014
|
revision="32aa658e5ceb90793454d22a57d8e3a14e699516",
|
|
1010
1015
|
release_date="2023-07-07",
|
|
1011
1016
|
n_parameters=110_000_000,
|
|
1017
|
+
n_embedding_parameters=24_674_304,
|
|
1012
1018
|
memory_usage_mb=420,
|
|
1013
1019
|
embed_dim=768,
|
|
1014
1020
|
license="apache-2.0",
|
|
@@ -1066,6 +1072,7 @@ jina_embedding_s_en_v1 = ModelMeta(
|
|
|
1066
1072
|
revision="5ac6cd473e2324c6d5f9e558a6a9f65abb57143e",
|
|
1067
1073
|
release_date="2023-07-07",
|
|
1068
1074
|
n_parameters=35_000_000,
|
|
1075
|
+
n_embedding_parameters=16_449_536,
|
|
1069
1076
|
memory_usage_mb=134,
|
|
1070
1077
|
embed_dim=512,
|
|
1071
1078
|
license="apache-2.0",
|
|
@@ -780,6 +780,7 @@ HIT_TMG__KaLM_embedding_multilingual_mini_instruct_v1 = ModelMeta(
|
|
|
780
780
|
release_date="2024-10-23",
|
|
781
781
|
languages=["eng-Latn", "zho-Hans"],
|
|
782
782
|
n_parameters=494032768,
|
|
783
|
+
n_embedding_parameters=136_134_656,
|
|
783
784
|
memory_usage_mb=1885,
|
|
784
785
|
max_tokens=512,
|
|
785
786
|
embed_dim=896,
|
|
@@ -805,6 +806,7 @@ HIT_TMG__KaLM_embedding_multilingual_mini_v1 = ModelMeta(
|
|
|
805
806
|
release_date="2024-08-27",
|
|
806
807
|
languages=["eng-Latn", "zho-Hans"],
|
|
807
808
|
n_parameters=494032768,
|
|
809
|
+
n_embedding_parameters=136_134_656,
|
|
808
810
|
memory_usage_mb=1885,
|
|
809
811
|
max_tokens=512,
|
|
810
812
|
embed_dim=896,
|
|
@@ -836,6 +838,7 @@ HIT_TMG__KaLM_embedding_multilingual_mini_instruct_v1_5 = ModelMeta(
|
|
|
836
838
|
release_date="2024-12-26",
|
|
837
839
|
languages=["eng-Latn", "zho-Hans"],
|
|
838
840
|
n_parameters=494032768,
|
|
841
|
+
n_embedding_parameters=136_134_656,
|
|
839
842
|
memory_usage_mb=1885,
|
|
840
843
|
max_tokens=512,
|
|
841
844
|
embed_dim=896,
|
|
@@ -867,6 +870,7 @@ HIT_TMG__KaLM_embedding_multilingual_mini_instruct_v2 = ModelMeta(
|
|
|
867
870
|
release_date="2025-06-25",
|
|
868
871
|
languages=["eng-Latn", "zho-Hans"],
|
|
869
872
|
n_parameters=494032768,
|
|
873
|
+
n_embedding_parameters=136_134_656,
|
|
870
874
|
memory_usage_mb=942,
|
|
871
875
|
max_tokens=512,
|
|
872
876
|
embed_dim=896,
|
|
@@ -898,6 +902,7 @@ KaLM_Embedding_KaLM_embedding_multilingual_mini_instruct_v2_5 = ModelMeta(
|
|
|
898
902
|
release_date="2025-09-30",
|
|
899
903
|
languages=["eng-Latn", "zho-Hans"],
|
|
900
904
|
n_parameters=494032768,
|
|
905
|
+
n_embedding_parameters=136_134_656,
|
|
901
906
|
memory_usage_mb=1885,
|
|
902
907
|
max_tokens=512,
|
|
903
908
|
embed_dim=896,
|
|
@@ -948,6 +953,7 @@ KaLM_Embedding_gemma_3_12b_2511 = ModelMeta(
|
|
|
948
953
|
open_weights=True,
|
|
949
954
|
release_date="2025-11-06",
|
|
950
955
|
n_parameters=11.76 * 1e9,
|
|
956
|
+
n_embedding_parameters=None,
|
|
951
957
|
memory_usage_mb=44884,
|
|
952
958
|
max_tokens=32768,
|
|
953
959
|
embed_dim=3840,
|
|
@@ -12,6 +12,7 @@ dfm_enc_large = ModelMeta(
|
|
|
12
12
|
revision="132c53391e7a780dc6a2f9a03724d0158fe7122c",
|
|
13
13
|
release_date="2023-07-12",
|
|
14
14
|
n_parameters=355087360,
|
|
15
|
+
n_embedding_parameters=51_200_000,
|
|
15
16
|
memory_usage_mb=1554,
|
|
16
17
|
embed_dim=1024,
|
|
17
18
|
license="mit",
|
|
@@ -47,6 +48,7 @@ dfm_enc_med = ModelMeta(
|
|
|
47
48
|
revision="701bce95d499fa97610d57e8823c54fd1fb79930",
|
|
48
49
|
release_date="2023-07-12",
|
|
49
50
|
n_parameters=124445952,
|
|
51
|
+
n_embedding_parameters=38_403_840,
|
|
50
52
|
memory_usage_mb=475,
|
|
51
53
|
embed_dim=768,
|
|
52
54
|
license="mit",
|
|
@@ -9,6 +9,7 @@ kowshik24_bangla_embedding_model = ModelMeta(
|
|
|
9
9
|
revision="6689c21e69be5950596bad084457cbaa138728d8",
|
|
10
10
|
release_date="2025-11-10",
|
|
11
11
|
n_parameters=278_000_000,
|
|
12
|
+
n_embedding_parameters=192_001_536,
|
|
12
13
|
memory_usage_mb=1061,
|
|
13
14
|
embed_dim=768,
|
|
14
15
|
license="apache-2.0",
|
|
@@ -18,6 +18,7 @@ lens_d4000 = ModelMeta(
|
|
|
18
18
|
revision="e473b33364e6c48a324796fd1411d3b93670c6fe",
|
|
19
19
|
release_date="2025-01-17",
|
|
20
20
|
n_parameters=int(7.11 * 1e9),
|
|
21
|
+
n_embedding_parameters=131_084_288,
|
|
21
22
|
memory_usage_mb=27125,
|
|
22
23
|
embed_dim=4000,
|
|
23
24
|
license="apache-2.0",
|
|
@@ -41,6 +42,7 @@ lens_d8000 = ModelMeta(
|
|
|
41
42
|
revision="a0b87bd91cb27b6f2f0b0fe22c28026da1d464ef",
|
|
42
43
|
release_date="2025-01-17",
|
|
43
44
|
n_parameters=int(7.11 * 1e9),
|
|
45
|
+
n_embedding_parameters=131_084_288,
|
|
44
46
|
memory_usage_mb=27125,
|
|
45
47
|
embed_dim=8000,
|
|
46
48
|
license="apache-2.0",
|
|
@@ -43,6 +43,7 @@ Linq_Embed_Mistral = ModelMeta(
|
|
|
43
43
|
revision="0c1a0b0589177079acc552433cad51d7c9132379",
|
|
44
44
|
release_date="2024-05-29", # initial commit of hf model.
|
|
45
45
|
n_parameters=7_110_000_000,
|
|
46
|
+
n_embedding_parameters=None,
|
|
46
47
|
memory_usage_mb=13563,
|
|
47
48
|
embed_dim=4096,
|
|
48
49
|
license="cc-by-nc-4.0",
|
|
@@ -123,6 +123,7 @@ listconranker = ModelMeta(
|
|
|
123
123
|
revision="95ae6a5f422a916bc36520f0f3e198e7d91520a0",
|
|
124
124
|
release_date="2024-12-11",
|
|
125
125
|
n_parameters=401_000_000,
|
|
126
|
+
n_embedding_parameters=None,
|
|
126
127
|
memory_usage_mb=1242,
|
|
127
128
|
similarity_fn_name="cosine",
|
|
128
129
|
training_datasets=listconranker_training_datasets,
|
|
@@ -194,6 +194,7 @@ llm2clip_openai_l_14_336 = ModelMeta(
|
|
|
194
194
|
release_date="2024-11-07",
|
|
195
195
|
modalities=["image", "text"],
|
|
196
196
|
n_parameters=579_000_000,
|
|
197
|
+
n_embedding_parameters=None,
|
|
197
198
|
memory_usage_mb=None,
|
|
198
199
|
max_tokens=None,
|
|
199
200
|
embed_dim=1280,
|
|
@@ -219,6 +220,7 @@ llm2clip_openai_l_14_224 = ModelMeta(
|
|
|
219
220
|
release_date="2024-11-07",
|
|
220
221
|
modalities=["image", "text"],
|
|
221
222
|
n_parameters=578_000_000,
|
|
223
|
+
n_embedding_parameters=None,
|
|
222
224
|
memory_usage_mb=None,
|
|
223
225
|
max_tokens=None,
|
|
224
226
|
embed_dim=1280,
|
|
@@ -243,6 +245,7 @@ llm2clip_openai_b_16 = ModelMeta(
|
|
|
243
245
|
release_date="2024-11-07",
|
|
244
246
|
modalities=["image", "text"],
|
|
245
247
|
n_parameters=361_000_000,
|
|
248
|
+
n_embedding_parameters=None,
|
|
246
249
|
memory_usage_mb=None,
|
|
247
250
|
max_tokens=None,
|
|
248
251
|
embed_dim=1280,
|
|
@@ -145,6 +145,7 @@ llm2vec_llama3_8b_supervised = ModelMeta(
|
|
|
145
145
|
# TODO: Not sure what to put here as a model is made of two peft repos, each with a different revision
|
|
146
146
|
release_date="2024-04-09",
|
|
147
147
|
n_parameters=7_505_000_000,
|
|
148
|
+
n_embedding_parameters=None,
|
|
148
149
|
memory_usage_mb=28629,
|
|
149
150
|
max_tokens=8192,
|
|
150
151
|
embed_dim=4096,
|
|
@@ -174,6 +175,7 @@ llm2vec_llama3_8b_unsupervised = ModelMeta(
|
|
|
174
175
|
revision="1cb7b735326d13a8541db8f57f35da5373f5e9c6",
|
|
175
176
|
release_date="2024-04-09",
|
|
176
177
|
n_parameters=7_505_000_000,
|
|
178
|
+
n_embedding_parameters=None,
|
|
177
179
|
memory_usage_mb=28629,
|
|
178
180
|
max_tokens=8192,
|
|
179
181
|
embed_dim=4096,
|
|
@@ -203,6 +205,7 @@ llm2vec_mistral7b_supervised = ModelMeta(
|
|
|
203
205
|
revision="0ae69bdd5816105778b971c3138e8f8a18eaa3ae",
|
|
204
206
|
release_date="2024-04-09",
|
|
205
207
|
n_parameters=7_111_000_000,
|
|
208
|
+
n_embedding_parameters=131_072_000,
|
|
206
209
|
memory_usage_mb=27126,
|
|
207
210
|
max_tokens=32768,
|
|
208
211
|
embed_dim=4096,
|
|
@@ -232,6 +235,7 @@ llm2vec_mistral7b_unsupervised = ModelMeta(
|
|
|
232
235
|
revision="2c055a5d77126c0d3dc6cd8ffa30e2908f4f45f8",
|
|
233
236
|
release_date="2024-04-09",
|
|
234
237
|
n_parameters=7_111_000_000,
|
|
238
|
+
n_embedding_parameters=131_072_000,
|
|
235
239
|
memory_usage_mb=27126,
|
|
236
240
|
max_tokens=32768,
|
|
237
241
|
embed_dim=4096,
|
|
@@ -261,6 +265,7 @@ llm2vec_llama2_7b_supervised = ModelMeta(
|
|
|
261
265
|
revision="2c055a5d77126c0d3dc6cd8ffa30e2908f4f45f8",
|
|
262
266
|
release_date="2024-04-09",
|
|
263
267
|
n_parameters=7_111_000_000,
|
|
268
|
+
n_embedding_parameters=None,
|
|
264
269
|
memory_usage_mb=27126,
|
|
265
270
|
max_tokens=32768,
|
|
266
271
|
embed_dim=4096,
|
|
@@ -290,6 +295,7 @@ llm2vec_llama2_7b_unsupervised = ModelMeta(
|
|
|
290
295
|
revision="a76944871d169ebe7c97eb921764cd063afed785",
|
|
291
296
|
release_date="2024-04-09",
|
|
292
297
|
n_parameters=7_111_000_000,
|
|
298
|
+
n_embedding_parameters=None,
|
|
293
299
|
memory_usage_mb=27126,
|
|
294
300
|
max_tokens=32768,
|
|
295
301
|
embed_dim=4096,
|
|
@@ -319,6 +325,7 @@ llm2vec_sheared_llama_supervised = ModelMeta(
|
|
|
319
325
|
revision="a5943d406c6b016fef3f07906aac183cf1a0b47d",
|
|
320
326
|
release_date="2024-04-09",
|
|
321
327
|
n_parameters=7_111_000_000,
|
|
328
|
+
n_embedding_parameters=65_536_000,
|
|
322
329
|
memory_usage_mb=27126,
|
|
323
330
|
max_tokens=32768,
|
|
324
331
|
embed_dim=4096,
|
|
@@ -348,6 +355,7 @@ llm2vec_sheared_llama_unsupervised = ModelMeta(
|
|
|
348
355
|
revision="a5943d406c6b016fef3f07906aac183cf1a0b47d",
|
|
349
356
|
release_date="2024-04-09",
|
|
350
357
|
n_parameters=7_111_000_000,
|
|
358
|
+
n_embedding_parameters=65_536_000,
|
|
351
359
|
memory_usage_mb=27126,
|
|
352
360
|
max_tokens=32768,
|
|
353
361
|
embed_dim=4096,
|
|
@@ -358,6 +358,7 @@ hakim = ModelMeta(
|
|
|
358
358
|
revision="1",
|
|
359
359
|
release_date="2025-05-10",
|
|
360
360
|
n_parameters=124_441_344,
|
|
361
|
+
n_embedding_parameters=None,
|
|
361
362
|
memory_usage_mb=475,
|
|
362
363
|
embed_dim=768,
|
|
363
364
|
license="not specified",
|
|
@@ -426,6 +427,7 @@ hakim_small = ModelMeta(
|
|
|
426
427
|
revision="1",
|
|
427
428
|
release_date="2025-05-10",
|
|
428
429
|
n_parameters=38_736_384,
|
|
430
|
+
n_embedding_parameters=None,
|
|
429
431
|
memory_usage_mb=148,
|
|
430
432
|
embed_dim=512,
|
|
431
433
|
license="not specified",
|
|
@@ -493,6 +495,7 @@ hakim_unsup = ModelMeta(
|
|
|
493
495
|
revision="1",
|
|
494
496
|
release_date="2025-05-10",
|
|
495
497
|
n_parameters=124_441_344,
|
|
498
|
+
n_embedding_parameters=None,
|
|
496
499
|
memory_usage_mb=475,
|
|
497
500
|
embed_dim=768,
|
|
498
501
|
license="not specified",
|
|
@@ -45,6 +45,7 @@ mdbr_leaf_ir = ModelMeta(
|
|
|
45
45
|
"Transformers",
|
|
46
46
|
],
|
|
47
47
|
n_parameters=22_861_056,
|
|
48
|
+
n_embedding_parameters=11_720_448,
|
|
48
49
|
memory_usage_mb=86,
|
|
49
50
|
max_tokens=512,
|
|
50
51
|
embed_dim=768,
|
|
@@ -79,6 +80,7 @@ mdbr_leaf_mt = ModelMeta(
|
|
|
79
80
|
"Transformers",
|
|
80
81
|
],
|
|
81
82
|
n_parameters=22_958_592,
|
|
83
|
+
n_embedding_parameters=11_720_448,
|
|
82
84
|
memory_usage_mb=86,
|
|
83
85
|
max_tokens=512,
|
|
84
86
|
embed_dim=1024,
|