PyPI - mteb - Versions diffs - 2.5.2__py3-none-any.whl → 2.7.2__py3-none-any.whl - Mend

mteb-2.5.2-py3-none-any.whl → mteb-2.7.2-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (241) hide show

mteb/__init__.py +2 -0
mteb/_create_dataloaders.py +17 -18
mteb/_evaluators/any_sts_evaluator.py +3 -3
mteb/_evaluators/clustering_evaluator.py +2 -2
mteb/_evaluators/evaluator.py +4 -2
mteb/_evaluators/image/imagetext_pairclassification_evaluator.py +10 -8
mteb/_evaluators/pair_classification_evaluator.py +5 -3
mteb/_evaluators/retrieval_evaluator.py +2 -2
mteb/_evaluators/retrieval_metrics.py +18 -17
mteb/_evaluators/sklearn_evaluator.py +11 -10
mteb/_evaluators/text/bitext_mining_evaluator.py +27 -18
mteb/_evaluators/text/summarization_evaluator.py +23 -18
mteb/_evaluators/zeroshot_classification_evaluator.py +5 -3
mteb/abstasks/_data_filter/filters.py +1 -1
mteb/abstasks/_data_filter/task_pipelines.py +3 -0
mteb/abstasks/_statistics_calculation.py +18 -10
mteb/abstasks/_stratification.py +18 -18
mteb/abstasks/abstask.py +35 -28
mteb/abstasks/aggregate_task_metadata.py +1 -9
mteb/abstasks/aggregated_task.py +10 -29
mteb/abstasks/classification.py +15 -10
mteb/abstasks/clustering.py +19 -15
mteb/abstasks/clustering_legacy.py +10 -10
mteb/abstasks/image/image_text_pair_classification.py +7 -4
mteb/abstasks/multilabel_classification.py +23 -19
mteb/abstasks/pair_classification.py +20 -11
mteb/abstasks/regression.py +4 -4
mteb/abstasks/retrieval.py +28 -24
mteb/abstasks/retrieval_dataset_loaders.py +2 -2
mteb/abstasks/sts.py +8 -5
mteb/abstasks/task_metadata.py +31 -33
mteb/abstasks/text/bitext_mining.py +39 -28
mteb/abstasks/text/reranking.py +8 -6
mteb/abstasks/text/summarization.py +10 -5
mteb/abstasks/zeroshot_classification.py +8 -4
mteb/benchmarks/benchmark.py +4 -2
mteb/benchmarks/benchmarks/__init__.py +4 -0
mteb/benchmarks/benchmarks/benchmarks.py +112 -11
mteb/benchmarks/get_benchmark.py +14 -55
mteb/cache.py +182 -29
mteb/cli/_display_tasks.py +2 -2
mteb/cli/build_cli.py +110 -14
mteb/cli/generate_model_card.py +43 -23
mteb/deprecated_evaluator.py +63 -49
mteb/descriptive_stats/Image/DocumentUnderstanding/KoVidore2CybersecurityRetrieval.json +32 -0
mteb/descriptive_stats/Image/DocumentUnderstanding/KoVidore2EconomicRetrieval.json +32 -0
mteb/descriptive_stats/Image/DocumentUnderstanding/KoVidore2EnergyRetrieval.json +32 -0
mteb/descriptive_stats/Image/DocumentUnderstanding/KoVidore2HrRetrieval.json +32 -0
mteb/descriptive_stats/Retrieval/ChemRxivRetrieval.json +30 -0
mteb/descriptive_stats/Retrieval/EuroPIRQRetrieval.json +116 -0
mteb/descriptive_stats/Retrieval/NanoClimateFEVER-VN.json +30 -0
mteb/descriptive_stats/Retrieval/NanoDBPedia-VN.json +30 -0
mteb/descriptive_stats/Retrieval/NanoFEVER-VN.json +30 -0
mteb/descriptive_stats/Retrieval/NanoHotpotQA-VN.json +30 -0
mteb/descriptive_stats/Retrieval/NanoMSMARCO-VN.json +30 -0
mteb/descriptive_stats/Retrieval/NanoNQ-VN.json +30 -0
mteb/descriptive_stats/Retrieval/TVPLRetrieval.json +30 -0
mteb/evaluate.py +44 -33
mteb/filter_tasks.py +25 -26
mteb/get_tasks.py +29 -30
mteb/languages/language_scripts.py +5 -3
mteb/leaderboard/app.py +162 -34
mteb/load_results.py +12 -12
mteb/models/abs_encoder.py +10 -6
mteb/models/cache_wrappers/cache_backend_protocol.py +3 -5
mteb/models/cache_wrappers/cache_backends/_hash_utils.py +5 -4
mteb/models/cache_wrappers/cache_backends/faiss_cache.py +6 -2
mteb/models/cache_wrappers/cache_backends/numpy_cache.py +43 -25
mteb/models/cache_wrappers/cache_wrapper.py +2 -2
mteb/models/get_model_meta.py +21 -3
mteb/models/instruct_wrapper.py +28 -8
mteb/models/model_implementations/align_models.py +1 -1
mteb/models/model_implementations/andersborges.py +4 -4
mteb/models/model_implementations/ara_models.py +1 -1
mteb/models/model_implementations/arctic_models.py +8 -8
mteb/models/model_implementations/b1ade_models.py +1 -1
mteb/models/model_implementations/bge_models.py +45 -21
mteb/models/model_implementations/bica_model.py +3 -3
mteb/models/model_implementations/blip2_models.py +2 -2
mteb/models/model_implementations/blip_models.py +16 -16
mteb/models/model_implementations/bm25.py +4 -4
mteb/models/model_implementations/bmretriever_models.py +6 -4
mteb/models/model_implementations/cadet_models.py +1 -1
mteb/models/model_implementations/cde_models.py +11 -4
mteb/models/model_implementations/clip_models.py +6 -6
mteb/models/model_implementations/clips_models.py +3 -3
mteb/models/model_implementations/codefuse_models.py +5 -5
mteb/models/model_implementations/codesage_models.py +3 -3
mteb/models/model_implementations/cohere_models.py +5 -5
mteb/models/model_implementations/cohere_v.py +2 -2
mteb/models/model_implementations/colpali_models.py +3 -3
mteb/models/model_implementations/colqwen_models.py +8 -8
mteb/models/model_implementations/colsmol_models.py +2 -2
mteb/models/model_implementations/conan_models.py +1 -1
mteb/models/model_implementations/dino_models.py +42 -42
mteb/models/model_implementations/e5_instruct.py +23 -4
mteb/models/model_implementations/e5_models.py +9 -9
mteb/models/model_implementations/e5_v.py +6 -6
mteb/models/model_implementations/eagerworks_models.py +1 -1
mteb/models/model_implementations/emillykkejensen_models.py +6 -6
mteb/models/model_implementations/en_code_retriever.py +1 -1
mteb/models/model_implementations/euler_models.py +2 -2
mteb/models/model_implementations/fa_models.py +9 -9
mteb/models/model_implementations/facebookai.py +14 -2
mteb/models/model_implementations/geogpt_models.py +1 -1
mteb/models/model_implementations/gme_v_models.py +6 -5
mteb/models/model_implementations/google_models.py +1 -1
mteb/models/model_implementations/granite_vision_embedding_models.py +1 -1
mteb/models/model_implementations/gritlm_models.py +2 -2
mteb/models/model_implementations/gte_models.py +25 -13
mteb/models/model_implementations/hinvec_models.py +1 -1
mteb/models/model_implementations/ibm_granite_models.py +30 -6
mteb/models/model_implementations/inf_models.py +2 -2
mteb/models/model_implementations/jasper_models.py +2 -2
mteb/models/model_implementations/jina_clip.py +48 -10
mteb/models/model_implementations/jina_models.py +18 -11
mteb/models/model_implementations/kblab.py +12 -6
mteb/models/model_implementations/kennethenevoldsen_models.py +4 -4
mteb/models/model_implementations/kfst.py +1 -1
mteb/models/model_implementations/kowshik24_models.py +1 -1
mteb/models/model_implementations/lgai_embedding_models.py +1 -1
mteb/models/model_implementations/linq_models.py +1 -1
mteb/models/model_implementations/listconranker.py +1 -1
mteb/models/model_implementations/llm2clip_models.py +6 -6
mteb/models/model_implementations/llm2vec_models.py +8 -8
mteb/models/model_implementations/mcinext_models.py +4 -1
mteb/models/model_implementations/mdbr_models.py +17 -3
mteb/models/model_implementations/misc_models.py +68 -68
mteb/models/model_implementations/mixedbread_ai_models.py +332 -0
mteb/models/model_implementations/mme5_models.py +1 -1
mteb/models/model_implementations/moco_models.py +4 -4
mteb/models/model_implementations/mod_models.py +1 -1
mteb/models/model_implementations/model2vec_models.py +14 -14
mteb/models/model_implementations/moka_models.py +1 -1
mteb/models/model_implementations/nbailab.py +3 -3
mteb/models/model_implementations/no_instruct_sentence_models.py +2 -2
mteb/models/model_implementations/nomic_models.py +30 -15
mteb/models/model_implementations/nomic_models_vision.py +1 -1
mteb/models/model_implementations/nvidia_llama_nemoretriever_colemb.py +15 -9
mteb/models/model_implementations/nvidia_models.py +151 -19
mteb/models/model_implementations/octen_models.py +61 -2
mteb/models/model_implementations/openclip_models.py +13 -13
mteb/models/model_implementations/opensearch_neural_sparse_models.py +5 -5
mteb/models/model_implementations/ops_moa_models.py +1 -1
mteb/models/model_implementations/ordalietech_solon_embeddings_mini_beta_1_1.py +1 -1
mteb/models/model_implementations/pawan_models.py +1 -1
mteb/models/model_implementations/piccolo_models.py +1 -1
mteb/models/model_implementations/pixie_models.py +56 -0
mteb/models/model_implementations/promptriever_models.py +4 -4
mteb/models/model_implementations/pylate_models.py +10 -9
mteb/models/model_implementations/qodo_models.py +2 -2
mteb/models/model_implementations/qtack_models.py +1 -1
mteb/models/model_implementations/qwen3_models.py +3 -3
mteb/models/model_implementations/qzhou_models.py +2 -2
mteb/models/model_implementations/random_baseline.py +3 -3
mteb/models/model_implementations/rasgaard_models.py +2 -2
mteb/models/model_implementations/reasonir_model.py +1 -1
mteb/models/model_implementations/repllama_models.py +3 -3
mteb/models/model_implementations/rerankers_custom.py +12 -6
mteb/models/model_implementations/rerankers_monot5_based.py +17 -17
mteb/models/model_implementations/richinfoai_models.py +1 -1
mteb/models/model_implementations/ru_sentence_models.py +20 -20
mteb/models/model_implementations/ruri_models.py +10 -10
mteb/models/model_implementations/salesforce_models.py +3 -3
mteb/models/model_implementations/samilpwc_models.py +1 -1
mteb/models/model_implementations/sarashina_embedding_models.py +2 -2
mteb/models/model_implementations/searchmap_models.py +1 -1
mteb/models/model_implementations/seed_1_6_embedding_models_1215.py +113 -146
mteb/models/model_implementations/sentence_transformers_models.py +124 -22
mteb/models/model_implementations/shuu_model.py +1 -1
mteb/models/model_implementations/siglip_models.py +20 -20
mteb/models/model_implementations/slm_models.py +416 -0
mteb/models/model_implementations/spartan8806_atles_champion.py +1 -1
mteb/models/model_implementations/stella_models.py +17 -4
mteb/models/model_implementations/tarka_models.py +2 -2
mteb/models/model_implementations/text2vec_models.py +9 -3
mteb/models/model_implementations/ua_sentence_models.py +1 -1
mteb/models/model_implementations/uae_models.py +7 -1
mteb/models/model_implementations/vdr_models.py +1 -1
mteb/models/model_implementations/vi_vn_models.py +6 -6
mteb/models/model_implementations/vlm2vec_models.py +3 -3
mteb/models/model_implementations/voyage_models.py +84 -0
mteb/models/model_implementations/voyage_v.py +9 -7
mteb/models/model_implementations/youtu_models.py +1 -1
mteb/models/model_implementations/yuan_models.py +1 -1
mteb/models/model_implementations/yuan_models_en.py +1 -1
mteb/models/model_meta.py +80 -31
mteb/models/models_protocols.py +22 -6
mteb/models/search_encoder_index/search_indexes/faiss_search_index.py +9 -6
mteb/models/search_wrappers.py +33 -18
mteb/models/sentence_transformer_wrapper.py +50 -25
mteb/models/vllm_wrapper.py +327 -0
mteb/py.typed +0 -0
mteb/results/benchmark_results.py +29 -21
mteb/results/model_result.py +52 -22
mteb/results/task_result.py +80 -58
mteb/similarity_functions.py +11 -7
mteb/tasks/classification/dan/dk_hate_classification.py +1 -1
mteb/tasks/classification/est/estonian_valence.py +1 -1
mteb/tasks/classification/kur/kurdish_sentiment_classification.py +2 -2
mteb/tasks/classification/multilingual/scala_classification.py +1 -1
mteb/tasks/clustering/eng/hume_wiki_cities_clustering.py +1 -1
mteb/tasks/clustering/eng/wiki_cities_clustering.py +1 -1
mteb/tasks/clustering/zho/cmteb_clustering.py +2 -2
mteb/tasks/image_text_pair_classification/eng/sugar_crepe.py +1 -1
mteb/tasks/reranking/multilingual/wikipedia_reranking_multilingual.py +1 -1
mteb/tasks/retrieval/code/code_rag.py +12 -12
mteb/tasks/retrieval/dan/dan_fever_retrieval.py +1 -1
mteb/tasks/retrieval/dan/tv2_nordretrieval.py +2 -2
mteb/tasks/retrieval/dan/twitter_hjerne_retrieval.py +2 -2
mteb/tasks/retrieval/eng/__init__.py +2 -0
mteb/tasks/retrieval/eng/chemrxiv.py +33 -0
mteb/tasks/retrieval/eng/cub200_i2i_retrieval.py +1 -1
mteb/tasks/retrieval/kor/__init__.py +15 -1
mteb/tasks/retrieval/kor/kovidore2_bench_retrieval.py +142 -0
mteb/tasks/retrieval/multilingual/__init__.py +2 -0
mteb/tasks/retrieval/multilingual/euro_pirq_retrieval.py +43 -0
mteb/tasks/retrieval/multilingual/vidore3_bench_retrieval.py +90 -100
mteb/tasks/retrieval/nob/norquad.py +2 -2
mteb/tasks/retrieval/nob/snl_retrieval.py +2 -2
mteb/tasks/retrieval/tur/tur_hist_quad.py +1 -1
mteb/tasks/retrieval/vie/__init__.py +14 -6
mteb/tasks/retrieval/vie/climate_fevervn_retrieval.py +39 -0
mteb/tasks/retrieval/vie/db_pedia_vn_retrieval.py +39 -0
mteb/tasks/retrieval/vie/fevervn_retrieval.py +39 -0
mteb/tasks/retrieval/vie/hotpot_qavn_retrieval.py +39 -0
mteb/tasks/retrieval/vie/msmarcovn_retrieval.py +48 -0
mteb/tasks/retrieval/vie/nqvn_retrieval.py +39 -0
mteb/tasks/retrieval/vie/tvpl_retrieval.py +42 -0
mteb/tasks/retrieval/vie/zac_legal_text_retrieval.py +15 -1
mteb/types/__init__.py +2 -0
mteb/types/_encoder_io.py +12 -0
mteb/types/_result.py +2 -1
mteb/types/statistics.py +9 -3
{mteb-2.5.2.dist-info → mteb-2.7.2.dist-info}/METADATA +15 -4
{mteb-2.5.2.dist-info → mteb-2.7.2.dist-info}/RECORD +240 -219
mteb/models/model_implementations/mxbai_models.py +0 -111
{mteb-2.5.2.dist-info → mteb-2.7.2.dist-info}/WHEEL +0 -0
{mteb-2.5.2.dist-info → mteb-2.7.2.dist-info}/entry_points.txt +0 -0
{mteb-2.5.2.dist-info → mteb-2.7.2.dist-info}/licenses/LICENSE +0 -0
{mteb-2.5.2.dist-info → mteb-2.7.2.dist-info}/top_level.txt +0 -0

mteb/models/model_implementations/codesage_models.py CHANGED Viewed

@@ -35,7 +35,7 @@ codesage_large = ModelMeta(
     open_weights=True,
     public_training_code=None,
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers"],
     reference="https://huggingface.co/codesage/codesage-large-v2",
     similarity_fn_name=ScoringFunction.COSINE,
     use_instructions=False,
@@ -62,7 +62,7 @@ codesage_base = ModelMeta(
     open_weights=True,
     public_training_code=None,
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers"],
     reference="https://huggingface.co/codesage/codesage-base-v2",
     similarity_fn_name=ScoringFunction.COSINE,
     use_instructions=False,
@@ -89,7 +89,7 @@ codesage_small = ModelMeta(
     open_weights=True,
     public_training_code=None,
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers"],
     reference="https://huggingface.co/codesage/codesage-small-v2",
     similarity_fn_name=ScoringFunction.COSINE,
     use_instructions=False,

mteb/models/model_implementations/cohere_models.py CHANGED Viewed

@@ -222,7 +222,7 @@ class CohereTextEmbeddingModel(AbsEncoder):
     ) -> None:
         requires_package(self, "cohere", model_name, "pip install 'mteb[cohere]'")
-        import cohere  # type: ignore
+        import cohere
         self.model_name = model_name.removeprefix("Cohere/Cohere-")
         self.sep = sep
@@ -392,7 +392,7 @@ cohere_mult_3 = ModelMeta(
     reference="https://cohere.com/blog/introducing-embed-v3",
     license=None,
     similarity_fn_name=ScoringFunction.COSINE,
-    framework=["API"],
+    framework=["API", "Transformers"],
     use_instructions=True,
     public_training_code=None,
     public_training_data=None,  # assumed
@@ -417,7 +417,7 @@ cohere_eng_3 = ModelMeta(
     embed_dim=1024,
     license=None,
     similarity_fn_name=ScoringFunction.COSINE,
-    framework=["API"],
+    framework=["API", "Transformers"],
     use_instructions=True,
     public_training_code=None,
     public_training_data=None,  # assumed
@@ -442,7 +442,7 @@ cohere_mult_light_3 = ModelMeta(
     embed_dim=384,
     license=None,
     similarity_fn_name=ScoringFunction.COSINE,
-    framework=["API"],
+    framework=["API", "Transformers"],
     use_instructions=True,
     public_training_code=None,
     public_training_data=None,  # assumed
@@ -467,7 +467,7 @@ cohere_eng_light_3 = ModelMeta(
     embed_dim=384,
     license=None,
     similarity_fn_name=ScoringFunction.COSINE,
-    framework=["API"],
+    framework=["API", "Transformers"],
     use_instructions=True,
     public_training_code=None,
     public_training_data=None,  # assumed

mteb/models/model_implementations/cohere_v.py CHANGED Viewed

@@ -378,7 +378,7 @@ def cohere_v_loader(model_name, **kwargs):
 cohere_mult_3 = ModelMeta(
-    loader=cohere_v_loader,  # type: ignore
+    loader=cohere_v_loader,
     loader_kwargs={"model_name": "embed-multilingual-v3.0"},
     name="cohere/embed-multilingual-v3.0",
     model_type=["dense"],
@@ -402,7 +402,7 @@ cohere_mult_3 = ModelMeta(
 )
 cohere_eng_3 = ModelMeta(
-    loader=cohere_v_loader,  # type: ignore
+    loader=cohere_v_loader,
     loader_kwargs={"model_name": "embed-english-v3.0"},
     name="cohere/embed-english-v3.0",
     model_type=["dense"],

mteb/models/model_implementations/colpali_models.py CHANGED Viewed

@@ -226,7 +226,7 @@ colpali_v1_1 = ModelMeta(
     open_weights=True,
     public_training_code="https://github.com/illuin-tech/colpali",
     public_training_data="https://huggingface.co/datasets/vidore/colpali_train_set",
-    framework=["ColPali"],
+    framework=["ColPali", "safetensors"],
     reference="https://huggingface.co/vidore/colpali-v1.1",
     similarity_fn_name=ScoringFunction.MAX_SIM,
     use_instructions=True,
@@ -253,7 +253,7 @@ colpali_v1_2 = ModelMeta(
     open_weights=True,
     public_training_code="https://github.com/illuin-tech/colpali",
     public_training_data="https://huggingface.co/datasets/vidore/colpali_train_set",
-    framework=["ColPali"],
+    framework=["ColPali", "safetensors"],
     reference="https://huggingface.co/vidore/colpali-v1.2",
     similarity_fn_name=ScoringFunction.MAX_SIM,
     use_instructions=True,
@@ -280,7 +280,7 @@ colpali_v1_3 = ModelMeta(
     open_weights=True,
     public_training_code="https://github.com/illuin-tech/colpali",
     public_training_data="https://huggingface.co/datasets/vidore/colpali_train_set",
-    framework=["ColPali"],
+    framework=["ColPali", "safetensors"],
     reference="https://huggingface.co/vidore/colpali-v1.3",
     similarity_fn_name=ScoringFunction.MAX_SIM,
     use_instructions=True,

mteb/models/model_implementations/colqwen_models.py CHANGED Viewed

@@ -226,7 +226,7 @@ colqwen2 = ModelMeta(
     open_weights=True,
     public_training_code="https://github.com/illuin-tech/colpali",
     public_training_data="https://huggingface.co/datasets/vidore/colpali_train_set",
-    framework=["ColPali"],
+    framework=["ColPali", "safetensors"],
     reference="https://huggingface.co/vidore/colqwen2-v1.0",
     similarity_fn_name="MaxSim",
     use_instructions=True,
@@ -253,7 +253,7 @@ colqwen2_5 = ModelMeta(
     open_weights=True,
     public_training_code="https://github.com/illuin-tech/colpali",
     public_training_data="https://huggingface.co/datasets/vidore/colpali_train_set",
-    framework=["ColPali"],
+    framework=["ColPali", "safetensors"],
     reference="https://huggingface.co/vidore/colqwen2.5-v0.2",
     similarity_fn_name="MaxSim",
     use_instructions=True,
@@ -297,7 +297,7 @@ colqwen3_8b = ModelMeta(
     open_weights=True,
     public_training_code="https://github.com/illuin-tech/colpali",
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers", "safetensors"],
     reference="https://huggingface.co/TomoroAI/tomoro-colqwen3-embed-8b",
     similarity_fn_name=ScoringFunction.MAX_SIM,
     use_instructions=True,
@@ -321,7 +321,7 @@ colqwen3_4b = ModelMeta(
     open_weights=True,
     public_training_code="https://github.com/illuin-tech/colpali",
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers", "safetensors"],
     reference="https://huggingface.co/TomoroAI/tomoro-colqwen3-embed-4b",
     similarity_fn_name=ScoringFunction.MAX_SIM,
     use_instructions=True,
@@ -348,7 +348,7 @@ colnomic_7b = ModelMeta(
     open_weights=True,
     public_training_code="https://github.com/nomic-ai/colpali",
     public_training_data="https://huggingface.co/datasets/vidore/colpali_train_set",
-    framework=["ColPali"],
+    framework=["ColPali", "safetensors"],
     reference="https://huggingface.co/nomic-ai/colnomic-embed-multimodal-7b",
     similarity_fn_name="MaxSim",
     use_instructions=True,
@@ -393,7 +393,7 @@ colnomic_3b = ModelMeta(
     open_weights=True,
     public_training_code="https://github.com/nomic-ai/colpali",
     public_training_data="https://huggingface.co/datasets/vidore/colpali_train_set",
-    framework=["ColPali"],
+    framework=["ColPali", "safetensors"],
     reference="https://huggingface.co/nomic-ai/colnomic-embed-multimodal-3b",
     similarity_fn_name="MaxSim",
     use_instructions=True,
@@ -458,7 +458,7 @@ evoqwen25_vl_retriever_3b_v1 = ModelMeta(
     open_weights=True,
     public_training_code="https://github.com/illuin-tech/colpali",
     public_training_data="https://huggingface.co/datasets/vidore/colpali_train_set",
-    framework=["ColPali"],
+    framework=["ColPali", "safetensors"],
     reference="https://huggingface.co/ApsaraStackMaaS/EvoQwen2.5-VL-Retriever-3B-v1",
     similarity_fn_name="MaxSim",
     use_instructions=True,
@@ -484,7 +484,7 @@ evoqwen25_vl_retriever_7b_v1 = ModelMeta(
     open_weights=True,
     public_training_code="https://github.com/illuin-tech/colpali",
     public_training_data="https://huggingface.co/datasets/vidore/colpali_train_set",
-    framework=["ColPali"],
+    framework=["ColPali", "safetensors"],
     reference="https://huggingface.co/ApsaraStackMaaS/EvoQwen2.5-VL-Retriever-7B-v1",
     similarity_fn_name="MaxSim",
     use_instructions=True,

mteb/models/model_implementations/colsmol_models.py CHANGED Viewed

@@ -67,7 +67,7 @@ colsmol_256m = ModelMeta(
     open_weights=True,
     public_training_code="https://github.com/illuin-tech/colpali",
     public_training_data="https://huggingface.co/datasets/vidore/colpali_train_set",
-    framework=["ColPali"],
+    framework=["ColPali", "safetensors"],
     reference="https://huggingface.co/vidore/colSmol-256M",
     similarity_fn_name="MaxSim",
     use_instructions=True,
@@ -94,7 +94,7 @@ colsmol_500m = ModelMeta(
     open_weights=True,
     public_training_code="https://github.com/illuin-tech/colpali",
     public_training_data="https://huggingface.co/datasets/vidore/colpali_train_set",
-    framework=["ColPali"],
+    framework=["ColPali", "safetensors"],
     reference="https://huggingface.co/vidore/colSmol-500M",
     similarity_fn_name="MaxSim",
     use_instructions=True,

mteb/models/model_implementations/conan_models.py CHANGED Viewed

@@ -209,7 +209,7 @@ Conan_embedding_v2 = ModelMeta(
     license="apache-2.0",
     reference="https://huggingface.co/TencentBAC/Conan-embedding-v2",
     similarity_fn_name="cosine",
-    framework=["API"],
+    framework=["API", "Sentence Transformers", "Transformers"],
     use_instructions=True,
     training_datasets=E5_MISTRAL_TRAINING_DATA | bge_full_data | conan_zh_datasets,
     public_training_code=None,

mteb/models/model_implementations/dino_models.py CHANGED Viewed

@@ -104,7 +104,7 @@ dinov2_training_datasets = set(
 dinov2_small = ModelMeta(
-    loader=DINOModel,  # type: ignore
+    loader=DINOModel,
     name="facebook/dinov2-small",
     model_type=["dense"],
     languages=["eng-Latn"],
@@ -119,13 +119,13 @@ dinov2_small = ModelMeta(
     open_weights=True,
     public_training_code="https://github.com/facebookresearch/dinov2",
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers", "safetensors"],
     reference="https://huggingface.co/facebook/dinov2-small",
     similarity_fn_name=ScoringFunction.COSINE,
     use_instructions=False,
     training_datasets=dinov2_training_datasets,
     citation="""@misc{oquab2023dinov2,
-      title={DINOv2: Learning Robust Visual Features without Supervision},
+      title={DINOv2: Learning Robust Visual Features without Supervision},
       author={Maxime Oquab and Timothée Darcet and Théo Moutakanni and Huy Vo and Marc Szafraniec and Vasil Khalidov and Pierre Fernandez and Daniel Haziza and Francisco Massa and Alaaeldin El-Nouby and Mahmoud Assran and Nicolas Ballas and Wojciech Galuba and Russell Howes and Po-Yao Huang and Shang-Wen Li and Ishan Misra and Michael Rabbat and Vasu Sharma and Gabriel Synnaeve and Hu Xu and Hervé Jegou and Julien Mairal and Patrick Labatut and Armand Joulin and Piotr Bojanowski},
       year={2023},
       eprint={2304.07193},
@@ -135,7 +135,7 @@ dinov2_small = ModelMeta(
 )
 dinov2_base = ModelMeta(
-    loader=DINOModel,  # type: ignore
+    loader=DINOModel,
     name="facebook/dinov2-base",
     model_type=["dense"],
     languages=["eng-Latn"],
@@ -150,13 +150,13 @@ dinov2_base = ModelMeta(
     open_weights=True,
     public_training_code="https://github.com/facebookresearch/dinov2",
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers", "safetensors"],
     reference="https://huggingface.co/facebook/dinov2-base",
     similarity_fn_name=ScoringFunction.COSINE,
     use_instructions=False,
     training_datasets=dinov2_training_datasets,
     citation="""@misc{oquab2023dinov2,
-      title={DINOv2: Learning Robust Visual Features without Supervision},
+      title={DINOv2: Learning Robust Visual Features without Supervision},
       author={Maxime Oquab and Timothée Darcet and Théo Moutakanni and Huy Vo and Marc Szafraniec and Vasil Khalidov and Pierre Fernandez and Daniel Haziza and Francisco Massa and Alaaeldin El-Nouby and Mahmoud Assran and Nicolas Ballas and Wojciech Galuba and Russell Howes and Po-Yao Huang and Shang-Wen Li and Ishan Misra and Michael Rabbat and Vasu Sharma and Gabriel Synnaeve and Hu Xu and Hervé Jegou and Julien Mairal and Patrick Labatut and Armand Joulin and Piotr Bojanowski},
       year={2023},
       eprint={2304.07193},
@@ -166,7 +166,7 @@ dinov2_base = ModelMeta(
 )
 dinov2_large = ModelMeta(
-    loader=DINOModel,  # type: ignore
+    loader=DINOModel,
     name="facebook/dinov2-large",
     model_type=["dense"],
     languages=["eng-Latn"],
@@ -181,13 +181,13 @@ dinov2_large = ModelMeta(
     open_weights=True,
     public_training_code="https://github.com/facebookresearch/dinov2",
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers", "safetensors"],
     reference="https://huggingface.co/facebook/dinov2-large",
     similarity_fn_name=ScoringFunction.COSINE,
     use_instructions=False,
     training_datasets=dinov2_training_datasets,
     citation="""@misc{oquab2023dinov2,
-      title={DINOv2: Learning Robust Visual Features without Supervision},
+      title={DINOv2: Learning Robust Visual Features without Supervision},
       author={Maxime Oquab and Timothée Darcet and Théo Moutakanni and Huy Vo and Marc Szafraniec and Vasil Khalidov and Pierre Fernandez and Daniel Haziza and Francisco Massa and Alaaeldin El-Nouby and Mahmoud Assran and Nicolas Ballas and Wojciech Galuba and Russell Howes and Po-Yao Huang and Shang-Wen Li and Ishan Misra and Michael Rabbat and Vasu Sharma and Gabriel Synnaeve and Hu Xu and Hervé Jegou and Julien Mairal and Patrick Labatut and Armand Joulin and Piotr Bojanowski},
       year={2023},
       eprint={2304.07193},
@@ -197,7 +197,7 @@ dinov2_large = ModelMeta(
 )
 dinov2_giant = ModelMeta(
-    loader=DINOModel,  # type: ignore
+    loader=DINOModel,
     name="facebook/dinov2-giant",
     model_type=["dense"],
     languages=["eng-Latn"],
@@ -212,13 +212,13 @@ dinov2_giant = ModelMeta(
     open_weights=True,
     public_training_code="https://github.com/facebookresearch/dinov2",
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers", "safetensors"],
     reference="https://huggingface.co/facebook/dinov2-giant",
     similarity_fn_name=ScoringFunction.COSINE,
     use_instructions=False,
     training_datasets=dinov2_training_datasets,
     citation="""@misc{oquab2023dinov2,
-      title={DINOv2: Learning Robust Visual Features without Supervision},
+      title={DINOv2: Learning Robust Visual Features without Supervision},
       author={Maxime Oquab and Timothée Darcet and Théo Moutakanni and Huy Vo and Marc Szafraniec and Vasil Khalidov and Pierre Fernandez and Daniel Haziza and Francisco Massa and Alaaeldin El-Nouby and Mahmoud Assran and Nicolas Ballas and Wojciech Galuba and Russell Howes and Po-Yao Huang and Shang-Wen Li and Ishan Misra and Michael Rabbat and Vasu Sharma and Gabriel Synnaeve and Hu Xu and Hervé Jegou and Julien Mairal and Patrick Labatut and Armand Joulin and Piotr Bojanowski},
       year={2023},
       eprint={2304.07193},
@@ -247,13 +247,13 @@ webssl_dino300m_full2b = ModelMeta(
     open_weights=True,
     public_training_code="",
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers", "safetensors"],
     reference="https://huggingface.co/facebook/webssl-dino300m-full2b-224",
     similarity_fn_name=None,
     use_instructions=False,
     training_datasets=webssl_dino_training_datasets,
     citation="""@article{fan2025scaling,
-  title={Scaling Language-Free Visual Representation Learning},
+  title={Scaling Language-Free Visual Representation Learning},
   author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
   year={2025},
   eprint={2504.01017},
@@ -278,13 +278,13 @@ webssl_dino1b_full2b = ModelMeta(
     open_weights=True,
     public_training_code="",
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers", "safetensors"],
     reference="https://huggingface.co/facebook/webssl-dino1b-full2b-224",
     similarity_fn_name=None,
     use_instructions=False,
     training_datasets=webssl_dino_training_datasets,
     citation="""@article{fan2025scaling,
-  title={Scaling Language-Free Visual Representation Learning},
+  title={Scaling Language-Free Visual Representation Learning},
   author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
   year={2025},
   eprint={2504.01017},
@@ -309,13 +309,13 @@ webssl_dino2b_full2b = ModelMeta(
     open_weights=True,
     public_training_code="",
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers", "safetensors"],
     reference="https://huggingface.co/facebook/webssl-dino2b-full2b-224",
     similarity_fn_name=None,
     use_instructions=False,
     training_datasets=webssl_dino_training_datasets,
     citation="""@article{fan2025scaling,
-  title={Scaling Language-Free Visual Representation Learning},
+  title={Scaling Language-Free Visual Representation Learning},
   author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
   year={2025},
   eprint={2504.01017},
@@ -340,13 +340,13 @@ webssl_dino3b_full2b = ModelMeta(
     open_weights=True,
     public_training_code="",
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers", "safetensors"],
     reference="https://huggingface.co/facebook/webssl-dino3b-full2b-224",
     similarity_fn_name=None,
     use_instructions=False,
     training_datasets=webssl_dino_training_datasets,
     citation="""@article{fan2025scaling,
-  title={Scaling Language-Free Visual Representation Learning},
+  title={Scaling Language-Free Visual Representation Learning},
   author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
   year={2025},
   eprint={2504.01017},
@@ -371,13 +371,13 @@ webssl_dino5b_full2b = ModelMeta(
     open_weights=True,
     public_training_code="",
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers", "safetensors"],
     reference="https://huggingface.co/facebook/webssl-dino5b-full2b-224",
     similarity_fn_name=None,
     use_instructions=False,
     training_datasets=webssl_dino_training_datasets,
     citation="""@article{fan2025scaling,
-  title={Scaling Language-Free Visual Representation Learning},
+  title={Scaling Language-Free Visual Representation Learning},
   author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
   year={2025},
   eprint={2504.01017},
@@ -402,13 +402,13 @@ webssl_dino7b_full8b_224 = ModelMeta(
     open_weights=True,
     public_training_code="",
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers", "safetensors"],
     reference="https://huggingface.co/facebook/webssl-dino7b-full8b-224",
     similarity_fn_name=None,
     use_instructions=False,
     training_datasets=webssl_dino_training_datasets,
     citation="""@article{fan2025scaling,
-  title={Scaling Language-Free Visual Representation Learning},
+  title={Scaling Language-Free Visual Representation Learning},
   author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
   year={2025},
   eprint={2504.01017},
@@ -433,13 +433,13 @@ webssl_dino7b_full8b_378 = ModelMeta(
     open_weights=True,
     public_training_code="",
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers", "safetensors"],
     reference="https://huggingface.co/facebook/webssl-dino7b-full8b-378",
     similarity_fn_name=None,
     use_instructions=False,
     training_datasets=webssl_dino_training_datasets,
     citation="""@article{fan2025scaling,
-  title={Scaling Language-Free Visual Representation Learning},
+  title={Scaling Language-Free Visual Representation Learning},
   author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
   year={2025},
   eprint={2504.01017},
@@ -464,13 +464,13 @@ webssl_dino7b_full8b_518 = ModelMeta(
     open_weights=True,
     public_training_code="",
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers", "safetensors"],
     reference="https://huggingface.co/facebook/webssl-dino7b-full8b-518",
     similarity_fn_name=None,
     use_instructions=False,
     training_datasets=webssl_dino_training_datasets,
     citation="""@article{fan2025scaling,
-  title={Scaling Language-Free Visual Representation Learning},
+  title={Scaling Language-Free Visual Representation Learning},
   author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
   year={2025},
   eprint={2504.01017},
@@ -496,13 +496,13 @@ webssl_dino2b_light2b = ModelMeta(
     open_weights=True,
     public_training_code="",
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers", "safetensors"],
     reference="https://huggingface.co/facebook/webssl-dino2b-light2b-224",
     similarity_fn_name=None,
     use_instructions=False,
     training_datasets=webssl_dino_training_datasets,
     citation="""@article{fan2025scaling,
-  title={Scaling Language-Free Visual Representation Learning},
+  title={Scaling Language-Free Visual Representation Learning},
   author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
   year={2025},
   eprint={2504.01017},
@@ -527,13 +527,13 @@ webssl_dino2b_heavy2b = ModelMeta(
     open_weights=True,
     public_training_code="",
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers", "safetensors"],
     reference="https://huggingface.co/facebook/webssl-dino2b-heavy2b-224",
     similarity_fn_name=None,
     use_instructions=False,
     training_datasets=webssl_dino_training_datasets,
     citation="""@article{fan2025scaling,
-  title={Scaling Language-Free Visual Representation Learning},
+  title={Scaling Language-Free Visual Representation Learning},
   author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
   year={2025},
   eprint={2504.01017},
@@ -558,13 +558,13 @@ webssl_dino3b_light2b = ModelMeta(
     open_weights=True,
     public_training_code="",
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers", "safetensors"],
     reference="https://huggingface.co/facebook/webssl-dino3b-light2b-224",
     similarity_fn_name=None,
     use_instructions=False,
     training_datasets=webssl_dino_training_datasets,
     citation="""@article{fan2025scaling,
-  title={Scaling Language-Free Visual Representation Learning},
+  title={Scaling Language-Free Visual Representation Learning},
   author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
   year={2025},
   eprint={2504.01017},
@@ -589,13 +589,13 @@ webssl_dino3b_heavy2b = ModelMeta(
     open_weights=True,
     public_training_code="",
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers", "safetensors"],
     reference="https://huggingface.co/facebook/webssl-dino3b-heavy2b-224",
     similarity_fn_name=None,
     use_instructions=False,
     training_datasets=webssl_dino_training_datasets,
     citation="""@article{fan2025scaling,
-  title={Scaling Language-Free Visual Representation Learning},
+  title={Scaling Language-Free Visual Representation Learning},
   author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
   year={2025},
   eprint={2504.01017},
@@ -620,13 +620,13 @@ webssl_mae300m_full2b = ModelMeta(
     open_weights=True,
     public_training_code="",
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers", "safetensors"],
     reference="https://huggingface.co/facebook/webssl-mae300m-full2b-224",
     similarity_fn_name=None,
     use_instructions=False,
     training_datasets=webssl_dino_training_datasets,
     citation="""@article{fan2025scaling,
-  title={Scaling Language-Free Visual Representation Learning},
+  title={Scaling Language-Free Visual Representation Learning},
   author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
   year={2025},
   eprint={2504.01017},
@@ -651,13 +651,13 @@ webssl_mae700m_full2b = ModelMeta(
     open_weights=True,
     public_training_code="",
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers", "safetensors"],
     reference="https://huggingface.co/facebook/webssl-mae700m-full2b-224",
     similarity_fn_name=None,
     use_instructions=False,
     training_datasets=webssl_dino_training_datasets,
     citation="""@article{fan2025scaling,
-  title={Scaling Language-Free Visual Representation Learning},
+  title={Scaling Language-Free Visual Representation Learning},
   author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
   year={2025},
   eprint={2504.01017},
@@ -682,13 +682,13 @@ webssl_mae1b_full2b = ModelMeta(
     open_weights=True,
     public_training_code="",
     public_training_data=None,
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers", "safetensors"],
     reference="https://huggingface.co/facebook/webssl-mae1b-full2b-224",
     similarity_fn_name=None,
     use_instructions=False,
     training_datasets=webssl_dino_training_datasets,
     citation="""@article{fan2025scaling,
-  title={Scaling Language-Free Visual Representation Learning},
+  title={Scaling Language-Free Visual Representation Learning},
   author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
   year={2025},
   eprint={2504.01017},

mteb/models/model_implementations/e5_instruct.py CHANGED Viewed

@@ -45,7 +45,14 @@ e5_instruct = ModelMeta(
     open_weights=True,
     revision="baa7be480a7de1539afce709c8f13f833a510e0a",
     release_date=E5_PAPER_RELEASE_DATE,
-    framework=["GritLM", "PyTorch", "Sentence Transformers"],
+    framework=[
+        "GritLM",
+        "PyTorch",
+        "Sentence Transformers",
+        "ONNX",
+        "safetensors",
+        "Transformers",
+    ],
     similarity_fn_name=ScoringFunction.COSINE,
     use_instructions=True,
     reference="https://huggingface.co/intfloat/multilingual-e5-large-instruct",
@@ -84,7 +91,13 @@ e5_mistral = ModelMeta(
     open_weights=True,
     revision="07163b72af1488142a360786df853f237b1a3ca1",
     release_date=E5_PAPER_RELEASE_DATE,
-    framework=["GritLM", "PyTorch", "Sentence Transformers"],
+    framework=[
+        "GritLM",
+        "PyTorch",
+        "Sentence Transformers",
+        "safetensors",
+        "Transformers",
+    ],
     similarity_fn_name=ScoringFunction.COSINE,
     use_instructions=True,
     reference="https://huggingface.co/intfloat/e5-mistral-7b-instruct",
@@ -139,7 +152,13 @@ zeta_alpha_ai__zeta_alpha_e5_mistral = ModelMeta(
     open_weights=True,
     public_training_data=None,
     public_training_code=None,
-    framework=["PyTorch", "Sentence Transformers", "GritLM"],
+    framework=[
+        "PyTorch",
+        "Sentence Transformers",
+        "GritLM",
+        "safetensors",
+        "Transformers",
+    ],
     reference="https://huggingface.co/zeta-alpha-ai/Zeta-Alpha-E5-Mistral",
     similarity_fn_name=ScoringFunction.COSINE,
     use_instructions=True,
@@ -216,7 +235,7 @@ BeastyZ__e5_R_mistral_7b = ModelMeta(
     open_weights=True,
     public_training_code="https://github.com/LeeSureman/E5-Retrieval-Reproduction",
     public_training_data="https://huggingface.co/datasets/BeastyZ/E5-R",
-    framework=["PyTorch"],
+    framework=["PyTorch", "Transformers", "safetensors"],
     reference="https://huggingface.co/BeastyZ/e5-R-mistral-7b",
     similarity_fn_name="cosine",
     use_instructions=True,

mteb 2.5.2__py3-none-any.whl → 2.7.2__py3-none-any.whl

mteb 2.5.2__py3-none-any.whl → 2.7.2__py3-none-any.whl