PyPI - mteb - Versions diffs - 1.39.5__py3-none-any.whl → 1.39.7__py3-none-any.whl - Mend

mteb 1.39.5__py3-none-any.whl → 1.39.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (15) hide show

mteb/benchmarks/_create_table.py CHANGED Viewed

@@ -500,3 +500,132 @@ def _create_summary_table_mean_subset(
     joint_table.insert(0, "Rank (Borda)", joint_table.pop("borda_rank"))
     return joint_table
+def _create_summary_table_mean_task_type(
+    benchmark_results: BenchmarkResults,
+) -> pd.DataFrame:
+    """Create summary table from BenchmarkResults.
+    Returns a DataFrame with one row per model containing summary statistics
+    and task type averages.
+    Args:
+        benchmark_results: BenchmarkResults object containing model results
+    Returns:
+        DataFrame with model summaries, ready for styling in the leaderboard
+    """
+    data = benchmark_results.to_dataframe(format="long")
+    if data.empty:
+        no_results_frame = pd.DataFrame(
+            {"No results": ["You can try relaxing your criteria"]}
+        )
+        return no_results_frame
+    # Convert to DataFrame and pivot
+    per_task = data.pivot(index="model_name", columns="task_name", values="score")
+    # Remove models with no scores
+    to_remove = per_task.isna().all(axis="columns")
+    if to_remove.all():
+        no_results_frame = pd.DataFrame(
+            {"No results": ["You can try relaxing your criteria"]}
+        )
+        return no_results_frame
+    models_to_remove = list(per_task[to_remove].index)
+    per_task = per_task.drop(models_to_remove, axis=0)
+    # Calculate means by task type
+    mean_per_type = _get_means_per_types(per_task)
+    mean_per_type = mean_per_type.pivot(
+        index="model_name", columns="task_type", values="score"
+    )
+    mean_per_type.columns = [
+        _split_on_capital(column) for column in mean_per_type.columns
+    ]
+    # Calculate overall means
+    typed_mean = mean_per_type.mean(skipna=False, axis=1)
+    # Build joint table
+    joint_table = mean_per_type.copy()
+    joint_table = joint_table.drop(models_to_remove, axis=0)
+    joint_table.insert(0, "mean_by_task_type", typed_mean)
+    joint_table = joint_table.sort_values("mean_by_task_type", ascending=False)
+    joint_table["borda_rank"] = _get_borda_rank(per_task)
+    joint_table["rank"] = [i + 1 for i in range(len(joint_table))]
+    joint_table = joint_table.reset_index()
+    # Add model metadata
+    model_metas = joint_table["model_name"].map(_failsafe_get_model_meta)
+    joint_table = joint_table[model_metas.notna()]
+    joint_table["model_link"] = model_metas.map(lambda m: m.reference)
+    # Insert model metadata columns
+    joint_table.insert(
+        1,
+        "Max Tokens",
+        model_metas.map(lambda m: _format_max_tokens(m.max_tokens)),
+    )
+    joint_table.insert(
+        1,
+        "Embedding Dimensions",
+        model_metas.map(lambda m: str(int(m.embed_dim)) if m.embed_dim else "Unknown"),
+    )
+    joint_table.insert(
+        1,
+        "Number of Parameters",
+        model_metas.map(lambda m: _format_n_parameters(m.n_parameters)),
+    )
+    joint_table.insert(
+        1,
+        "Memory Usage (MB)",
+        model_metas.map(
+            lambda m: str(int(m.memory_usage_mb)) if m.memory_usage_mb else "Unknown"
+        ),
+    )
+    # Add zero-shot percentage
+    tasks = get_tasks(tasks=list(data["task_name"].unique()))
+    joint_table.insert(
+        1, "Zero-shot", model_metas.map(lambda m: m.zero_shot_percentage(tasks))
+    )
+    joint_table["Zero-shot"] = joint_table["Zero-shot"].fillna(-1)
+    # Clean up model names (remove HF organization)
+    joint_table["model_name"] = joint_table["model_name"].map(
+        lambda name: name.split("/")[-1]
+    )
+    # Add markdown links to model names
+    name_w_link = (
+        "[" + joint_table["model_name"] + "](" + joint_table["model_link"] + ")"
+    )
+    joint_table["model_name"] = joint_table["model_name"].mask(
+        joint_table["model_link"].notna(), name_w_link
+    )
+    joint_table = joint_table.drop(columns=["model_link"])
+    # Rename columns
+    joint_table = joint_table.rename(
+        columns={
+            "model_name": "Model",
+            "mean_by_task_type": "Mean (TaskType)",
+            "borda_rank": "Rank (Borda)",
+        }
+    )
+    if "Any Any Multilingual Retrieval" in joint_table.columns:
+        joint_table = joint_table.rename(
+            columns={"Any Any Multilingual Retrieval": "Multilingual Retrieval"}
+        )
+    if "Any Any Retrieval" in joint_table.columns:
+        joint_table = joint_table.rename(columns={"Any Any Retrieval": "Retrieval"})
+    # Move borda rank to front
+    joint_table.insert(0, "Rank", joint_table.pop("rank"))
+    return joint_table

mteb/benchmarks/benchmark.py CHANGED Viewed

@@ -12,6 +12,7 @@ from mteb.benchmarks._create_table import (
     _create_summary_table_from_benchmark_results,
     _create_summary_table_mean_public_private,
     _create_summary_table_mean_subset,
+    _create_summary_table_mean_task_type,
 )
 from mteb.load_results.load_results import load_results
@@ -107,3 +108,11 @@ class HUMEBenchmark(Benchmark):
     ) -> pd.DataFrame:
         """Create summary table. Called by the leaderboard app."""
         return _create_summary_table_mean_subset(benchmark_results)
+class MIEBBenchmark(Benchmark):
+    def _create_summary_table(
+        self, benchmark_results: BenchmarkResults
+    ) -> pd.DataFrame:
+        """Create summary table. Called by the leaderboard app."""
+        return _create_summary_table_mean_task_type(benchmark_results)

mteb/benchmarks/benchmarks/benchmarks.py CHANGED Viewed

@@ -4,7 +4,7 @@ from typing import TYPE_CHECKING, Annotated
 from pydantic import AnyUrl, BeforeValidator, TypeAdapter
-from mteb.benchmarks.benchmark import Benchmark, HUMEBenchmark
+from mteb.benchmarks.benchmark import Benchmark, HUMEBenchmark, MIEBBenchmark
 from mteb.overview import MTEBTasks, get_task, get_tasks
 if TYPE_CHECKING:
@@ -1754,7 +1754,7 @@ MIEB_common_tasks = [
     "WebQAT2TRetrieval",
 ]
-MIEB_ENG = Benchmark(
+MIEB_ENG = MIEBBenchmark(
     name="MIEB(eng)",
     display_name="Image-Text, English",
     icon="https://github.com/DennisSuitters/LibreICONS/raw/2d2172d15e3c6ca03c018629d60050e4b99e5c55/svg-color/libre-gui-picture.svg",
@@ -1783,7 +1783,7 @@ MIEB_ENG = Benchmark(
 """,
 )
-MIEB_MULTILINGUAL = Benchmark(
+MIEB_MULTILINGUAL = MIEBBenchmark(
     name="MIEB(Multilingual)",
     display_name="Image-Text, Multilingual",
     icon="https://github.com/DennisSuitters/LibreICONS/raw/2d2172d15e3c6ca03c018629d60050e4b99e5c55/svg-color/libre-gui-pictures.svg",
@@ -1818,7 +1818,7 @@ MIEB_MULTILINGUAL = Benchmark(
 """,
 )
-MIEB_LITE = Benchmark(
+MIEB_LITE = MIEBBenchmark(
     name="MIEB(lite)",
     display_name="Image-Text, Lite",
     icon="https://github.com/DennisSuitters/LibreICONS/raw/2d2172d15e3c6ca03c018629d60050e4b99e5c55/svg-color/libre-map-landscape.svg",
@@ -1902,7 +1902,7 @@ MIEB_LITE = Benchmark(
 """,
 )
-MIEB_IMG = Benchmark(
+MIEB_IMG = MIEBBenchmark(
     name="MIEB(Img)",
     display_name="Image only",
     icon="https://github.com/DennisSuitters/LibreICONS/raw/2d2172d15e3c6ca03c018629d60050e4b99e5c55/svg-color/libre-gui-pictures.svg",

mteb/evaluation/evaluators/RegressionEvaluator.py CHANGED Viewed

@@ -53,19 +53,13 @@ class LinearRegressionEvaluator(Evaluator):
         scores = {}
         X_train = model.encode(
             self.sentences_train,
-            model=model,
             task_name=self.task_name,
-            hf_split="train",
-            hf_subset=self.hf_subset,
             **encode_kwargs,
         )
         if test_cache is None:
             X_test = model.encode(
                 self.sentences_test,
-                model=model,
                 task_name=self.task_name,
-                hf_split=self.hf_split,
-                hf_subset=self.hf_subset,
                 **encode_kwargs,
             )
             test_cache = X_test

mteb/leaderboard/table.py CHANGED Viewed

@@ -116,6 +116,7 @@ def _apply_summary_table_styling(joint_table: pd.DataFrame) -> gr.DataFrame:
     """Apply styling to a raw summary DataFrame"""
     excluded_columns = [
         "Rank (Borda)",
+        "Rank",
         "Model",
         "Number of Parameters",
         "Embedding Dimensions",

mteb/tasks/Classification/__init__.py CHANGED Viewed

@@ -150,11 +150,11 @@ from .sin.SinhalaNewsClassification import *
 from .sin.SinhalaNewsSourceClassification import *
 from .slk.CSFDSKMovieReviewSentimentClassification import *
 from .slk.SlovakHateSpeechClassification import *
+from .slk.SlovakMovieReviewSentimentClassification import *
 from .slv.FrenkSlClassification import *
 from .spa.SpanishNewsClassification import *
 from .spa.SpanishSentimentClassification import *
 from .ssw.SiswatiNewsClassification import *
-from .svk.SlovakMovieReviewSentimentClassification import *
 from .swa.SwahiliNewsClassification import *
 from .swe.DalajClassification import *
 from .swe.SwedishSentimentClassification import *

mteb/tasks/Classification/{svk → slk}/SlovakMovieReviewSentimentClassification.py RENAMED Viewed

@@ -18,7 +18,7 @@ class SlovakMovieReviewSentimentClassification(AbsTaskClassification):
         category="s2s",
         modalities=["text"],
         eval_splits=["test"],
-        eval_langs=["svk-Latn"],
+        eval_langs=["slk-Latn"],
         main_score="accuracy",
         date=("2002-05-21", "2020-03-05"),
         dialect=[],
@@ -59,7 +59,7 @@ class SlovakMovieReviewSentimentClassificationV2(AbsTaskClassification):
         category="s2s",
         modalities=["text"],
         eval_splits=["test"],
-        eval_langs=["svk-Latn"],
+        eval_langs=["slk-Latn"],
         main_score="accuracy",
         date=("2002-05-21", "2020-03-05"),
         dialect=[],

mteb/tasks/Retrieval/multilingual/MIRACLRetrieval.py CHANGED Viewed

@@ -30,6 +30,39 @@ _LANGUAGES = {
     "zh": ["zho-Hans"],
 }
+_common_metadata = dict(
+    reference="http://miracl.ai",
+    type="Retrieval",
+    category="s2p",
+    modalities=["text"],
+    eval_splits=[_EVAL_SPLIT],
+    eval_langs=_LANGUAGES,
+    main_score="ndcg_at_10",
+    date=("2022-06-01", "2023-01-30"),
+    domains=["Encyclopaedic", "Written"],
+    task_subtypes=[],
+    license="cc-by-sa-4.0",
+    annotations_creators="expert-annotated",
+    dialect=[],
+    sample_creation="created",
+    bibtex_citation=r"""
+@article{10.1162/tacl_a_00595,
+  abstract = {{MIRACL is a multilingual dataset for ad hoc retrieval across 18 languages that collectively encompass over three billion native speakers around the world. This resource is designed to support monolingual retrieval tasks, where the queries and the corpora are in the same language. In total, we have gathered over 726k high-quality relevance judgments for 78k queries over Wikipedia in these languages, where all annotations have been performed by native speakers hired by our team. MIRACL covers languages that are both typologically close as well as distant from 10 language families and 13 sub-families, associated with varying amounts of publicly available resources. Extensive automatic heuristic verification and manual assessments were performed during the annotation process to control data quality. In total, MIRACL represents an investment of around five person-years of human annotator effort. Our goal is to spur research on improving retrieval across a continuum of languages, thus enhancing information access capabilities for diverse populations around the world, particularly those that have traditionally been underserved. MIRACL is available at http://miracl.ai/.}},
+  author = {Zhang, Xinyu and Thakur, Nandan and Ogundepo, Odunayo and Kamalloo, Ehsan and Alfonso-Hermelo, David and Li, Xiaoguang and Liu, Qun and Rezagholizadeh, Mehdi and Lin, Jimmy},
+  doi = {10.1162/tacl_a_00595},
+  eprint = {https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl\_a\_00595/2157340/tacl\_a\_00595.pdf},
+  issn = {2307-387X},
+  journal = {Transactions of the Association for Computational Linguistics},
+  month = {09},
+  pages = {1114-1131},
+  title = {{MIRACL: A Multilingual Retrieval Dataset Covering 18 Diverse Languages}},
+  url = {https://doi.org/10.1162/tacl\_a\_00595},
+  volume = {11},
+  year = {2023},
+}
+""",
+)
 def _load_miracl_data(
     path: str,
@@ -106,44 +139,15 @@ class MIRACLRetrieval(MultilingualTask, AbsTaskRetrieval):
     metadata = TaskMetadata(
         name="MIRACLRetrieval",
         description="MIRACL (Multilingual Information Retrieval Across a Continuum of Languages) is a multilingual retrieval dataset that focuses on search across 18 different languages.",
-        reference="http://miracl.ai",
         dataset={
             "path": "miracl/mmteb-miracl",
             "revision": "main",
             "trust_remote_code": True,
         },
-        type="Retrieval",
-        category="s2p",
-        modalities=["text"],
-        eval_splits=[_EVAL_SPLIT],
-        eval_langs=_LANGUAGES,
-        main_score="ndcg_at_10",
-        date=("2022-06-01", "2023-01-30"),
-        domains=["Encyclopaedic", "Written"],
-        task_subtypes=[],
-        license="cc-by-sa-4.0",
-        annotations_creators="expert-annotated",
-        dialect=[],
-        sample_creation="created",
-        bibtex_citation=r"""
-@article{10.1162/tacl_a_00595,
-  abstract = {{MIRACL is a multilingual dataset for ad hoc retrieval across 18 languages that collectively encompass over three billion native speakers around the world. This resource is designed to support monolingual retrieval tasks, where the queries and the corpora are in the same language. In total, we have gathered over 726k high-quality relevance judgments for 78k queries over Wikipedia in these languages, where all annotations have been performed by native speakers hired by our team. MIRACL covers languages that are both typologically close as well as distant from 10 language families and 13 sub-families, associated with varying amounts of publicly available resources. Extensive automatic heuristic verification and manual assessments were performed during the annotation process to control data quality. In total, MIRACL represents an investment of around five person-years of human annotator effort. Our goal is to spur research on improving retrieval across a continuum of languages, thus enhancing information access capabilities for diverse populations around the world, particularly those that have traditionally been underserved. MIRACL is available at http://miracl.ai/.}},
-  author = {Zhang, Xinyu and Thakur, Nandan and Ogundepo, Odunayo and Kamalloo, Ehsan and Alfonso-Hermelo, David and Li, Xiaoguang and Liu, Qun and Rezagholizadeh, Mehdi and Lin, Jimmy},
-  doi = {10.1162/tacl_a_00595},
-  eprint = {https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl\_a\_00595/2157340/tacl\_a\_00595.pdf},
-  issn = {2307-387X},
-  journal = {Transactions of the Association for Computational Linguistics},
-  month = {09},
-  pages = {1114-1131},
-  title = {{MIRACL: A Multilingual Retrieval Dataset Covering 18 Diverse Languages}},
-  url = {https://doi.org/10.1162/tacl\_a\_00595},
-  volume = {11},
-  year = {2023},
-}
-""",
         prompt={
             "query": "Given a question, retrieve Wikipedia passages that answer the question"
         },
+        **_common_metadata,
     )
     def load_data(self, **kwargs):
@@ -300,45 +304,58 @@ def _load_miracl_data_hard_negatives(
 class MIRACLRetrievalHardNegatives(MultilingualTask, AbsTaskRetrieval):
+    # in current version prompt for instruction models different from original task
+    superseded_by = "MIRACLRetrievalHardNegatives.v2"
     metadata = TaskMetadata(
         name="MIRACLRetrievalHardNegatives",
         description="MIRACL (Multilingual Information Retrieval Across a Continuum of Languages) is a multilingual retrieval dataset that focuses on search across 18 different languages. The hard negative version has been created by pooling the 250 top documents per query from BM25, e5-multilingual-large and e5-mistral-instruct.",
-        reference="http://miracl.ai",
         dataset={
             "path": "mteb/miracl-hard-negatives",
             "revision": "95c8db7d4a6e9c1d8a60601afd63d553ae20a2eb",
             "trust_remote_code": True,
         },
-        type="Retrieval",
-        category="s2p",
-        modalities=["text"],
-        eval_splits=[_EVAL_SPLIT],
-        eval_langs=_LANGUAGES,
-        main_score="ndcg_at_10",
-        date=("2022-06-01", "2023-01-30"),
-        domains=["Encyclopaedic", "Written"],
-        task_subtypes=[],
-        license="cc-by-sa-4.0",
-        annotations_creators="expert-annotated",
-        dialect=[],
-        sample_creation="created",
-        bibtex_citation=r"""
-@article{10.1162/tacl_a_00595,
-  abstract = {{MIRACL is a multilingual dataset for ad hoc retrieval across 18 languages that collectively encompass over three billion native speakers around the world. This resource is designed to support monolingual retrieval tasks, where the queries and the corpora are in the same language. In total, we have gathered over 726k high-quality relevance judgments for 78k queries over Wikipedia in these languages, where all annotations have been performed by native speakers hired by our team. MIRACL covers languages that are both typologically close as well as distant from 10 language families and 13 sub-families, associated with varying amounts of publicly available resources. Extensive automatic heuristic verification and manual assessments were performed during the annotation process to control data quality. In total, MIRACL represents an investment of around five person-years of human annotator effort. Our goal is to spur research on improving retrieval across a continuum of languages, thus enhancing information access capabilities for diverse populations around the world, particularly those that have traditionally been underserved. MIRACL is available at http://miracl.ai/.}},
-  author = {Zhang, Xinyu and Thakur, Nandan and Ogundepo, Odunayo and Kamalloo, Ehsan and Alfonso-Hermelo, David and Li, Xiaoguang and Liu, Qun and Rezagholizadeh, Mehdi and Lin, Jimmy},
-  doi = {10.1162/tacl_a_00595},
-  eprint = {https://direct.mit.edu/tacl/article-pdf/doi/10.1162/tacl\_a\_00595/2157340/tacl\_a\_00595.pdf},
-  issn = {2307-387X},
-  journal = {Transactions of the Association for Computational Linguistics},
-  month = {09},
-  pages = {1114-1131},
-  title = {{MIRACL: A Multilingual Retrieval Dataset Covering 18 Diverse Languages}},
-  url = {https://doi.org/10.1162/tacl\_a\_00595},
-  volume = {11},
-  year = {2023},
-}
-""",
         adapted_from=["MIRACLRetrieval"],
+        **_common_metadata,
+    )
+    def load_data(self, **kwargs):
+        if self.data_loaded:
+            return
+        self.corpus, self.queries, self.relevant_docs = (
+            _load_miracl_data_hard_negatives(
+                path=self.metadata.dataset["path"],
+                langs=self.hf_subsets,
+                splits=self.metadata_dict["eval_splits"],
+                cache_dir=kwargs.get("cache_dir", None),
+                revision=self.metadata.dataset["revision"],
+                trust_remote_code=self.metadata.dataset.get("trust_remote_code", False),
+            )
+        )
+        self.data_loaded = True
+class MIRACLRetrievalHardNegativesV2(MultilingualTask, AbsTaskRetrieval):
+    metadata = TaskMetadata(
+        name="MIRACLRetrievalHardNegatives.v2",
+        description=(
+            "MIRACL (Multilingual Information Retrieval Across a Continuum of Languages) is a multilingual retrieval "
+            "dataset that focuses on search across 18 different languages. The hard negative version has been "
+            "created by pooling the 250 top documents per query from BM25, e5-multilingual-large and e5-mistral-instruct."
+            "V2 uses a more appropriate prompt rather than the default prompt for retrieval."
+        ),
+        dataset={
+            "path": "mteb/miracl-hard-negatives",
+            "revision": "95c8db7d4a6e9c1d8a60601afd63d553ae20a2eb",
+            "trust_remote_code": True,
+        },
+        prompt={
+            "query": "Given a question, retrieve Wikipedia passages that answer the question",
+        },
+        adapted_from=["MIRACLRetrieval"],
+        **_common_metadata,
     )
     def load_data(self, **kwargs):

{mteb-1.39.5.dist-info → mteb-1.39.7.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: mteb
-Version: 1.39.5
+Version: 1.39.7
 Summary: Massive Text Embedding Benchmark
 Author-email: MTEB Contributors <niklas@huggingface.co>, nouamane@huggingface.co, info@nils-reimers.de
 License:                                  Apache License

{mteb-1.39.5.dist-info → mteb-1.39.7.dist-info}/RECORD RENAMED Viewed

@@ -48,11 +48,11 @@ mteb/abstasks/Image/AbsTaskVisualSTS.py,sha256=Gyke5MxDseNzZqz56it_tMI5jCNVdURrb
 mteb/abstasks/Image/AbsTaskZeroShotClassification.py,sha256=BC_Ev8ldT3gd4om4tzkTjUTwr7GFw7vePosNLSCdgZU,5163
 mteb/abstasks/Image/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 mteb/benchmarks/__init__.py,sha256=xfFZhvNbha5RS5dJL-j9cSYWdWckbZXHuM3ijmO7nCs,335
-mteb/benchmarks/_create_table.py,sha256=czqUoL9yXjY-jzS-2QL2PNwO8ObLVraJZCPFyoDTAdQ,16435
-mteb/benchmarks/benchmark.py,sha256=dpkku0__5nqFcSMUqirofMeW4i89YggEmIwC1nd3a4s,3859
+mteb/benchmarks/_create_table.py,sha256=9oc4szgHVNIAYTSAcR21DK3rot3Av-EXReDjEaOfSIQ,20758
+mteb/benchmarks/benchmark.py,sha256=I_qOOSUYz3Mxa3sSv3LfbxUESsw9yevFYtvzEkzskEg,4177
 mteb/benchmarks/get_benchmark.py,sha256=WxjPpjxcLtkAlxKnD9cQ2MtwpkxsIlvAtwwhE73EwsA,2744
 mteb/benchmarks/benchmarks/__init__.py,sha256=AdowVnEur-DVwKHtk_FoV3rIlmX9_lXoSsx95ZqkkqE,2131
-mteb/benchmarks/benchmarks/benchmarks.py,sha256=WKLa1VTRlWaE1myskseJr0aRfKIglH8o_vAIPQ2TNpk,83868
+mteb/benchmarks/benchmarks/benchmarks.py,sha256=fmjPlHTNgeJPvclT9K2F9CKfN43L-2Q1eJkTyRjLE2A,83899
 mteb/benchmarks/benchmarks/rteb_benchmarks.py,sha256=M4oRsbYe8daKlZZF0yUpEgxt7I4STVUD_ouIdp2RsRE,10640
 mteb/evaluation/LangMapping.py,sha256=_ipd6Cg_Za2xFS50t4DEAPxCVpOZPCs8c9lhp7Kv1q0,2831
 mteb/evaluation/MTEB.py,sha256=eN2xqG_rTmG4NRVltn0-8uBU0pK3y1Q0NAVPX9axsL0,32002
@@ -63,7 +63,7 @@ mteb/evaluation/evaluators/ClusteringEvaluator.py,sha256=8AhwqPiX_XPn8WuFLlAMuy7
 mteb/evaluation/evaluators/Evaluator.py,sha256=MXRcAAdg9SSKLIUf-rouDyCWz4zzUaGd_FXdB6aJYY0,896
 mteb/evaluation/evaluators/InstructionRetrievalEvaluator.py,sha256=xfT0C1g1FdOSonl6H7BR_8XE05N9VMxryCwm3zTfNLI,1525
 mteb/evaluation/evaluators/PairClassificationEvaluator.py,sha256=CZfYYVBwaqoc5nQ3A9JAIAgeNEtHgruhDG4fyVJlhBQ,9068
-mteb/evaluation/evaluators/RegressionEvaluator.py,sha256=qMwtCPhXH3jyg42SiXPOQnXASQRlNP_vcpx3wdPlxnk,2314
+mteb/evaluation/evaluators/RegressionEvaluator.py,sha256=ZZl3jAxOYFibNlD1bPX_uvJNntn4LTsHJiYtMxYMRFQ,2110
 mteb/evaluation/evaluators/RerankingEvaluator.py,sha256=E_XojL1my7iqNjtP8dtytWaGoVQEdCptIuPv3JDx6nc,22364
 mteb/evaluation/evaluators/RetrievalEvaluator.py,sha256=TCYwl1SbNp54QqhG1Zxlztgye8RgOGwpqgfeBfz2fHU,23558
 mteb/evaluation/evaluators/STSEvaluator.py,sha256=z59KeCDj_BzoMIgANQ_brFBumaqXNLfLEFX4V5NkGKs,3481
@@ -82,7 +82,7 @@ mteb/leaderboard/__init__.py,sha256=rb6vKGZV31m6x33LpKruPAwIBlQ5QzJVT0Y0do9DUSc,
 mteb/leaderboard/app.py,sha256=N6Ox5gzZHXdLaIyl8Yf1_Wu4yoOtyl0y6aVe_kzszts,31522
 mteb/leaderboard/benchmark_selector.py,sha256=dhZ9x3sqCkdcw7hJbqVr6PHSucPMbsGAgGPT6F_sow8,7196
 mteb/leaderboard/figures.py,sha256=wcSJWDJO4oATZlao_mY-oLDpj0QKvJp8pUhf4FbrI6s,7465
-mteb/leaderboard/table.py,sha256=X13bMrak-KQMEYo-zrJITcWLq7ZSOUBhAC9TSL40tSI,7323
+mteb/leaderboard/table.py,sha256=1Yx2xlKzn--RSLi1GAAwGx9mpGBcZVU5ECr191G385s,7339
 mteb/leaderboard/text_segments.py,sha256=fokW080HKfLbyHH-HAcoNQ1PoW4K1IQSr-MukHjEVhU,6609
 mteb/load_results/__init__.py,sha256=vtxMb4Zz2Jpn4GjY59qhsTyQpfX3z57-b0iLSqm5pBQ,250
 mteb/load_results/benchmark_results.py,sha256=XQSCCnJ967A0tjIZoOVVmjRWxYA663c6Xcob-t3psRY,31671
@@ -233,7 +233,7 @@ mteb/tasks/BitextMining/srn/SRNCorpusBitextMining.py,sha256=1KY3kQd31Wz2GPKTyshw
 mteb/tasks/BitextMining/srn/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 mteb/tasks/BitextMining/vie/VieMedEVBitextMining.py,sha256=KsEY8e6Mx2SjGlV5_JGqPrzcFxJxnSXh7fWt32zefR8,2760
 mteb/tasks/BitextMining/vie/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-mteb/tasks/Classification/__init__.py,sha256=bk9rC7VS5BFDkSai6GT9k3BzVHZFHu4U2o6J55sGgsw,9191
+mteb/tasks/Classification/__init__.py,sha256=8gKeMJfGQIAEXRAGsWwtbL43cY1DiRJYP66AsfUWXnI,9191
 mteb/tasks/Classification/ara/AJGT.py,sha256=GNhn0ddAmjhEsH2e-7Yva8ap0W53E0TNfGSTMY4vOqs,3142
 mteb/tasks/Classification/ara/HotelReviewSentimentClassification.py,sha256=Tb3uzfYHI5fbrC726IuXU0o7N0fCgiKFqTAycsBKZe8,3101
 mteb/tasks/Classification/ara/OnlineStoreReviewSentimentClassification.py,sha256=oenRFbJbIONJ04k4_tPHlUMpOdniE9P6_1v1gy9wlCI,2502
@@ -426,6 +426,7 @@ mteb/tasks/Classification/sin/SinhalaNewsSourceClassification.py,sha256=ShaqgmTF
 mteb/tasks/Classification/sin/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 mteb/tasks/Classification/slk/CSFDSKMovieReviewSentimentClassification.py,sha256=vCHn3qAb2hkZ1uVM7Pz1xNOsmDg6VjIJ91bJ5QB9O9U,3625
 mteb/tasks/Classification/slk/SlovakHateSpeechClassification.py,sha256=CgcXv4yvZ6wv82eE5d7P35PjDvxvWHlvoWg64kcMSGk,2400
+mteb/tasks/Classification/slk/SlovakMovieReviewSentimentClassification.py,sha256=Dj-2AxHElAITkL7nhMuv0OBC7HEImRYBT_8x_2Csshg,3365
 mteb/tasks/Classification/slk/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 mteb/tasks/Classification/slv/FrenkSlClassification.py,sha256=VjOwvpTDhEsKTR1zIWR3M998ZuWUz6MNm4_30ui0zYE,3266
 mteb/tasks/Classification/slv/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -434,8 +435,6 @@ mteb/tasks/Classification/spa/SpanishSentimentClassification.py,sha256=gEiTSir_3
 mteb/tasks/Classification/spa/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 mteb/tasks/Classification/ssw/SiswatiNewsClassification.py,sha256=YipX9ACHi25m-LDzQ5CxIRNgOL62oAT5NBapeQkzhKc,3110
 mteb/tasks/Classification/ssw/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-mteb/tasks/Classification/svk/SlovakMovieReviewSentimentClassification.py,sha256=ByiHVk6EpL2QLxHS3LAw4JBivN5hHXtXPdzTBb71ZUw,3365
-mteb/tasks/Classification/svk/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 mteb/tasks/Classification/swa/SwahiliNewsClassification.py,sha256=Iml296uPAsYNpMuRZTcTAa-BCvkh6WXAw0iemKS0yIg,3644
 mteb/tasks/Classification/swa/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 mteb/tasks/Classification/swe/DalajClassification.py,sha256=kWC4mzpRtP6iC3K9jNK0vKsO1zk7poIw_r7smCQ8OP8,4228
@@ -980,7 +979,7 @@ mteb/tasks/Retrieval/multilingual/CUREv1Retrieval.py,sha256=1icEnr1bhZTSwu05MTsx
 mteb/tasks/Retrieval/multilingual/CrossLingualSemanticDiscriminationWMT19.py,sha256=d_lcwJFEOzF_XWESftIW7dY6VAOTAHCvsFAIGqcuYSw,4885
 mteb/tasks/Retrieval/multilingual/CrossLingualSemanticDiscriminationWMT21.py,sha256=aPJ7Q3q6bF08fYO8JF7lRHIIzD42Rr0s0-SnL7TzHOE,4885
 mteb/tasks/Retrieval/multilingual/IndicQARetrieval.py,sha256=gcuYoqc8Oxw4eDC9JbsmSBzEK5ygFn7fIADX8A7EhJI,3863
-mteb/tasks/Retrieval/multilingual/MIRACLRetrieval.py,sha256=0DZYJgBICTmccCskm-YiUVH7L2bpt_YBSLH0lPVYif8,15039
+mteb/tasks/Retrieval/multilingual/MIRACLRetrieval.py,sha256=B-ingrCxfOyWkpE9aIIpwayAYlQt8QQA4Vbjm4EPSDE,14454
 mteb/tasks/Retrieval/multilingual/MKQARetrieval.py,sha256=d7KZAPROhcih_pXl2-p-d26QRR5i3UbyK2oYThC3vug,4477
 mteb/tasks/Retrieval/multilingual/MLQARetrieval.py,sha256=2hC-uGDGqJoRRIFNSRJXjFAzK4ITmFpsZ-jV0jCcdU8,6619
 mteb/tasks/Retrieval/multilingual/MintakaRetrieval.py,sha256=tnJ0PrUIsaWINxqfpU022ZGkUjAEVQeP0MWmwq70XPU,4400
@@ -1153,9 +1152,9 @@ mteb/tasks/aggregated_tasks/STS17MultilingualVisualSTS.py,sha256=uf02yWS1BOnffl8
 mteb/tasks/aggregated_tasks/STSBenchmarkMultilingualVisualSTS.py,sha256=ImA29OtG9sotn5PynAO4QSl5YdXgYVMbHfqfOD2skIk,3156
 mteb/tasks/aggregated_tasks/SynPerChatbotConvSAClassification.py,sha256=V2XjmsKqe4CTK2IPKuVM7T8hDPP7Uo1WkzbVZlHinKg,1220
 mteb/tasks/aggregated_tasks/__init__.py,sha256=MAU-3SqUN6nypOkdBv4MZVCA2tMnxuw317Jwct9QX-A,881
-mteb-1.39.5.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
-mteb-1.39.5.dist-info/METADATA,sha256=Z9wZ7ng9Ha9s_0Kpl3M3hLGDLDyd3WUPCXHhpsjpRPk,29039
-mteb-1.39.5.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
-mteb-1.39.5.dist-info/entry_points.txt,sha256=8IJoEJFKoDHmVnNev-qJ9pp4Ln7_1-ma9QsXnzVCzGU,39
-mteb-1.39.5.dist-info/top_level.txt,sha256=OLVIjcQAlWBz0bdmutKlWHLF42FF0hp4uVAg3ZyiG4U,5
-mteb-1.39.5.dist-info/RECORD,,
+mteb-1.39.7.dist-info/licenses/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
+mteb-1.39.7.dist-info/METADATA,sha256=9vYlBQSFrtp81iE0lKTdsZ5SVwD2H2gWANnBxqe-2H8,29039
+mteb-1.39.7.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+mteb-1.39.7.dist-info/entry_points.txt,sha256=8IJoEJFKoDHmVnNev-qJ9pp4Ln7_1-ma9QsXnzVCzGU,39
+mteb-1.39.7.dist-info/top_level.txt,sha256=OLVIjcQAlWBz0bdmutKlWHLF42FF0hp4uVAg3ZyiG4U,5
+mteb-1.39.7.dist-info/RECORD,,

mteb/tasks/Classification/svk/__init__.py DELETED Viewed

File without changes

{mteb-1.39.5.dist-info → mteb-1.39.7.dist-info}/WHEEL RENAMED Viewed

File without changes

{mteb-1.39.5.dist-info → mteb-1.39.7.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{mteb-1.39.5.dist-info → mteb-1.39.7.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

{mteb-1.39.5.dist-info → mteb-1.39.7.dist-info}/top_level.txt RENAMED Viewed

File without changes

mteb 1.39.5__py3-none-any.whl → 1.39.7__py3-none-any.whl

mteb 1.39.5__py3-none-any.whl → 1.39.7__py3-none-any.whl