PyPI - mteb - Versions diffs - 2.0.5__py3-none-any.whl → 2.1.19__py3-none-any.whl - Mend

mteb 2.0.5-py3-none-any.whl → 2.1.19-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (412)

mteb/models/model_implementations/voyage_models.py CHANGED Viewed

@@ -156,16 +156,15 @@ class VoyageModel(AbsEncoder):
                 and len(batch) < batch_size
                 and batch_tokens < self._max_tokens_per_batch
             ):
-                n_tokens = len(
-                    self._client.tokenize([sentences[index]], model=self._model_name)[0]
-                )
+                txt = sentences[index] if len(sentences[index]) > 0 else " "
+                n_tokens = len(self._client.tokenize([txt], model=self._model_name)[0])
                 if (
                     batch_tokens + n_tokens > self._max_tokens_per_batch
                     and len(batch) > 0
                 ):
                     break
                 batch_tokens += n_tokens
-                batch.append(sentences[index])
+                batch.append(txt)
                 index += 1
             embeddings.extend(
@@ -249,7 +248,7 @@ voyage_3_5 = ModelMeta(
     n_parameters=None,
     memory_usage_mb=None,
     license=None,
-    reference="https://docs.voyageai.com/docs/embeddings",
+    reference="https://blog.voyageai.com/2025/05/20/voyage-3-5/",
     similarity_fn_name="cosine",
     framework=["API"],
     use_instructions=True,
@@ -274,7 +273,7 @@ voyage_3_5_int8 = ModelMeta(
     n_parameters=None,
     memory_usage_mb=None,
     license=None,
-    reference="https://docs.voyageai.com/docs/flexible-dimensions-and-quantization",
+    reference="https://blog.voyageai.com/2025/05/20/voyage-3-5/",
     similarity_fn_name="cosine",
     framework=["API"],
     use_instructions=True,
@@ -300,7 +299,7 @@ voyage_3_5_binary = ModelMeta(
     n_parameters=None,
     memory_usage_mb=None,
     license=None,
-    reference="https://docs.voyageai.com/docs/flexible-dimensions-and-quantization",
+    reference="https://blog.voyageai.com/2025/05/20/voyage-3-5/",
     similarity_fn_name="cosine",
     framework=["API"],
     use_instructions=True,

mteb/models/model_implementations/voyage_v.py CHANGED Viewed

@@ -51,7 +51,13 @@ def _downsample_image(
 def voyage_v_loader(model_name, **kwargs):
     requires_package(
         voyage_v_loader,
-        "voyageai and tenacity",
+        "voyageai",
+        model_name,
+        "pip install 'mteb[voyage_v]'",
+    )
+    requires_package(
+        voyage_v_loader,
+        "tenacity",
         model_name,
         "pip install 'mteb[voyage_v]'",
     )
@@ -65,11 +71,9 @@ def voyage_v_loader(model_name, **kwargs):
             **kwargs: Any,
         ):
             requires_image_dependencies()
-            from torchvision import transforms
             self.model_name = model_name.split("/")[-1]
             self.vo = voyageai.Client()
-            self.tensor_to_image = transforms.Compose([transforms.PILToTensor()])
         @retry(
             stop=stop_after_attempt(6),  # Stop after 6 attempts
@@ -126,10 +130,7 @@ def voyage_v_loader(model_name, **kwargs):
             for batch in tqdm(
                 images, disable=not show_progress_bar, desc="Image Encoding"
             ):
-                batch_images = [
-                    [_downsample_image(self.tensor_to_image(image))]
-                    for image in batch["image"]
-                ]
+                batch_images = [[_downsample_image(image)] for image in batch["image"]]
                 embeddings = self._multimodal_embed(
                     batch_images, model=self.model_name, input_type=input_type
                 ).embeddings
@@ -148,6 +149,7 @@ def voyage_v_loader(model_name, **kwargs):
             show_progress_bar: bool = True,
             **kwargs: Any,
         ) -> Array:
+            input_type = "document"  # default
             if prompt_type is not None:
                 if prompt_type == PromptType.document:
                     input_type = "document"
@@ -163,8 +165,7 @@ def voyage_v_loader(model_name, **kwargs):
                     inputs, disable=not show_progress_bar, desc="Interleaved Encoding"
                 ):
                     batch_images = [
-                        _downsample_image(self.tensor_to_image(image))
-                        for image in batch["image"]
+                        _downsample_image(image) for image in batch["image"]
                     ]
                     batch_texts = batch["text"]
                     interleaved_inputs = [

mteb/models/model_implementations/yuan_models.py ADDED Viewed

@@ -0,0 +1,33 @@
+from mteb.models import ModelMeta, sentence_transformers_loader
+yuan_emb_zh_datasets = {
+    "CMedQAv2-reranking",
+    "DuRetrieval",
+    "MMarcoReranking",
+    "T2Reranking",
+    "T2Retrieval",
+}
+# not in mteb
+# "Multi-CPR":"http://github.com/Alibaba-NLP/Multi-CPR",
+yuan_embedding_2_zh = ModelMeta(
+    name="IEITYuan/Yuan-embedding-2.0-zh",
+    loader=sentence_transformers_loader,
+    languages=["zho-Hans"],
+    open_weights=True,
+    revision="b5ebcace6f4fc6e5a4d1852557eb2dc2d1040cee",
+    release_date="2025-11-24",
+    n_parameters=326000000,
+    memory_usage_mb=1242,
+    embed_dim=1792,
+    license="apache-2.0",
+    max_tokens=512,
+    reference="https://huggingface.co/IEITYuan/Yuan-embedding-2.0-zh",
+    similarity_fn_name="cosine",
+    framework=["Sentence Transformers", "PyTorch"],
+    use_instructions=False,
+    public_training_code=None,
+    public_training_data=None,
+    training_datasets=yuan_emb_zh_datasets,
+)

mteb/models/search_wrappers.py CHANGED Viewed

@@ -90,7 +90,7 @@ class SearchEncoderWrapper:
             queries,
             task_metadata,
             prompt_type=PromptType.query,
-            batch_size=encode_kwargs.get("batch_size", 32),
+            **encode_kwargs,
         )
         query_embeddings = self.model.encode(
@@ -165,7 +165,7 @@ class SearchEncoderWrapper:
                     sub_corpus,
                     task_metadata,
                     prompt_type=PromptType.document,
-                    batch_size=encode_kwargs.get("batch_size", 32),
+                    **encode_kwargs,
                 ),
                 task_metadata=task_metadata,
                 hf_split=hf_split,
@@ -191,6 +191,7 @@ class SearchEncoderWrapper:
             cos_scores_top_k_idx = cos_scores_top_k_idx.cpu().tolist()
             cos_scores_top_k_values = cos_scores_top_k_values.cpu().tolist()
+            sub_corpus_ids = list(sub_corpus_ids)
             for query_itr in range(len(query_embeddings)):
                 query_id = query_idx_to_id[query_itr]
                 for sub_corpus_id, score in zip(
@@ -230,7 +231,7 @@ class SearchEncoderWrapper:
                 self.task_corpus,
                 task_metadata,
                 prompt_type=PromptType.document,
-                batch_size=encode_kwargs.get("batch_size", 32),
+                **encode_kwargs,
             ),
             task_metadata=task_metadata,
             hf_split=hf_split,
@@ -407,13 +408,13 @@ class SearchCrossEncoderWrapper:
             Dataset.from_list(total_queries),
             task_metadata,
             prompt_type=PromptType.document,
-            batch_size=encode_kwargs.get("batch_size", 32),
+            **encode_kwargs,
         )
         corpus_loader = create_dataloader(
             Dataset.from_list(total_docs),
             task_metadata,
             prompt_type=PromptType.document,
-            batch_size=encode_kwargs.get("batch_size", 32),
+            **encode_kwargs,
         )
         predictions = self.model.predict(
             inputs1=queries_loader,

mteb/results/task_result.py CHANGED Viewed

@@ -32,7 +32,7 @@ from mteb.types import (
 logger = logging.getLogger(__name__)
-class Criterias(HelpfulStrEnum):
+class Criteria(HelpfulStrEnum):
     """Enum for criteria to check when merging TaskResult objects."""
     MTEB_VERSION = "mteb_version"
@@ -671,7 +671,7 @@ class TaskResult(BaseModel):
     def is_mergeable(
         self,
         result: TaskResult | AbsTask,
-        criteria: list[str] | list[Criterias] = [
+        criteria: list[str] | list[Criteria] = [
             "mteb_version",
             "dataset_revision",
         ],
@@ -688,9 +688,7 @@ class TaskResult(BaseModel):
         Returns:
             True if the TaskResult object can be merged with the other object, False otherwise.
         """
-        criteria = [
-            Criterias.from_str(c) if isinstance(c, str) else c for c in criteria
-        ]
+        criteria = [Criteria.from_str(c) if isinstance(c, str) else c for c in criteria]
         if isinstance(result, TaskResult):
             name = result.task_name
             revision = result.dataset_revision
@@ -700,27 +698,31 @@ class TaskResult(BaseModel):
             name = result.metadata.name
             revision = result.metadata.revision
         else:
+            msg = "result must be a TaskResult or AbsTask object"
+            if raise_error:
+                raise ValueError(msg)
+            logger.debug(msg)
             return False
         if self.task_name != name:
+            msg = f"Cannot merge TaskResult objects as they are derived from different tasks ({self.task_name} and {name})"
             if raise_error:
-                raise ValueError(
-                    f"Cannot merge TaskResult objects as they are derived from different tasks ({self.task_name} and {name})"
-                )
+                raise ValueError(msg)
+            logger.debug(msg)
             return False
-        if Criterias.MTEB_VERSION in criteria and self.mteb_version != mteb_version:
+        if Criteria.MTEB_VERSION in criteria and self.mteb_version != mteb_version:
+            msg = f"Cannot merge TaskResult objects as they are derived from different MTEB versions ({self.mteb_version} (loaded) and {mteb_version} (current))"
             if raise_error:
-                raise ValueError(
-                    f"Cannot merge TaskResult objects as they are derived from different MTEB versions ({self.mteb_version} and {mteb_version})"
-                )
+                raise ValueError(msg)
+            logger.debug(msg)
             return False
-        if Criterias.DATASET_REVISION in criteria and self.dataset_revision != revision:
+        if Criteria.DATASET_REVISION in criteria and self.dataset_revision != revision:
+            msg = f"Cannot merge TaskResult objects as they are derived from different dataset revisions ({self.dataset_revision} and {revision})"
             if raise_error:
-                raise ValueError(
-                    f"Cannot merge TaskResult objects as they are derived from different dataset revisions ({self.dataset_revision} and {revision})"
-                )
+                raise ValueError(msg)
+            logger.debug(msg)
             return False
         return True
@@ -728,7 +730,7 @@ class TaskResult(BaseModel):
     def merge(
         self,
         new_results: TaskResult,
-        criteria: list[str] | list[Criterias] = [
+        criteria: list[str] | list[Criteria] = [
             "mteb_version",
             "dataset_revision",
         ],

mteb/tasks/bitext_mining/multilingual/bucc_bitext_mining.py CHANGED Viewed

@@ -23,7 +23,7 @@ class BUCCBitextMining(AbsTaskBitextMining):
             "path": "mteb/BUCC",
             "revision": "414572247440f0ccacf7eb0bb70a31533a0e5443",
         },
-        description="BUCC bitext mining dataset",
+        description="BUCC bitext mining dataset train split.",
         reference="https://comparable.limsi.fr/bucc2018/bucc2018-task.html",
         type="BitextMining",
         category="t2t",
@@ -71,7 +71,9 @@ Rapp, Reinhard},
                 sentence1 = data["sentence1"][0]
                 sentence2 = data["sentence2"][0]
-                sentence1 = [sentence1[i] for (i, j) in gold]
+                sentence1 = [
+                    sentence1[i] for (i, j) in gold
+                ]  # keep only sentences in gold. The 2nd value is meant for sentence2 but not used here. This is fixed in BUCC.v2.
                 logger.info(f"Lang {lang} num gold {len(gold)}")
                 logger.info(f"Lang {lang} num sentence1 {len(sentence1)}")
                 logger.info(f"Lang {lang} num sentence2 {len(sentence2)}")

mteb/tasks/bitext_mining/multilingual/bucc_bitext_mining_fast.py CHANGED Viewed

@@ -20,7 +20,7 @@ class BUCCBitextMiningFast(AbsTaskBitextMining):
             "path": "mteb/bucc-bitext-mining",
             "revision": "1739dc11ffe9b7bfccd7f3d585aeb4c544fc6677",
         },
-        description="BUCC bitext mining dataset",
+        description="BUCC bitext mining dataset train split, gold set only.",
         reference="https://comparable.limsi.fr/bucc2018/bucc2018-task.html",
         type="BitextMining",
         category="t2t",

mteb/tasks/bitext_mining/multilingual/ru_sci_bench_bitext_mining.py CHANGED Viewed

@@ -10,11 +10,7 @@ class RuSciBenchBitextMining(AbsTaskBitextMining):
             "path": "mlsa-iai-msu-lab/ru_sci_bench_bitext_mining",
             "revision": "e5840033c5cf2573932db027ac8001fe0a7eb6fa",
         },
-        description="""This task focuses on finding translations of scientific articles.
-        The dataset is sourced from eLibrary, Russia's largest electronic library of scientific publications.
-        Russian authors often provide English translations for their abstracts and titles,
-        and the data consists of these paired titles and abstracts. The task evaluates a model's ability
-        to match an article's Russian title and abstract to its English counterpart, or vice versa.""",
+        description="This task focuses on finding translations of scientific articles. The dataset is sourced from eLibrary, Russia's largest electronic library of scientific publications. Russian authors often provide English translations for their abstracts and titles, and the data consists of these paired titles and abstracts. The task evaluates a model's ability to match an article's Russian title and abstract to its English counterpart, or vice versa.",
         reference="https://github.com/mlsa-iai-msu-lab/ru_sci_bench_mteb",
         type="BitextMining",
         category="t2c",

mteb/tasks/bitext_mining/multilingual/web_faq_bitext_mining.py CHANGED Viewed

@@ -198,9 +198,7 @@ _SPLITS = ["default"]
 class WebFAQBitextMiningQuestions(AbsTaskBitextMining):
     metadata = TaskMetadata(
         name="WebFAQBitextMiningQuestions",
-        description="""The WebFAQ Bitext Dataset consists of natural FAQ-style Question-Answer pairs that align across languages.
-A sentence in the "WebFAQBitextMiningQuestions" task is the question originating from an aligned QA.
-The dataset is sourced from FAQ pages on the web.""",
+        description='The WebFAQ Bitext Dataset consists of natural FAQ-style Question-Answer pairs that align across languages. A sentence in the "WebFAQBitextMiningQuestions" task is the question originating from an aligned QA. The dataset is sourced from FAQ pages on the web.',
         reference="https://huggingface.co/PaDaS-Lab",
         dataset={
             "path": "PaDaS-Lab/webfaq-bitexts",
@@ -254,9 +252,7 @@ The dataset is sourced from FAQ pages on the web.""",
 class WebFAQBitextMiningQAs(AbsTaskBitextMining):
     metadata = TaskMetadata(
         name="WebFAQBitextMiningQAs",
-        description="""The WebFAQ Bitext Dataset consists of natural FAQ-style Question-Answer pairs that align across languages.
-A sentence in the "WebFAQBitextMiningQAs" task is a concatenation of a question and its corresponding answer.
-The dataset is sourced from FAQ pages on the web.""",
+        description='The WebFAQ Bitext Dataset consists of natural FAQ-style Question-Answer pairs that align across languages. A sentence in the "WebFAQBitextMiningQAs" task is a concatenation of a question and its corresponding answer. The dataset is sourced from FAQ pages on the web.',
         reference="https://huggingface.co/PaDaS-Lab",
         dataset={
             "path": "PaDaS-Lab/webfaq-bitexts",

mteb/tasks/classification/ara/ajgt.py CHANGED Viewed

@@ -45,8 +45,7 @@ class AJGTV2(AbsTaskClassification):
             "path": "mteb/ajgt",
             "revision": "0a3dea7301ee0c051891f04d32f3e8577a9eae36",
         },
-        description="""Arabic Jordanian General Tweets (AJGT) Corpus consisted of 1,800 tweets (900 for training and 900 for testing) annotated as positive and negative. Modern Standard Arabic (MSA) or Jordanian dialect.
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2632)""",
+        description="Arabic Jordanian General Tweets (AJGT) Corpus consisted of 1,800 tweets (900 for training and 900 for testing) annotated as positive and negative. Modern Standard Arabic (MSA) or Jordanian dialect. This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2632)",
         reference="https://link.springer.com/chapter/10.1007/978-3-319-60042-0_66/",
         type="Classification",
         category="t2c",

mteb/tasks/classification/ara/hotel_review_sentiment_classification.py CHANGED Viewed

@@ -45,8 +45,7 @@ class HotelReviewSentimentClassificationV2(AbsTaskClassification):
             "path": "mteb/HotelReviewSentimentClassification",
             "revision": "f5e6a24acbed4182114ffdf46747090b3f51e836",
         },
-        description="""HARD is a dataset of Arabic hotel reviews collected from the Booking.com website.
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2632)""",
+        description="HARD is a dataset of Arabic hotel reviews collected from the Booking.com website. This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2632)",
         reference="https://link.springer.com/chapter/10.1007/978-3-319-67056-0_3",
         type="Classification",
         category="t2c",

mteb/tasks/classification/ara/online_store_review_sentiment_classification.py CHANGED Viewed

@@ -41,8 +41,7 @@ class OnlineStoreReviewSentimentClassificationV2(AbsTaskClassification):
             "path": "mteb/online_store_review_sentiment",
             "revision": "de0e8eed65adf1cbc58f8743a5f5c5df556de4c4",
         },
-        description="""This dataset contains Arabic reviews of products from the SHEIN online store.
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2632)""",
+        description="This dataset contains Arabic reviews of products from the SHEIN online store. This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2632)",
         reference="https://huggingface.co/datasets/Ruqiya/Arabic_Reviews_of_SHEIN",
         type="Classification",
         category="t2c",

mteb/tasks/classification/ara/restaurant_review_sentiment_classification.py CHANGED Viewed

@@ -52,8 +52,7 @@ class RestaurantReviewSentimentClassificationV2(AbsTaskClassification):
             "path": "mteb/restaurant_review_sentiment",
             "revision": "5d28c1e8fb393173a849696ed178b90a6f78754a",
         },
-        description="""Dataset of 8156 restaurant reviews from qaym.com in Arabic for sentiment analysis
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2632)""",
+        description="Dataset of 8156 restaurant reviews from qaym.com in Arabic for sentiment analysis This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2632)",
         reference="https://link.springer.com/chapter/10.1007/978-3-319-18117-2_2",
         type="Classification",
         category="t2c",

mteb/tasks/classification/ara/tweet_emotion_classification.py CHANGED Viewed

@@ -45,8 +45,7 @@ class TweetEmotionClassificationV2(AbsTaskClassification):
             "path": "mteb/TweetEmotionClassification",
             "revision": "930d65840c089406ceed5241b1a9ba7294e5eeae",
         },
-        description="""A dataset of 10,012 tweets that was created with the aim of covering the most frequently used emotion categories in Arabic tweets.
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2632)""",
+        description="A dataset of 10,012 tweets that was created with the aim of covering the most frequently used emotion categories in Arabic tweets. This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2632)",
         reference="https://link.springer.com/chapter/10.1007/978-3-319-77116-8_8",
         type="Classification",
         category="t2c",

mteb/tasks/classification/ara/tweet_sarcasm_classification.py CHANGED Viewed

@@ -62,8 +62,7 @@ class TweetSarcasmClassificationV2(AbsTaskClassification):
             "path": "mteb/tweet_sarcasm",
             "revision": "3a20898e2ea3303844e907d55f7a815a7644150d",
         },
-        description="""Arabic sarcasm detection dataset, which was created through the reannotation of available Arabic sentiment analysis datasets.
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2632)""",
+        description="Arabic sarcasm detection dataset, which was created through the reannotation of available Arabic sentiment analysis datasets. This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2632)",
         reference="https://aclanthology.org/2020.osact-1.5/",
         type="Classification",
         category="t2c",

mteb/tasks/classification/ben/bengali_document_classification.py CHANGED Viewed

@@ -55,8 +55,7 @@ Islam, Tanvir},
 class BengaliDocumentClassificationV2(AbsTaskClassification):
     metadata = TaskMetadata(
         name="BengaliDocumentClassification.v2",
-        description="""Dataset for News Classification, categorized with 13 domains.
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2632)""",
+        description="Dataset for News Classification, categorized with 13 domains. This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2632)",
         reference="https://aclanthology.org/2023.eacl-main.4",
         dataset={
             "path": "mteb/bengali_document",

mteb/tasks/classification/ben/bengali_hate_speech_classification.py CHANGED Viewed

@@ -45,8 +45,7 @@ class BengaliHateSpeechClassification(AbsTaskClassification):
 class BengaliHateSpeechClassificationV2(AbsTaskClassification):
     metadata = TaskMetadata(
         name="BengaliHateSpeechClassification.v2",
-        description="""The Bengali Hate Speech Dataset is a Bengali-language dataset of news articles collected from various Bengali media sources and categorized based on the type of hate in the text.
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2632)""",
+        description="The Bengali Hate Speech Dataset is a Bengali-language dataset of news articles collected from various Bengali media sources and categorized based on the type of hate in the text. This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2632)",
         reference="https://huggingface.co/datasets/bn_hate_speech",
         dataset={
             "path": "mteb/bengali_hate_speech",

mteb/tasks/classification/ben/bengali_sentiment_analysis.py CHANGED Viewed

@@ -45,8 +45,7 @@ class BengaliSentimentAnalysis(AbsTaskClassification):
 class BengaliSentimentAnalysisV2(AbsTaskClassification):
     metadata = TaskMetadata(
         name="BengaliSentimentAnalysis.v2",
-        description="""dataset contains 2854 Negative reviews and 7238 Positive reviews collected and manually annotated from Youtube Bengali drama.
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2632)""",
+        description="dataset contains 2854 Negative reviews and 7238 Positive reviews collected and manually annotated from Youtube Bengali drama. This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2632)",
         reference="https://data.mendeley.com/datasets/p6zc7krs37/4",
         dataset={
             "path": "mteb/bengali_sentiment_analysis",

mteb/tasks/classification/ces/csfdcz_movie_review_sentiment_classification.py CHANGED Viewed

@@ -51,8 +51,7 @@ class CSFDCZMovieReviewSentimentClassification(AbsTaskClassification):
 class CSFDCZMovieReviewSentimentClassificationV2(AbsTaskClassification):
     metadata = TaskMetadata(
         name="CSFDCZMovieReviewSentimentClassification.v2",
-        description="""The dataset contains 30k user reviews from csfd.cz in Czech.
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)""",
+        description="The dataset contains 30k user reviews from csfd.cz in Czech. This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)",
         reference="https://arxiv.org/abs/2304.01922",
         dataset={
             "path": "mteb/csfdcz_movie_review_sentiment",

mteb/tasks/classification/ces/czech_product_review_sentiment_classification.py CHANGED Viewed

@@ -58,8 +58,7 @@ Montoyo, Andres},
 class CzechProductReviewSentimentClassificationV2(AbsTaskClassification):
     metadata = TaskMetadata(
         name="CzechProductReviewSentimentClassification.v2",
-        description="""User reviews of products on Czech e-shop Mall.cz with 3 sentiment classes (positive, neutral, negative)
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)""",
+        description="User reviews of products on Czech e-shop Mall.cz with 3 sentiment classes (positive, neutral, negative) This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)",
         reference="https://aclanthology.org/W13-1609/",
         dataset={
             "path": "mteb/czech_product_review_sentiment",

mteb/tasks/classification/ces/czech_so_me_sentiment_classification.py CHANGED Viewed

@@ -55,8 +55,7 @@ Montoyo, Andres},
 class CzechSoMeSentimentClassificationV2(AbsTaskClassification):
     metadata = TaskMetadata(
         name="CzechSoMeSentimentClassification.v2",
-        description="""User comments on Facebook
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)""",
+        description="User comments on Facebook This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)",
         reference="https://aclanthology.org/W13-1609/",
         dataset={
             "path": "mteb/czech_so_me_sentiment",

mteb/tasks/classification/dan/angry_tweets_classification.py CHANGED Viewed

@@ -9,7 +9,7 @@ class AngryTweetsClassification(AbsTaskClassification):
             "path": "DDSC/angry-tweets",
             "revision": "20b0e6081892e78179356fada741b7afa381443d",
         },
-        description="A sentiment dataset with 3 classes (positiv, negativ, neutral) for Danish tweets",
+        description="A sentiment dataset with 3 classes (positive, negative, neutral) for Danish tweets",
         reference="https://aclanthology.org/2021.nodalida-main.53/",
         type="Classification",
         category="t2c",
@@ -47,8 +47,7 @@ class AngryTweetsClassificationV2(AbsTaskClassification):
             "path": "mteb/angry_tweets",
             "revision": "b9475fb66a13befda4fa9871cd92343bb2c0eb77",
         },
-        description="""A sentiment dataset with 3 classes (positiv, negativ, neutral) for Danish tweets
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)""",
+        description="A sentiment dataset with 3 classes (positive, negative, neutral) for Danish tweets This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)",
         reference="https://aclanthology.org/2021.nodalida-main.53/",
         type="Classification",
         category="t2c",

mteb/tasks/classification/dan/danish_political_comments_classification.py CHANGED Viewed

@@ -49,8 +49,7 @@ class DanishPoliticalCommentsClassificationV2(AbsTaskClassification):
             "path": "mteb/danish_political_comments",
             "revision": "476a9e7327aba70ad3e97a169d7310b86be9b245",
         },
-        description="""A dataset of Danish political comments rated for sentiment
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)""",
+        description="A dataset of Danish political comments rated for sentiment This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)",
         reference="https://huggingface.co/datasets/danish_political_comments",
         type="Classification",
         category="t2c",

mteb/tasks/classification/dan/ddisco_cohesion_classification.py CHANGED Viewed

@@ -69,8 +69,7 @@ class DdiscoCohesionClassificationV2(AbsTaskClassification):
             "path": "mteb/ddisco_cohesion",
             "revision": "b5a05bdecdfc6efc14eebc8f7a86e0986edaf5ff",
         },
-        description="""A Danish Discourse dataset with values for coherence and source (Wikipedia or Reddit)
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)""",
+        description="A Danish Discourse dataset with values for coherence and source (Wikipedia or Reddit) This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)",
         reference="https://aclanthology.org/2022.lrec-1.260/",
         type="Classification",
         category="t2c",

mteb/tasks/classification/dan/dk_hate_classification.py CHANGED Viewed

@@ -76,8 +76,7 @@ class DKHateClassificationV2(AbsTaskClassification):
             "path": "mteb/dk_hate",
             "revision": "0468ff11393992d8347cf4282fb706fe970608d4",
         },
-        description="""Danish Tweets annotated for Hate Speech either being Offensive or not
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)""",
+        description="Danish Tweets annotated for Hate Speech either being Offensive or not This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)",
         reference="https://aclanthology.org/2020.lrec-1.430/",
         type="Classification",
         category="t2c",

mteb/tasks/classification/deu/german_politicians_twitter_sentiment_classification.py CHANGED Viewed

@@ -56,8 +56,7 @@ Zesch, Torsten},
 class GermanPoliticiansTwitterSentimentClassificationV2(AbsTaskClassification):
     metadata = TaskMetadata(
         name="GermanPoliticiansTwitterSentimentClassification.v2",
-        description="""GermanPoliticiansTwitterSentiment is a dataset of German tweets categorized with their sentiment (3 classes).
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)""",
+        description="GermanPoliticiansTwitterSentiment is a dataset of German tweets categorized with their sentiment (3 classes). This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)",
         reference="https://aclanthology.org/2022.konvens-1.9",
         dataset={
             "path": "mteb/german_politicians_twitter_sentiment",

mteb/tasks/classification/deu/ten_k_gnad_classification.py CHANGED Viewed

@@ -43,8 +43,7 @@ class TenKGnadClassification(AbsTaskClassification):
 class TenKGnadClassificationV2(AbsTaskClassification):
     metadata = TaskMetadata(
         name="TenKGnadClassification.v2",
-        description="""10k German News Articles Dataset (10kGNAD) contains news articles from the online Austrian newspaper website DER Standard with their topic classification (9 classes).
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)""",
+        description="10k German News Articles Dataset (10kGNAD) contains news articles from the online Austrian newspaper website DER Standard with their topic classification (9 classes). This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)",
         reference="https://tblock.github.io/10kGNAD/",
         dataset={
             "path": "mteb/ten_k_gnad",

mteb/tasks/classification/eng/amazon_polarity_classification.py CHANGED Viewed

@@ -44,8 +44,7 @@ class AmazonPolarityClassification(AbsTaskClassification):
 class AmazonPolarityClassificationV2(AbsTaskClassification):
     metadata = TaskMetadata(
         name="AmazonPolarityClassification.v2",
-        description="""Amazon Polarity Classification Dataset.
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)""",
+        description="Amazon Polarity Classification Dataset. This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)",
         reference="https://huggingface.co/datasets/amazon_polarity",
         dataset={
             "path": "mteb/amazon_polarity",

mteb/tasks/classification/eng/arxiv_classification.py CHANGED Viewed

@@ -43,8 +43,7 @@ class ArxivClassification(AbsTaskClassification):
 class ArxivClassificationV2(AbsTaskClassification):
     metadata = TaskMetadata(
         name="ArxivClassification.v2",
-        description="""Classification Dataset of Arxiv Papers
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)""",
+        description="Classification Dataset of Arxiv Papers This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)",
         dataset={
             "path": "mteb/arxiv",
             "revision": "202e10e9a5d37a5068397b48184d0728346a7b4a",

mteb/tasks/classification/eng/banking77_classification.py CHANGED Viewed

@@ -61,8 +61,7 @@ Shah, Rushin},
 class Banking77ClassificationV2(AbsTaskClassification):
     metadata = TaskMetadata(
         name="Banking77Classification.v2",
-        description="""Dataset composed of online banking queries annotated with their corresponding intents.
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)""",
+        description="Dataset composed of online banking queries annotated with their corresponding intents. This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)",
         reference="https://arxiv.org/abs/2003.04807",
         dataset={
             "path": "mteb/banking77",

mteb/tasks/classification/eng/dbpedia_classification.py CHANGED Viewed

@@ -50,8 +50,7 @@ class DBpediaClassification(AbsTaskClassification):
 class DBpediaClassificationV2(AbsTaskClassification):
     metadata = TaskMetadata(
         name="DBpediaClassification.v2",
-        description="""DBpedia14 is a dataset of English texts from Wikipedia articles, categorized into 14 non-overlapping classes based on their DBpedia ontology.
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)""",
+        description="DBpedia14 is a dataset of English texts from Wikipedia articles, categorized into 14 non-overlapping classes based on their DBpedia ontology. This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)",
         reference="https://arxiv.org/abs/1509.01626",
         dataset={
             "path": "mteb/d_bpedia",

mteb/tasks/classification/eng/emotion_classification.py CHANGED Viewed

@@ -59,8 +59,7 @@ Tsujii, Jun{'}ichi},
 class EmotionClassificationV2(AbsTaskClassification):
     metadata = TaskMetadata(
         name="EmotionClassification.v2",
-        description="""Emotion is a dataset of English Twitter messages with six basic emotions: anger, fear, joy, love, sadness, and surprise.
-        This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)""",
+        description="Emotion is a dataset of English Twitter messages with six basic emotions: anger, fear, joy, love, sadness, and surprise. This version corrects errors found in the original data. For details, see [pull request](https://github.com/embeddings-benchmark/mteb/pull/2900)",
         reference="https://www.aclweb.org/anthology/D18-1404",
         dataset={
             "path": "mteb/emotion",

mteb 2.0.5__py3-none-any.whl → 2.1.19__py3-none-any.whl

mteb 2.0.5__py3-none-any.whl → 2.1.19__py3-none-any.whl