mteb 2.0.5 → 2.1.19 (py3-none-any.whl)
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- mteb/__init__.py +10 -1
- mteb/_create_dataloaders.py +8 -3
- mteb/_evaluators/any_sts_evaluator.py +14 -12
- mteb/_evaluators/clustering_evaluator.py +1 -1
- mteb/_evaluators/image/imagetext_pairclassification_evaluator.py +2 -2
- mteb/_evaluators/pair_classification_evaluator.py +3 -1
- mteb/_evaluators/retrieval_metrics.py +0 -9
- mteb/_evaluators/sklearn_evaluator.py +15 -28
- mteb/_evaluators/text/bitext_mining_evaluator.py +4 -1
- mteb/_evaluators/text/summarization_evaluator.py +4 -2
- mteb/_evaluators/zeroshot_classification_evaluator.py +2 -2
- mteb/abstasks/_stratification.py +1 -1
- mteb/abstasks/abstask.py +6 -1
- mteb/abstasks/clustering.py +1 -1
- mteb/abstasks/dataset_card_template.md +1 -1
- mteb/abstasks/multilabel_classification.py +2 -2
- mteb/abstasks/retrieval.py +2 -1
- mteb/abstasks/retrieval_dataset_loaders.py +1 -1
- mteb/abstasks/task_metadata.py +2 -1
- mteb/benchmarks/_create_table.py +1 -3
- mteb/benchmarks/benchmark.py +18 -1
- mteb/benchmarks/benchmarks/__init__.py +4 -0
- mteb/benchmarks/benchmarks/benchmarks.py +125 -16
- mteb/benchmarks/get_benchmark.py +3 -1
- mteb/cache.py +7 -3
- mteb/descriptive_stats/Classification/DutchColaClassification.json +54 -0
- mteb/descriptive_stats/Classification/DutchGovernmentBiasClassification.json +54 -0
- mteb/descriptive_stats/Classification/DutchNewsArticlesClassification.json +90 -0
- mteb/descriptive_stats/Classification/DutchSarcasticHeadlinesClassification.json +54 -0
- mteb/descriptive_stats/Classification/IconclassClassification.json +96 -0
- mteb/descriptive_stats/Classification/OpenTenderClassification.json +222 -0
- mteb/descriptive_stats/Classification/VaccinChatNLClassification.json +1068 -0
- mteb/descriptive_stats/Clustering/DutchNewsArticlesClusteringP2P.json +45 -0
- mteb/descriptive_stats/Clustering/DutchNewsArticlesClusteringS2S.json +45 -0
- mteb/descriptive_stats/Clustering/IconclassClusteringS2S.json +48 -0
- mteb/descriptive_stats/Clustering/OpenTenderClusteringP2P.json +111 -0
- mteb/descriptive_stats/Clustering/OpenTenderClusteringS2S.json +111 -0
- mteb/descriptive_stats/Clustering/VABBClusteringP2P.json +60 -0
- mteb/descriptive_stats/Clustering/VABBClusteringS2S.json +60 -0
- mteb/descriptive_stats/Image/Any2AnyMultilingualRetrieval/XFlickr30kCoT2IRetrieval.json +243 -153
- mteb/descriptive_stats/Image/Any2AnyMultilingualRetrieval/XM3600T2IRetrieval.json +999 -629
- mteb/descriptive_stats/Image/Any2AnyRetrieval/OVENIT2TRetrieval.json +33 -17
- mteb/descriptive_stats/Image/DocumentUnderstanding/MIRACLVisionRetrieval.json +574 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3ComputerScienceRetrieval.json +214 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3EnergyRetrieval.json +214 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3FinanceEnRetrieval.json +214 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3FinanceFrRetrieval.json +214 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3HrRetrieval.json +214 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3IndustrialRetrieval.json +214 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3NuclearRetrieval.json +214 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3PharmaceuticalsRetrieval.json +214 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3PhysicsRetrieval.json +214 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3TelecomRetrieval.json +214 -0
- mteb/descriptive_stats/MultilabelClassification/CovidDisinformationNLMultiLabelClassification.json +84 -0
- mteb/descriptive_stats/MultilabelClassification/VABBMultiLabelClassification.json +156 -0
- mteb/descriptive_stats/PairClassification/SICKNLPairClassification.json +35 -0
- mteb/descriptive_stats/PairClassification/XLWICNLPairClassification.json +35 -0
- mteb/descriptive_stats/Retrieval/ArguAna-NL.v2.json +30 -0
- mteb/descriptive_stats/Retrieval/ClimateFEVERHardNegatives.v2.json +30 -0
- mteb/descriptive_stats/Retrieval/DBPediaHardNegatives.v2.json +30 -0
- mteb/descriptive_stats/Retrieval/DutchNewsArticlesRetrieval.json +30 -0
- mteb/descriptive_stats/Retrieval/FEVERHardNegatives.v2.json +30 -0
- mteb/descriptive_stats/Retrieval/HotpotQAHardNegatives.v2.json +30 -0
- mteb/descriptive_stats/Retrieval/LegalQANLRetrieval.json +30 -0
- mteb/descriptive_stats/Retrieval/NFCorpus-NL.v2.json +30 -0
- mteb/descriptive_stats/Retrieval/OpenTenderRetrieval.json +30 -0
- mteb/descriptive_stats/Retrieval/QuoraRetrievalHardNegatives.v2.json +30 -0
- mteb/descriptive_stats/Retrieval/RiaNewsRetrievalHardNegatives.v2.json +30 -0
- mteb/descriptive_stats/Retrieval/SCIDOCS-NL.v2.json +30 -0
- mteb/descriptive_stats/Retrieval/SciFact-NL.v2.json +30 -0
- mteb/descriptive_stats/Retrieval/VABBRetrieval.json +30 -0
- mteb/descriptive_stats/Retrieval/VDRMultilingualRetrieval.json +184 -0
- mteb/descriptive_stats/Retrieval/WinoGrande.json +14 -14
- mteb/descriptive_stats/Retrieval/bBSARDNLRetrieval.json +30 -0
- mteb/descriptive_stats/STS/SICK-NL-STS.json +28 -0
- mteb/evaluate.py +26 -6
- mteb/languages/check_language_code.py +11 -3
- mteb/languages/language_scripts.py +4 -0
- mteb/leaderboard/app.py +5 -3
- mteb/leaderboard/benchmark_selector.py +4 -2
- mteb/leaderboard/text_segments.py +1 -1
- mteb/models/cache_wrappers/cache_wrapper.py +1 -1
- mteb/models/instruct_wrapper.py +3 -0
- mteb/models/model_implementations/align_models.py +6 -0
- mteb/models/model_implementations/andersborges.py +51 -0
- mteb/models/model_implementations/ara_models.py +7 -0
- mteb/models/model_implementations/b1ade_models.py +1 -1
- mteb/models/model_implementations/bge_models.py +1 -3
- mteb/models/model_implementations/blip2_models.py +9 -0
- mteb/models/model_implementations/blip_models.py +19 -0
- mteb/models/model_implementations/bmretriever_models.py +1 -1
- mteb/models/model_implementations/cadet_models.py +8 -0
- mteb/models/model_implementations/cde_models.py +12 -0
- mteb/models/model_implementations/codefuse_models.py +15 -0
- mteb/models/model_implementations/codesage_models.py +12 -0
- mteb/models/model_implementations/cohere_models.py +1 -1
- mteb/models/model_implementations/colqwen_models.py +57 -0
- mteb/models/model_implementations/emillykkejensen_models.py +70 -0
- mteb/models/model_implementations/gme_v_models.py +2 -2
- mteb/models/model_implementations/ibm_granite_models.py +1 -1
- mteb/models/model_implementations/inf_models.py +3 -3
- mteb/models/model_implementations/jasper_models.py +253 -2
- mteb/models/model_implementations/jina_models.py +12 -2
- mteb/models/model_implementations/kalm_models.py +159 -25
- mteb/models/model_implementations/llm2vec_models.py +1 -1
- mteb/models/model_implementations/misc_models.py +8 -2
- mteb/models/model_implementations/moco_models.py +9 -0
- mteb/models/model_implementations/mxbai_models.py +1 -1
- mteb/models/model_implementations/openclip_models.py +16 -0
- mteb/models/model_implementations/piccolo_models.py +6 -0
- mteb/models/model_implementations/rasgaard_models.py +33 -0
- mteb/models/model_implementations/reasonir_model.py +1 -1
- mteb/models/model_implementations/salesforce_models.py +1 -1
- mteb/models/model_implementations/seed_1_6_embedding_models.py +1 -1
- mteb/models/model_implementations/spartan8806_atles_champion.py +26 -0
- mteb/models/model_implementations/tarka_models.py +374 -0
- mteb/models/model_implementations/voyage_models.py +6 -7
- mteb/models/model_implementations/voyage_v.py +10 -9
- mteb/models/model_implementations/yuan_models.py +33 -0
- mteb/models/search_wrappers.py +6 -5
- mteb/results/task_result.py +19 -17
- mteb/tasks/bitext_mining/multilingual/bucc_bitext_mining.py +4 -2
- mteb/tasks/bitext_mining/multilingual/bucc_bitext_mining_fast.py +1 -1
- mteb/tasks/bitext_mining/multilingual/ru_sci_bench_bitext_mining.py +1 -5
- mteb/tasks/bitext_mining/multilingual/web_faq_bitext_mining.py +2 -6
- mteb/tasks/classification/ara/ajgt.py +1 -2
- mteb/tasks/classification/ara/hotel_review_sentiment_classification.py +1 -2
- mteb/tasks/classification/ara/online_store_review_sentiment_classification.py +1 -2
- mteb/tasks/classification/ara/restaurant_review_sentiment_classification.py +1 -2
- mteb/tasks/classification/ara/tweet_emotion_classification.py +1 -2
- mteb/tasks/classification/ara/tweet_sarcasm_classification.py +1 -2
- mteb/tasks/classification/ben/bengali_document_classification.py +1 -2
- mteb/tasks/classification/ben/bengali_hate_speech_classification.py +1 -2
- mteb/tasks/classification/ben/bengali_sentiment_analysis.py +1 -2
- mteb/tasks/classification/ces/csfdcz_movie_review_sentiment_classification.py +1 -2
- mteb/tasks/classification/ces/czech_product_review_sentiment_classification.py +1 -2
- mteb/tasks/classification/ces/czech_so_me_sentiment_classification.py +1 -2
- mteb/tasks/classification/dan/angry_tweets_classification.py +2 -3
- mteb/tasks/classification/dan/danish_political_comments_classification.py +1 -2
- mteb/tasks/classification/dan/ddisco_cohesion_classification.py +1 -2
- mteb/tasks/classification/dan/dk_hate_classification.py +1 -2
- mteb/tasks/classification/deu/german_politicians_twitter_sentiment_classification.py +1 -2
- mteb/tasks/classification/deu/ten_k_gnad_classification.py +1 -2
- mteb/tasks/classification/eng/amazon_polarity_classification.py +1 -2
- mteb/tasks/classification/eng/arxiv_classification.py +1 -2
- mteb/tasks/classification/eng/banking77_classification.py +1 -2
- mteb/tasks/classification/eng/dbpedia_classification.py +1 -2
- mteb/tasks/classification/eng/emotion_classification.py +1 -2
- mteb/tasks/classification/eng/financial_phrasebank_classification.py +1 -2
- mteb/tasks/classification/eng/frenk_en_classification.py +1 -2
- mteb/tasks/classification/eng/gtsrb_classification.py +1 -1
- mteb/tasks/classification/eng/imdb_classification.py +1 -2
- mteb/tasks/classification/eng/legal_bench_classification.py +15 -121
- mteb/tasks/classification/eng/news_classification.py +1 -2
- mteb/tasks/classification/eng/patch_camelyon_classification.py +1 -1
- mteb/tasks/classification/eng/patent_classification.py +1 -2
- mteb/tasks/classification/eng/poem_sentiment_classification.py +1 -2
- mteb/tasks/classification/eng/sds_eye_protection_classification.py +1 -2
- mteb/tasks/classification/eng/sds_gloves_classification.py +1 -2
- mteb/tasks/classification/eng/toxic_chat_classification.py +2 -19
- mteb/tasks/classification/eng/toxic_conversations_classification.py +1 -2
- mteb/tasks/classification/eng/tweet_sentiment_extraction_classification.py +1 -2
- mteb/tasks/classification/eng/tweet_topic_single_classification.py +2 -13
- mteb/tasks/classification/eng/ucf101_classification.py +1 -5
- mteb/tasks/classification/eng/wikipedia_bio_met_chem_classification.py +1 -2
- mteb/tasks/classification/eng/wikipedia_chem_fields_classification.py +1 -2
- mteb/tasks/classification/eng/wikipedia_comp_chem_spectroscopy_classification.py +1 -2
- mteb/tasks/classification/eng/wikipedia_crystallography_analytical_classification.py +1 -2
- mteb/tasks/classification/eng/wikipedia_theoretical_applied_classification.py +1 -2
- mteb/tasks/classification/eng/yahoo_answers_topics_classification.py +1 -2
- mteb/tasks/classification/eng/yelp_review_full_classification.py +1 -2
- mteb/tasks/classification/est/estonian_valence.py +1 -2
- mteb/tasks/classification/fas/fa_mteb_classification.py +7 -14
- mteb/tasks/classification/fil/filipino_hate_speech_classification.py +1 -2
- mteb/tasks/classification/fin/fin_toxicity_classification.py +2 -11
- mteb/tasks/classification/fra/french_book_reviews.py +1 -2
- mteb/tasks/classification/fra/movie_review_sentiment_classification.py +1 -2
- mteb/tasks/classification/guj/gujarati_news_classification.py +1 -2
- mteb/tasks/classification/heb/hebrew_sentiment_analysis.py +1 -2
- mteb/tasks/classification/hin/hindi_discourse_classification.py +1 -2
- mteb/tasks/classification/hin/sentiment_analysis_hindi.py +1 -2
- mteb/tasks/classification/hrv/frenk_hr_classification.py +1 -2
- mteb/tasks/classification/ind/indonesian_id_clickbait_classification.py +1 -2
- mteb/tasks/classification/ind/indonesian_mongabay_conservation_classification.py +1 -2
- mteb/tasks/classification/ita/italian_linguist_acceptability_classification.py +1 -2
- mteb/tasks/classification/jav/javanese_imdb_classification.py +1 -2
- mteb/tasks/classification/jpn/wrime_classification.py +1 -2
- mteb/tasks/classification/kan/kannada_news_classification.py +1 -2
- mteb/tasks/classification/kor/klue_tc.py +1 -2
- mteb/tasks/classification/kor/kor_hate_classification.py +2 -17
- mteb/tasks/classification/kor/kor_sarcasm_classification.py +2 -19
- mteb/tasks/classification/kur/kurdish_sentiment_classification.py +1 -2
- mteb/tasks/classification/mal/malayalam_news_classification.py +1 -2
- mteb/tasks/classification/mar/marathi_news_classification.py +1 -2
- mteb/tasks/classification/mkd/macedonian_tweet_sentiment_classification.py +1 -2
- mteb/tasks/classification/multilingual/catalonia_tweet_classification.py +1 -6
- mteb/tasks/classification/multilingual/multi_hate_classification.py +1 -4
- mteb/tasks/classification/multilingual/ru_sci_bench_classification.py +4 -23
- mteb/tasks/classification/multilingual/scala_classification.py +1 -2
- mteb/tasks/classification/multilingual/sib200_classification.py +1 -6
- mteb/tasks/classification/mya/myanmar_news.py +2 -3
- mteb/tasks/classification/nep/nepali_news_classification.py +1 -2
- mteb/tasks/classification/nld/__init__.py +16 -0
- mteb/tasks/classification/nld/dutch_book_review_sentiment_classification.py +4 -2
- mteb/tasks/classification/nld/dutch_cola_classification.py +41 -0
- mteb/tasks/classification/nld/dutch_government_bias_classification.py +40 -0
- mteb/tasks/classification/nld/dutch_news_articles_classification.py +33 -0
- mteb/tasks/classification/nld/dutch_sarcastic_headlines_classification.py +39 -0
- mteb/tasks/classification/nld/iconclass_classification.py +44 -0
- mteb/tasks/classification/nld/open_tender_classification.py +41 -0
- mteb/tasks/classification/nld/vaccin_chat_nl_classification.py +49 -0
- mteb/tasks/classification/nob/no_rec_classification.py +1 -2
- mteb/tasks/classification/nob/norwegian_parliament_classification.py +1 -2
- mteb/tasks/classification/ory/odia_news_classification.py +1 -2
- mteb/tasks/classification/pol/polish_classification.py +3 -6
- mteb/tasks/classification/ron/moroco.py +1 -2
- mteb/tasks/classification/ron/romanian_reviews_sentiment.py +1 -2
- mteb/tasks/classification/ron/romanian_sentiment_classification.py +1 -2
- mteb/tasks/classification/rus/georeview_classification.py +1 -2
- mteb/tasks/classification/rus/headline_classification.py +1 -2
- mteb/tasks/classification/rus/inappropriateness_classification.py +1 -2
- mteb/tasks/classification/rus/ru_reviews_classification.py +1 -2
- mteb/tasks/classification/rus/ru_toixic_classification_okmlcup.py +1 -2
- mteb/tasks/classification/rus/senti_ru_eval.py +1 -2
- mteb/tasks/classification/sin/sinhala_news_classification.py +1 -2
- mteb/tasks/classification/sin/sinhala_news_source_classification.py +1 -2
- mteb/tasks/classification/slk/csfdsk_movie_review_sentiment_classification.py +1 -2
- mteb/tasks/classification/slk/slovak_hate_speech_classification.py +1 -2
- mteb/tasks/classification/slk/slovak_movie_review_sentiment_classification.py +1 -2
- mteb/tasks/classification/slv/frenk_sl_classification.py +1 -2
- mteb/tasks/classification/spa/spanish_news_classification.py +1 -2
- mteb/tasks/classification/spa/spanish_sentiment_classification.py +1 -2
- mteb/tasks/classification/ssw/siswati_news_classification.py +1 -2
- mteb/tasks/classification/swa/swahili_news_classification.py +1 -2
- mteb/tasks/classification/swe/dalaj_classification.py +1 -2
- mteb/tasks/classification/swe/swe_rec_classification.py +1 -2
- mteb/tasks/classification/swe/swedish_sentiment_classification.py +1 -2
- mteb/tasks/classification/tam/tamil_news_classification.py +1 -2
- mteb/tasks/classification/tel/telugu_andhra_jyoti_news_classification.py +1 -2
- mteb/tasks/classification/tha/wisesight_sentiment_classification.py +1 -2
- mteb/tasks/classification/tha/wongnai_reviews_classification.py +1 -1
- mteb/tasks/classification/tsn/tswana_news_classification.py +1 -2
- mteb/tasks/classification/tur/turkish_movie_sentiment_classification.py +1 -2
- mteb/tasks/classification/tur/turkish_product_sentiment_classification.py +1 -2
- mteb/tasks/classification/ukr/ukr_formality_classification.py +2 -15
- mteb/tasks/classification/urd/urdu_roman_sentiment_classification.py +1 -2
- mteb/tasks/classification/vie/amazon_counterfactual_vn_classification.py +1 -6
- mteb/tasks/classification/vie/amazon_polarity_vn_classification.py +1 -6
- mteb/tasks/classification/vie/amazon_reviews_vn_classification.py +1 -5
- mteb/tasks/classification/vie/banking77_vn_classification.py +1 -5
- mteb/tasks/classification/vie/emotion_vn_classification.py +1 -5
- mteb/tasks/classification/vie/imdb_vn_classification.py +1 -5
- mteb/tasks/classification/vie/massive_intent_vn_classification.py +1 -5
- mteb/tasks/classification/vie/massive_scenario_vn_classification.py +1 -5
- mteb/tasks/classification/vie/mtop_domain_vn_classification.py +1 -5
- mteb/tasks/classification/vie/mtop_intent_vn_classification.py +1 -5
- mteb/tasks/classification/vie/toxic_conversations_vn_classification.py +1 -5
- mteb/tasks/classification/vie/tweet_sentiment_extraction_vn_classification.py +1 -5
- mteb/tasks/classification/vie/vie_student_feedback_classification.py +1 -2
- mteb/tasks/classification/zho/cmteb_classification.py +5 -10
- mteb/tasks/classification/zho/yue_openrice_review_classification.py +1 -2
- mteb/tasks/classification/zul/isi_zulu_news_classification.py +1 -2
- mteb/tasks/clustering/__init__.py +1 -0
- mteb/tasks/clustering/jpn/mews_c16_ja_clustering.py +1 -3
- mteb/tasks/clustering/multilingual/sib200_clustering_s2s.py +1 -6
- mteb/tasks/clustering/nld/__init__.py +17 -0
- mteb/tasks/clustering/nld/dutch_news_articles_clustering_p2p.py +40 -0
- mteb/tasks/clustering/nld/dutch_news_articles_clustering_s2s.py +40 -0
- mteb/tasks/clustering/nld/iconclass_clustering_s2s.py +50 -0
- mteb/tasks/clustering/nld/open_tender_clustering_p2p.py +54 -0
- mteb/tasks/clustering/nld/open_tender_clustering_s2s.py +44 -0
- mteb/tasks/clustering/nld/vabb_clustering_p2p.py +54 -0
- mteb/tasks/clustering/nld/vabb_clustering_s2s.py +54 -0
- mteb/tasks/clustering/vie/reddit_clustering_p2p_vn.py +1 -5
- mteb/tasks/clustering/vie/reddit_clustering_vn.py +1 -5
- mteb/tasks/clustering/vie/stack_exchange_clustering_p2p_vn.py +1 -5
- mteb/tasks/clustering/vie/stack_exchange_clustering_vn.py +1 -5
- mteb/tasks/clustering/vie/twenty_newsgroups_clustering_vn.py +1 -5
- mteb/tasks/multilabel_classification/__init__.py +1 -0
- mteb/tasks/multilabel_classification/ita/emit_classification.py +1 -5
- mteb/tasks/multilabel_classification/kor/kor_hate_speech_ml_classification.py +1 -9
- mteb/tasks/multilabel_classification/mlt/maltese_news_classification.py +1 -6
- mteb/tasks/multilabel_classification/nld/__init__.py +9 -0
- mteb/tasks/multilabel_classification/nld/covid_disinformation_nl_multi_label_classification.py +91 -0
- mteb/tasks/multilabel_classification/nld/vabb_multi_label_classification.py +47 -0
- mteb/tasks/multilabel_classification/por/brazilian_toxic_tweets_classification.py +1 -6
- mteb/tasks/multilabel_classification/swe/swedish_patent_cpc_group_classification.py +1 -1
- mteb/tasks/multilabel_classification/swe/swedish_patent_cpc_subclass_classification.py +1 -2
- mteb/tasks/pair_classification/__init__.py +1 -0
- mteb/tasks/pair_classification/dan/talemaader_pc.py +1 -6
- mteb/tasks/pair_classification/eng/legal_bench_pc.py +1 -9
- mteb/tasks/pair_classification/multilingual/indic_xnli_pair_classification.py +9 -8
- mteb/tasks/pair_classification/nld/__init__.py +7 -0
- mteb/tasks/pair_classification/nld/sick_nl_pair_classification.py +39 -0
- mteb/tasks/pair_classification/nld/xlwic_nl_pair_classification.py +44 -0
- mteb/tasks/pair_classification/vie/sprint_duplicate_questions_pcvn.py +1 -5
- mteb/tasks/pair_classification/vie/twitter_sem_eval2015_pcvn.py +1 -5
- mteb/tasks/pair_classification/vie/twitter_url_corpus_pcvn.py +1 -5
- mteb/tasks/regression/multilingual/ru_sci_bench_regression.py +2 -6
- mteb/tasks/reranking/multilingual/x_glue_wpr_reranking.py +1 -2
- mteb/tasks/reranking/vie/ask_ubuntu_dup_questions_vn.py +1 -5
- mteb/tasks/reranking/vie/sci_docs_reranking_vn.py +1 -5
- mteb/tasks/reranking/vie/stack_overflow_dup_questions_vn.py +1 -5
- mteb/tasks/retrieval/code/code_rag.py +8 -8
- mteb/tasks/retrieval/dan/dan_fever_retrieval.py +1 -1
- mteb/tasks/retrieval/dan/tv2_nordretrieval.py +2 -2
- mteb/tasks/retrieval/dan/twitter_hjerne_retrieval.py +2 -2
- mteb/tasks/retrieval/eng/__init__.py +18 -4
- mteb/tasks/retrieval/eng/climate_fever_retrieval.py +68 -77
- mteb/tasks/retrieval/eng/dbpedia_retrieval.py +55 -50
- mteb/tasks/retrieval/eng/fever_retrieval.py +62 -67
- mteb/tasks/retrieval/eng/hateful_memes_i2t_retrieval.py +0 -4
- mteb/tasks/retrieval/eng/hateful_memes_t2i_retrieval.py +0 -4
- mteb/tasks/retrieval/eng/hotpot_qa_retrieval.py +57 -67
- mteb/tasks/retrieval/eng/legal_summarization_retrieval.py +1 -1
- mteb/tasks/retrieval/eng/lit_search_retrieval.py +1 -8
- mteb/tasks/retrieval/eng/memotion_i2t_retrieval.py +0 -3
- mteb/tasks/retrieval/eng/memotion_t2i_retrieval.py +0 -2
- mteb/tasks/retrieval/eng/oven_it2t_retrieval.py +1 -1
- mteb/tasks/retrieval/eng/quora_retrieval.py +51 -46
- mteb/tasks/retrieval/eng/sci_mmir_i2t_retrieval.py +0 -4
- mteb/tasks/retrieval/eng/sci_mmir_t2i_retrieval.py +0 -4
- mteb/tasks/retrieval/eng/vidore_bench_retrieval.py +0 -2
- mteb/tasks/retrieval/eng/wino_grande_retrieval.py +1 -1
- mteb/tasks/retrieval/jpn/ja_cwir_retrieval.py +1 -4
- mteb/tasks/retrieval/jpn/ja_gov_faqs_retrieval.py +1 -1
- mteb/tasks/retrieval/kat/georgian_faq_retrieval.py +11 -4
- mteb/tasks/retrieval/multilingual/__init__.py +22 -0
- mteb/tasks/retrieval/multilingual/belebele_retrieval.py +6 -5
- mteb/tasks/retrieval/multilingual/jina_vdr_bench_retrieval.py +0 -2
- mteb/tasks/retrieval/multilingual/miracl_retrieval.py +1 -1
- mteb/tasks/retrieval/multilingual/miracl_vision_retrieval.py +2 -9
- mteb/tasks/retrieval/multilingual/mkqa_retrieval.py +1 -2
- mteb/tasks/retrieval/multilingual/mlqa_retrieval.py +1 -4
- mteb/tasks/retrieval/multilingual/multi_long_doc_retrieval.py +1 -2
- mteb/tasks/retrieval/multilingual/public_health_qa_retrieval.py +9 -4
- mteb/tasks/retrieval/multilingual/ru_sci_bench_retrieval.py +2 -12
- mteb/tasks/retrieval/multilingual/vidore2_bench_retrieval.py +0 -2
- mteb/tasks/retrieval/multilingual/vidore3_bench_retrieval.py +399 -0
- mteb/tasks/retrieval/multilingual/wit_t2i_retrieval.py +0 -2
- mteb/tasks/retrieval/multilingual/x_flickr30k_co_t2i_retrieval.py +6 -5
- mteb/tasks/retrieval/multilingual/xm3600_t2i_retrieval.py +3 -4
- mteb/tasks/retrieval/nld/__init__.py +18 -4
- mteb/tasks/retrieval/nld/argu_ana_nl_retrieval.py +46 -27
- mteb/tasks/retrieval/nld/bbsard_nl_retrieval.py +44 -0
- mteb/tasks/retrieval/nld/dutch_news_articles_retrieval.py +33 -0
- mteb/tasks/retrieval/nld/legal_qa_nl_retrieval.py +42 -0
- mteb/tasks/retrieval/nld/nf_corpus_nl_retrieval.py +42 -25
- mteb/tasks/retrieval/nld/open_tender_retrieval.py +41 -0
- mteb/tasks/retrieval/nld/sci_fact_nl_retrieval.py +42 -24
- mteb/tasks/retrieval/nld/scidocsnl_retrieval.py +44 -27
- mteb/tasks/retrieval/nld/vabb_retrieval.py +44 -0
- mteb/tasks/retrieval/nob/norquad.py +2 -2
- mteb/tasks/retrieval/nob/snl_retrieval.py +2 -2
- mteb/tasks/retrieval/rus/__init__.py +11 -2
- mteb/tasks/retrieval/rus/ria_news_retrieval.py +48 -44
- mteb/tasks/retrieval/slk/slovak_sum_retrieval.py +1 -7
- mteb/tasks/retrieval/tur/tur_hist_quad.py +2 -2
- mteb/tasks/retrieval/vie/argu_ana_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/climate_fevervn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/cqa_dupstack_android_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/cqa_dupstack_gis_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/cqa_dupstack_mathematica_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/cqa_dupstack_physics_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/cqa_dupstack_programmers_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/cqa_dupstack_stats_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/cqa_dupstack_tex_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/cqa_dupstack_unix_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/cqa_dupstack_webmasters_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/cqa_dupstack_wordpress_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/db_pedia_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/fevervn_retrieval.py +1 -7
- mteb/tasks/retrieval/vie/fi_qa2018_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/green_node_table_markdown_retrieval.py +16 -1
- mteb/tasks/retrieval/vie/hotpot_qavn_retrieval.py +1 -6
- mteb/tasks/retrieval/vie/msmarcovn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/nf_corpus_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/nqvn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/quora_vn_retrieval.py +1 -6
- mteb/tasks/retrieval/vie/sci_fact_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/scidocsvn_retrieval.py +1 -6
- mteb/tasks/retrieval/vie/touche2020_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/treccovidvn_retrieval.py +1 -5
- mteb/tasks/sts/__init__.py +1 -0
- mteb/tasks/sts/nld/__init__.py +5 -0
- mteb/tasks/sts/nld/sick_nl_sts.py +42 -0
- mteb/tasks/sts/vie/biosses_stsvn.py +1 -5
- mteb/tasks/sts/vie/sickr_stsvn.py +1 -5
- mteb/tasks/sts/vie/sts_benchmark_stsvn.py +1 -5
- mteb/tasks/zeroshot_classification/eng/gtsrb.py +1 -1
- mteb/tasks/zeroshot_classification/eng/patch_camelyon.py +1 -1
- mteb/tasks/zeroshot_classification/eng/ucf101.py +1 -5
- mteb-2.1.19.dist-info/METADATA +253 -0
- {mteb-2.0.5.dist-info → mteb-2.1.19.dist-info}/RECORD +398 -330
- mteb/descriptive_stats/Classification/PersianTextTone.json +0 -56
- mteb/descriptive_stats/Image/Any2TextMutipleChoice/CVBenchCount.json +0 -37
- mteb/descriptive_stats/Image/Any2TextMutipleChoice/CVBenchDepth.json +0 -25
- mteb/descriptive_stats/Image/Any2TextMutipleChoice/CVBenchDistance.json +0 -25
- mteb/descriptive_stats/Image/Any2TextMutipleChoice/CVBenchRelation.json +0 -25
- mteb/descriptive_stats/Image/VisualSTS/STS12VisualSTS.json +0 -20
- mteb/descriptive_stats/Image/VisualSTS/STS13VisualSTS.json +0 -20
- mteb/descriptive_stats/Image/VisualSTS/STS14VisualSTS.json +0 -20
- mteb/descriptive_stats/Image/VisualSTS/STS15VisualSTS.json +0 -20
- mteb/descriptive_stats/Image/VisualSTS/STS16VisualSTS.json +0 -20
- mteb/descriptive_stats/Image/VisualSTS/STS17MultilingualVisualSTS.json +0 -220
- mteb/descriptive_stats/Image/VisualSTS/STSBenchmarkMultilingualVisualSTS.json +0 -402
- mteb/descriptive_stats/Reranking/InstructIR.json +0 -31
- mteb-2.0.5.dist-info/METADATA +0 -455
- {mteb-2.0.5.dist-info → mteb-2.1.19.dist-info}/WHEEL +0 -0
- {mteb-2.0.5.dist-info → mteb-2.1.19.dist-info}/entry_points.txt +0 -0
- {mteb-2.0.5.dist-info → mteb-2.1.19.dist-info}/licenses/LICENSE +0 -0
- {mteb-2.0.5.dist-info → mteb-2.1.19.dist-info}/top_level.txt +0 -0
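The headline additions in 2.1.19 are a suite of Dutch (nld) tasks spanning classification, clustering, multilabel and pair classification, retrieval, and STS, the Vidore3 document-understanding retrieval family, and `.v2` variants of several hard-negative retrieval tasks. As a quick orientation, here is a minimal sketch of looking the new tasks up through mteb's public API (task names are taken from the file list above; `get_tasks` and the `metadata` attribute are assumed from the mteb 2.x interface):

```python
import mteb

# Task names come from the new files listed above; get_tasks is mteb's
# public lookup helper (assumed per the mteb 2.x API).
tasks = mteb.get_tasks(tasks=["DutchColaClassification", "DBPediaHardNegatives.v2"])
for task in tasks:
    print(task.metadata.name, task.metadata.type, task.metadata.main_score)
```

The largest per-file source diffs are reproduced below.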
mteb/tasks/retrieval/eng/dbpedia_retrieval.py (+55 -50):

```diff
@@ -1,30 +1,21 @@
 from mteb.abstasks.retrieval import AbsTaskRetrieval
 from mteb.abstasks.task_metadata import TaskMetadata
 
-
-class DBPedia(AbsTaskRetrieval):
-    metadata = TaskMetadata(
-        name="DBPedia",
-        description="DBpedia-Entity is a standard test collection for entity search over the DBpedia knowledge base",
-        reference="https://github.com/iai-group/DBpedia-Entity/",
-        dataset={
-            "path": "mteb/dbpedia",
-            "revision": "c0f706b76e590d620bd6618b3ca8efdd34e2d659",
-        },
-        type="Retrieval",
-        category="t2t",
-        modalities=["text"],
-        eval_splits=["test"],
-        eval_langs=["eng-Latn"],
-        main_score="ndcg_at_10",
-        date=("2017-01-01", "2017-01-01"),  # best guess: based on publication date
-        domains=["Written", "Encyclopaedic"],
-        task_subtypes=[],
-        license="mit",
-        annotations_creators="derived",
-        dialect=[],
-        sample_creation="found",
-        bibtex_citation=r"""
+_dbpedia_metadata = dict(
+    type="Retrieval",
+    category="t2t",
+    modalities=["text"],
+    eval_splits=["test"],
+    eval_langs=["eng-Latn"],
+    main_score="ndcg_at_10",
+    date=("2017-01-01", "2017-01-01"),  # best guess: based on publication date
+    domains=["Written", "Encyclopaedic"],
+    task_subtypes=[],
+    license="mit",
+    annotations_creators="derived",
+    dialect=[],
+    sample_creation="found",
+    bibtex_citation=r"""
 @inproceedings{Hasibi:2017:DVT,
   author = {Hasibi, Faegheh and Nikolaev, Fedor and Xiong, Chenyan and Balog, Krisztian and Bratsberg, Svein Erik and Kotov, Alexander and Callan, Jamie},
   booktitle = {Proceedings of the 40th International ACM SIGIR Conference on Research and Development in Information Retrieval},
@@ -36,45 +27,59 @@ class DBPedia(AbsTaskRetrieval):
   year = {2017},
 }
 """,
+)
+
+
+class DBPedia(AbsTaskRetrieval):
+    metadata = TaskMetadata(
+        name="DBPedia",
+        description="DBpedia-Entity is a standard test collection for entity search over the DBpedia knowledge base",
+        reference="https://github.com/iai-group/DBpedia-Entity/",
+        dataset={
+            "path": "mteb/dbpedia",
+            "revision": "c0f706b76e590d620bd6618b3ca8efdd34e2d659",
+        },
         prompt={
             "query": "Given a query, retrieve relevant entity descriptions from DBPedia"
         },
+        **_dbpedia_metadata,
     )
 
 
 class DBPediaHardNegatives(AbsTaskRetrieval):
     metadata = TaskMetadata(
         name="DBPediaHardNegatives",
-        description="DBpedia-Entity is a standard test collection for entity search over the DBpedia knowledge base. The hard negative version has been created by pooling the 250 top documents per query from BM25, e5-multilingual-large and e5-mistral-instruct.",
+        description=(
+            "DBpedia-Entity is a standard test collection for entity search over the DBpedia knowledge base. "
+            "The hard negative version has been created by pooling the 250 top documents per query from BM25, e5-multilingual-large and e5-mistral-instruct."
+        ),
+        reference="https://github.com/iai-group/DBpedia-Entity/",
+        dataset={
+            "path": "mteb/DBPedia_test_top_250_only_w_correct-v2",
+            "revision": "943ec7fdfef3728b2ad1966c5b6479ff9ffd26c9",
+        },
+        superseded_by="DBPediaHardNegatives.v2",
+        adapted_from=["DBPedia"],
+        **_dbpedia_metadata,
+    )
+
+
+class DBPediaHardNegativesV2(AbsTaskRetrieval):
+    metadata = TaskMetadata(
+        name="DBPediaHardNegatives.v2",
+        description=(
+            "DBpedia-Entity is a standard test collection for entity search over the DBpedia knowledge base. "
+            "The hard negative version has been created by pooling the 250 top documents per query from BM25, e5-multilingual-large and e5-mistral-instruct. "
+            "V2 uses a more appropriate prompt rather than the default prompt for retrieval. You can get more information on the effect of different prompt in the [PR](https://github.com/embeddings-benchmark/mteb/pull/3469#issuecomment-3436467106)"
+        ),
         reference="https://github.com/iai-group/DBpedia-Entity/",
         dataset={
             "path": "mteb/DBPedia_test_top_250_only_w_correct-v2",
             "revision": "943ec7fdfef3728b2ad1966c5b6479ff9ffd26c9",
         },
-        type="Retrieval",
-        category="t2t",
-        modalities=["text"],
-        eval_splits=["test"],
-        eval_langs=["eng-Latn"],
-        main_score="ndcg_at_10",
-        date=("2017-01-01", "2017-01-01"),  # best guess: based on publication date
-        domains=["Written", "Encyclopaedic"],
-        task_subtypes=[],
-        license="mit",
-        annotations_creators="derived",
-        dialect=[],
-        sample_creation="found",
-        bibtex_citation=r"""
-@inproceedings{Hasibi:2017:DVT,
-  author = {Hasibi, Faegheh and Nikolaev, Fedor and Xiong, Chenyan and Balog, Krisztian and Bratsberg, Svein Erik and Kotov, Alexander and Callan, Jamie},
-  booktitle = {Proceedings of the 40th International ACM SIGIR Conference on Research and Development in Information Retrieval},
-  doi = {10.1145/3077136.3080751},
-  pages = {1265--1268},
-  publisher = {ACM},
-  series = {SIGIR '17},
-  title = {DBpedia-Entity V2: A Test Collection for Entity Search},
-  year = {2017},
-}
-""",
         adapted_from=["DBPedia"],
+        prompt={
+            "query": "Given a query, retrieve relevant entity descriptions from DBPedia"
+        },
+        **_dbpedia_metadata,
     )
```
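The same refactor repeats across the retrieval modules in this release: metadata fields shared by a task and its hard-negative variants are hoisted into a module-level dict and unpacked into each `TaskMetadata(...)` call, so fields like the license or the BibTeX citation are defined once instead of three times. A self-contained sketch of the pattern (a plain function stands in for `TaskMetadata`):

```python
# Plain-dict stand-in for TaskMetadata, isolating the **-unpacking pattern.
def task_metadata(**fields) -> dict:
    return fields

_shared_metadata = dict(
    type="Retrieval",
    main_score="ndcg_at_10",
    license="mit",
)

dbpedia = task_metadata(name="DBPedia", **_shared_metadata)
hard_negatives_v2 = task_metadata(name="DBPediaHardNegatives.v2", **_shared_metadata)
assert dbpedia["license"] == hard_negatives_v2["license"] == "mit"
```

A keyword passed explicitly must not also appear in the unpacked dict (Python raises a `TypeError` on duplicates), which is why the per-task fields such as `name`, `description`, `dataset`, and `prompt` stay inline.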
mteb/tasks/retrieval/eng/fever_retrieval.py (+62 -67):

```diff
@@ -1,36 +1,22 @@
 from mteb.abstasks.retrieval import AbsTaskRetrieval
 from mteb.abstasks.task_metadata import TaskMetadata
 
-
-class FEVER(AbsTaskRetrieval):
-    ignore_identical_ids = True
-
-    metadata = TaskMetadata(
-        name="FEVER",
-        dataset={
-            "path": "mteb/fever",
-            "revision": "bea83ef9e8fb933d90a2f1d5515737465d613e12",
-        },
-        description=(
-            "FEVER (Fact Extraction and VERification) consists of 185,445 claims generated by altering sentences"
-            " extracted from Wikipedia and subsequently verified without knowledge of the sentence they were"
-            " derived from."
-        ),
-        reference="https://fever.ai/",
-        type="Retrieval",
-        category="t2t",
-        modalities=["text"],
-        eval_splits=["test"],
-        eval_langs=["eng-Latn"],
-        main_score="ndcg_at_10",
-        date=None,
-        domains=["Encyclopaedic", "Written"],
-        task_subtypes=["Claim verification"],
-        license="cc-by-nc-sa-3.0",
-        annotations_creators="human-annotated",
-        dialect=[],
-        sample_creation="found",
-        bibtex_citation=r"""
+_fever_metadata = dict(
+    reference="https://fever.ai/",
+    type="Retrieval",
+    category="t2t",
+    modalities=["text"],
+    eval_splits=["test"],
+    eval_langs=["eng-Latn"],
+    main_score="ndcg_at_10",
+    date=None,
+    domains=["Encyclopaedic", "Written"],
+    task_subtypes=["Claim verification"],
+    license="cc-by-nc-sa-3.0",
+    annotations_creators="human-annotated",
+    dialect=[],
+    sample_creation="found",
+    bibtex_citation=r"""
 @inproceedings{thorne-etal-2018-fever,
   address = {New Orleans, Louisiana},
   author = {Thorne, James and
@@ -50,9 +36,27 @@ Stent, Amanda},
   year = {2018},
 }
 """,
+)
+
+
+class FEVER(AbsTaskRetrieval):
+    ignore_identical_ids = True
+
+    metadata = TaskMetadata(
+        name="FEVER",
+        dataset={
+            "path": "mteb/fever",
+            "revision": "bea83ef9e8fb933d90a2f1d5515737465d613e12",
+        },
+        description=(
+            "FEVER (Fact Extraction and VERification) consists of 185,445 claims generated by altering sentences "
+            "extracted from Wikipedia and subsequently verified without knowledge of the sentence they were "
+            "derived from."
+        ),
         prompt={
             "query": "Given a claim, retrieve documents that support or refute the claim"
         },
+        **_fever_metadata,
     )
 
 
@@ -66,43 +70,34 @@ class FEVERHardNegatives(AbsTaskRetrieval):
             "revision": "080c9ed6267b65029207906e815d44a9240bafca",
         },
         description=(
-            "FEVER (Fact Extraction and VERification) consists of 185,445 claims generated by altering sentences"
-            " extracted from Wikipedia and subsequently verified without knowledge of the sentence they were"
-            " derived from. The hard negative version has been created by pooling the 250 top documents per query from BM25, e5-multilingual-large and e5-mistral-instruct."
+            "FEVER (Fact Extraction and VERification) consists of 185,445 claims generated by altering sentences "
+            "extracted from Wikipedia and subsequently verified without knowledge of the sentence they were "
+            "derived from. The hard negative version has been created by pooling the 250 top documents per query from BM25, e5-multilingual-large and e5-mistral-instruct."
+        ),
+        adapted_from=["FEVER"],
+        superseded_by="FEVERHardNegatives.v2",
+        **_fever_metadata,
+    )
+
+
+class FEVERHardNegativesV2(AbsTaskRetrieval):
+    ignore_identical_ids = True
+
+    metadata = TaskMetadata(
+        name="FEVERHardNegatives.v2",
+        dataset={
+            "path": "mteb/FEVER_test_top_250_only_w_correct-v2",
+            "revision": "080c9ed6267b65029207906e815d44a9240bafca",
+        },
+        description=(
+            "FEVER (Fact Extraction and VERification) consists of 185,445 claims generated by altering sentences "
+            "extracted from Wikipedia and subsequently verified without knowledge of the sentence they were "
+            "derived from. The hard negative version has been created by pooling the 250 top documents per query from BM25, e5-multilingual-large and e5-mistral-instruct. "
+            "V2 uses a more appropriate prompt rather than the default prompt for retrieval. You can get more information on the effect of different prompt in the [PR](https://github.com/embeddings-benchmark/mteb/pull/3469#issuecomment-3436467106)"
         ),
-        reference="https://fever.ai/",
-        type="Retrieval",
-        category="t2t",
-        modalities=["text"],
-        eval_splits=["test"],
-        eval_langs=["eng-Latn"],
-        main_score="ndcg_at_10",
-        date=None,
-        domains=["Encyclopaedic", "Written"],
-        task_subtypes=["Claim verification"],
-        license="cc-by-nc-sa-3.0",
-        annotations_creators="human-annotated",
-        dialect=None,
-        sample_creation=None,
-        bibtex_citation=r"""
-@inproceedings{thorne-etal-2018-fever,
-  address = {New Orleans, Louisiana},
-  author = {Thorne, James and
-Vlachos, Andreas and
-Christodoulopoulos, Christos and
-Mittal, Arpit},
-  booktitle = {Proceedings of the 2018 Conference of the North {A}merican Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long Papers)},
-  doi = {10.18653/v1/N18-1074},
-  editor = {Walker, Marilyn and
-Ji, Heng and
-Stent, Amanda},
-  month = jun,
-  pages = {809--819},
-  publisher = {Association for Computational Linguistics},
-  title = {{FEVER}: a Large-scale Dataset for Fact Extraction and {VER}ification},
-  url = {https://aclanthology.org/N18-1074},
-  year = {2018},
-}
-""",
         adapted_from=["FEVER"],
+        prompt={
+            "query": "Given a claim, retrieve documents that support or refute the claim"
+        },
+        **_fever_metadata,
     )
```
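The hard-negative descriptions in this file and its siblings all point at the same construction: for each query, the top 250 documents from BM25, e5-multilingual-large, and e5-mistral-instruct are pooled into a reduced corpus that still contains the correct documents. A sketch of that pooling step for a single query (toy inputs; this is not the actual dataset-building script):

```python
def pool_top_k(rankings_per_retriever: dict[str, list[str]], k: int = 250) -> set[str]:
    """Union of each retriever's top-k ranked document ids for one query."""
    pooled: set[str] = set()
    for ranked_doc_ids in rankings_per_retriever.values():
        pooled.update(ranked_doc_ids[:k])
    return pooled

# Toy rankings from the three systems named in the task descriptions.
pooled = pool_top_k(
    {
        "bm25": ["d1", "d2", "d3"],
        "e5-multilingual-large": ["d2", "d4"],
        "e5-mistral-instruct": ["d1", "d5"],
    },
    k=2,
)
assert pooled == {"d1", "d2", "d4", "d5"}
```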
mteb/tasks/retrieval/eng/hateful_memes_i2t_retrieval.py (+0 -4):

```diff
@@ -24,9 +24,7 @@ def _load_data(path: str, splits: str, revision: str | None = None):
     shared_corpus = shared_corpus.map(
         lambda x: {
             "id": "corpus-" + str(x["id"]),
-            # "text": x["text"],
             "modality": "text",
-            "image": None,
         },
         remove_columns=[
             "split",
@@ -40,9 +38,7 @@ def _load_data(path: str, splits: str, revision: str | None = None):
         queries[split] = split_dataset.map(
             lambda x: {
                 "id": "query-" + str(x["id"]),
-                "text": None,
                 "modality": "image",
-                # "image": x["image"],
             },
             remove_columns=[
                 "split",
```
mteb/tasks/retrieval/eng/hateful_memes_t2i_retrieval.py (+0 -4):

```diff
@@ -24,9 +24,7 @@ def _load_data(path: str, splits: str, revision: str | None = None):
     shared_corpus = shared_corpus.map(
         lambda x: {
             "id": "corpus-" + str(x["id"]),
-            "text": None,
             "modality": "image",
-            # "image": None,
         },
         remove_columns=[
             "split",
@@ -40,9 +38,7 @@ def _load_data(path: str, splits: str, revision: str | None = None):
         queries[split] = split_dataset.map(
             lambda x: {
                 "id": "query-" + str(x["id"]),
-                # "text": None,
                 "modality": "text",
-                "image": None,
             },
             remove_columns=[
                 "split",
```
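Both HatefulMemes loaders (and the memotion loaders further down) drop the `"text": None` / `"image": None` placeholder columns and keep only the field each side actually carries, leaving `datasets.Dataset.map` to add the derived columns and `remove_columns` to discard unused ones. A toy reproduction of the call shape (hypothetical columns, not the HatefulMemes schema):

```python
from datasets import Dataset

ds = Dataset.from_dict({"id": [0, 1], "split": ["test", "test"], "caption": ["a", "b"]})
corpus = ds.map(
    lambda x: {
        "id": "corpus-" + str(x["id"]),  # prefix ids so corpus and query ids cannot collide
        "modality": "text",
    },
    remove_columns=["split"],
)
print(corpus.column_names)  # ['id', 'caption', 'modality']
```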
mteb/tasks/retrieval/eng/hotpot_qa_retrieval.py (+57 -67):

```diff
@@ -1,33 +1,22 @@
 from mteb.abstasks.retrieval import AbsTaskRetrieval
 from mteb.abstasks.task_metadata import TaskMetadata
 
-
-class HotpotQA(AbsTaskRetrieval):
-    metadata = TaskMetadata(
-        name="HotpotQA",
-        dataset={
-            "path": "mteb/hotpotqa",
-            "revision": "ab518f4d6fcca38d87c25209f94beba119d02014",
-        },
-        description=(
-            "HotpotQA is a question answering dataset featuring natural, multi-hop questions, with strong"
-            " supervision for supporting facts to enable more explainable question answering systems."
-        ),
-        reference="https://hotpotqa.github.io/",
-        type="Retrieval",
-        category="t2t",
-        modalities=["text"],
-        eval_splits=["test"],
-        eval_langs=["eng-Latn"],
-        main_score="ndcg_at_10",
-        date=("2018-01-01", "2018-12-31"),  # best guess: based on publication date
-        domains=["Web", "Written"],
-        task_subtypes=["Question answering"],
-        license="cc-by-sa-4.0",
-        annotations_creators="human-annotated",
-        dialect=[],
-        sample_creation="found",
-        bibtex_citation=r"""
+_hotpot_qa_metadata = dict(
+    reference="https://hotpotqa.github.io/",
+    type="Retrieval",
+    category="t2t",
+    modalities=["text"],
+    eval_splits=["test"],
+    eval_langs=["eng-Latn"],
+    main_score="ndcg_at_10",
+    date=("2018-01-01", "2018-12-31"),  # best guess: based on publication date
+    domains=["Web", "Written"],
+    task_subtypes=["Question answering"],
+    license="cc-by-sa-4.0",
+    annotations_creators="human-annotated",
+    dialect=[],
+    sample_creation="found",
+    bibtex_citation=r"""
 @inproceedings{yang-etal-2018-hotpotqa,
   address = {Brussels, Belgium},
   author = {Yang, Zhilin and
@@ -51,9 +40,24 @@ Tsujii, Jun{'}ichi},
   year = {2018},
 }
 """,
+)
+
+
+class HotpotQA(AbsTaskRetrieval):
+    metadata = TaskMetadata(
+        name="HotpotQA",
+        dataset={
+            "path": "mteb/hotpotqa",
+            "revision": "ab518f4d6fcca38d87c25209f94beba119d02014",
+        },
+        description=(
+            "HotpotQA is a question answering dataset featuring natural, multi-hop questions, with strong "
+            "supervision for supporting facts to enable more explainable question answering systems."
+        ),
         prompt={
             "query": "Given a multi-hop question, retrieve documents that can help answer the question"
         },
+        **_hotpot_qa_metadata,
     )
 
 
@@ -65,46 +69,32 @@ class HotpotQAHardNegatives(AbsTaskRetrieval):
             "revision": "617612fa63afcb60e3b134bed8b7216a99707c37",
         },
         description=(
-            "HotpotQA is a question answering dataset featuring natural, multi-hop questions, with strong"
-            " supervision for supporting facts to enable more explainable question answering systems. The hard negative version has been created by pooling the 250 top documents per query from BM25, e5-multilingual-large and e5-mistral-instruct."
+            "HotpotQA is a question answering dataset featuring natural, multi-hop questions, with strong "
+            "supervision for supporting facts to enable more explainable question answering systems. "
+            "The hard negative version has been created by pooling the 250 top documents per query from BM25, e5-multilingual-large and e5-mistral-instruct."
         ),
-        reference="https://hotpotqa.github.io/",
-        type="Retrieval",
-        category="t2t",
-        modalities=["text"],
-        eval_splits=["test"],
-        eval_langs=["eng-Latn"],
-        main_score="ndcg_at_10",
-        date=("2018-01-01", "2018-12-31"),  # best guess: based on publication date
-        domains=["Web", "Written"],
-        task_subtypes=["Question answering"],
-        license="cc-by-sa-4.0",
-        annotations_creators="human-annotated",
-        dialect=[],
-        sample_creation="found",
-        bibtex_citation=r"""
-@inproceedings{yang-etal-2018-hotpotqa,
-  address = {Brussels, Belgium},
-  author = {Yang, Zhilin and
-Qi, Peng and
-Zhang, Saizheng and
-Bengio, Yoshua and
-Cohen, William and
-Salakhutdinov, Ruslan and
-Manning, Christopher D.},
-  booktitle = {Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing},
-  doi = {10.18653/v1/D18-1259},
-  editor = {Riloff, Ellen and
-Chiang, David and
-Hockenmaier, Julia and
-Tsujii, Jun{'}ichi},
-  month = oct # {-} # nov,
-  pages = {2369--2380},
-  publisher = {Association for Computational Linguistics},
-  title = {{H}otpot{QA}: A Dataset for Diverse, Explainable Multi-hop Question Answering},
-  url = {https://aclanthology.org/D18-1259},
-  year = {2018},
-}
-""",
         adapted_from=["HotpotQA"],
+        superseded_by="HotpotQAHardNegatives.v2",
+        **_hotpot_qa_metadata,
+    )
+
+
+class HotpotQAHardNegativesV2(AbsTaskRetrieval):
+    metadata = TaskMetadata(
+        name="HotpotQAHardNegatives.v2",
+        dataset={
+            "path": "mteb/HotpotQA_test_top_250_only_w_correct-v2",
+            "revision": "617612fa63afcb60e3b134bed8b7216a99707c37",
+        },
+        description=(
+            "HotpotQA is a question answering dataset featuring natural, multi-hop questions, with strong "
+            "supervision for supporting facts to enable more explainable question answering systems. "
+            "The hard negative version has been created by pooling the 250 top documents per query from BM25, e5-multilingual-large and e5-mistral-instruct."
+            "V2 uses a more appropriate prompt rather than the default prompt for retrieval. You can get more information on the effect of different prompt in the [PR](https://github.com/embeddings-benchmark/mteb/pull/3469#issuecomment-3436467106)"
+        ),
+        adapted_from=["HotpotQA"],
+        prompt={
+            "query": "Given a multi-hop question, retrieve documents that can help answer the question"
+        },
+        **_hotpot_qa_metadata,
     )
```
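As with DBPedia and FEVER, the deprecated hard-negative task stays importable but now carries a machine-readable pointer to its replacement. A minimal sketch of following that pointer (assuming mteb's public `get_task` helper):

```python
import mteb

task = mteb.get_task("HotpotQAHardNegatives")
if task.metadata.superseded_by:  # "HotpotQAHardNegatives.v2", per the metadata above
    task = mteb.get_task(task.metadata.superseded_by)
print(task.metadata.name)  # HotpotQAHardNegatives.v2
```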
mteb/tasks/retrieval/eng/legal_summarization_retrieval.py (+1 -1):

```diff
@@ -5,7 +5,7 @@ from mteb.abstasks.task_metadata import TaskMetadata
 class LegalSummarization(AbsTaskRetrieval):
     metadata = TaskMetadata(
         name="LegalSummarization",
-        description="The dataset
+        description="The dataset consists of 439 pairs of contracts and their summarizations from https://tldrlegal.com and https://tosdr.org/.",
         reference="https://github.com/lauramanor/legal_summarization",
         dataset={
             "path": "mteb/legal_summarization",
```
mteb/tasks/retrieval/eng/lit_search_retrieval.py (+1 -8):

```diff
@@ -7,14 +7,7 @@ from mteb.abstasks.task_metadata import TaskMetadata
 class LitSearchRetrieval(AbsTaskRetrieval):
     metadata = TaskMetadata(
         name="LitSearchRetrieval",
-        description="""
-        The dataset contains the query set and retrieval corpus for the paper LitSearch: A Retrieval Benchmark for
-        Scientific Literature Search. It introduces LitSearch, a retrieval benchmark comprising 597 realistic literature
-        search queries about recent ML and NLP papers. LitSearch is constructed using a combination of (1) questions
-        generated by GPT-4 based on paragraphs containing inline citations from research papers and (2) questions about
-        recently published papers, manually written by their authors. All LitSearch questions were manually examined or
-        edited by experts to ensure high quality.
-        """,
+        description="The dataset contains the query set and retrieval corpus for the paper LitSearch: A Retrieval Benchmark for Scientific Literature Search. It introduces LitSearch, a retrieval benchmark comprising 597 realistic literature search queries about recent ML and NLP papers. LitSearch is constructed using a combination of (1) questions generated by GPT-4 based on paragraphs containing inline citations from research papers and (2) questions about recently published papers, manually written by their authors. All LitSearch questions were manually examined or edited by experts to ensure high quality.",
         reference="https://github.com/princeton-nlp/LitSearch",
         dataset={
             "path": "princeton-nlp/LitSearch",
```
mteb/tasks/retrieval/eng/memotion_i2t_retrieval.py (+0 -3):

```diff
@@ -20,7 +20,6 @@ def _load_data(path: str, splits: str, revision: str | None = None):
             "id": f"corpus-{split_name}-{idx}",
             "text": x["text_corrected"],
             "modality": "text",
-            "image": None,
         }
 
     split_datasets = {}
@@ -56,9 +55,7 @@ def _load_data(path: str, splits: str, revision: str | None = None):
         queries[split] = split_dataset.map(
             lambda x, idx: {
                 "id": f"query-{split}-{idx}",
-                "text": None,
                 "modality": "image",
-                # "image": None,
             },
             with_indices=True,
             remove_columns=[
```
mteb/tasks/retrieval/eng/memotion_t2i_retrieval.py (+0 -2):

```diff
@@ -18,7 +18,6 @@ def _load_data(path: str, splits: str, revision: str | None = None):
     def map_function(split_name):
         return lambda x, idx: {
             "id": f"corpus-{split_name}-{idx}",
-            "text": None,
             "modality": "image",
         }
 
@@ -56,7 +55,6 @@ def _load_data(path: str, splits: str, revision: str | None = None):
                 "id": f"query-{split}-{idx}",
                 "text": x["text_corrected"],
                 "modality": "text",
-                "image": None,
             },
             with_indices=True,
             remove_columns=[
```
mteb/tasks/retrieval/eng/quora_retrieval.py (+51 -46):

```diff
@@ -1,6 +1,32 @@
 from mteb.abstasks.retrieval import AbsTaskRetrieval
 from mteb.abstasks.task_metadata import TaskMetadata
 
+_quora_metadata = dict(
+    reference="https://quoradata.quora.com/First-Quora-Dataset-Release-Question-Pairs",
+    type="Retrieval",
+    category="t2t",
+    modalities=["text"],
+    eval_splits=["test"],
+    eval_langs=["eng-Latn"],
+    main_score="ndcg_at_10",
+    date=None,
+    domains=["Written", "Web", "Blog"],
+    task_subtypes=["Question answering"],
+    license="not specified",
+    annotations_creators="human-annotated",
+    dialect=[],
+    sample_creation="found",
+    bibtex_citation=r"""
+@misc{quora-question-pairs,
+  author = {DataCanary, hilfialkaff, Lili Jiang, Meg Risdal, Nikhil Dandekar, tomtung},
+  publisher = {Kaggle},
+  title = {Quora Question Pairs},
+  url = {https://kaggle.com/competitions/quora-question-pairs},
+  year = {2017},
+}
+""",
+)
+
 
 class QuoraRetrieval(AbsTaskRetrieval):
     ignore_identical_ids = True
@@ -15,32 +41,10 @@ class QuoraRetrieval(AbsTaskRetrieval):
             "QuoraRetrieval is based on questions that are marked as duplicates on the Quora platform. Given a"
             + " question, find other (duplicate) questions."
         ),
-        reference="https://quoradata.quora.com/First-Quora-Dataset-Release-Question-Pairs",
-        type="Retrieval",
-        category="t2t",
-        modalities=["text"],
-        eval_splits=["test"],
-        eval_langs=["eng-Latn"],
-        main_score="ndcg_at_10",
-        date=None,
-        domains=["Written", "Web", "Blog"],
-        task_subtypes=["Question answering"],
-        license="not specified",
-        annotations_creators="human-annotated",
-        dialect=[],
-        sample_creation="found",
-        bibtex_citation=r"""
-@misc{quora-question-pairs,
-  author = {DataCanary, hilfialkaff, Lili Jiang, Meg Risdal, Nikhil Dandekar, tomtung},
-  publisher = {Kaggle},
-  title = {Quora Question Pairs},
-  url = {https://kaggle.com/competitions/quora-question-pairs},
-  year = {2017},
-}
-""",
         prompt={
             "query": "Given a question, retrieve questions that are semantically equivalent to the given question"
         },
+        **_quora_metadata,
     )
 
 
@@ -57,28 +61,29 @@ class QuoraRetrievalHardNegatives(AbsTaskRetrieval):
             "QuoraRetrieval is based on questions that are marked as duplicates on the Quora platform. Given a"
             + " question, find other (duplicate) questions. The hard negative version has been created by pooling the 250 top documents per query from BM25, e5-multilingual-large and e5-mistral-instruct."
         ),
-        reference="https://quoradata.quora.com/First-Quora-Dataset-Release-Question-Pairs",
-        type="Retrieval",
-        category="t2t",
-        modalities=["text"],
-        eval_splits=["test"],
-        eval_langs=["eng-Latn"],
-        main_score="ndcg_at_10",
-        date=None,
-        domains=None,
-        task_subtypes=None,
-        license=None,
-        annotations_creators=None,
-        dialect=None,
-        sample_creation=None,
-        bibtex_citation=r"""
-@misc{quora-question-pairs,
-  author = {DataCanary, hilfialkaff, Lili Jiang, Meg Risdal, Nikhil Dandekar, tomtung},
-  publisher = {Kaggle},
-  title = {Quora Question Pairs},
-  url = {https://kaggle.com/competitions/quora-question-pairs},
-  year = {2017},
-}
-""",
         adapted_from=["QuoraRetrieval"],
+        superseded_by="QuoraRetrievalHardNegatives.v2",
+        **_quora_metadata,
+    )
+
+
+class QuoraRetrievalHardNegativesV2(AbsTaskRetrieval):
+    ignore_identical_ids = True
+
+    metadata = TaskMetadata(
+        name="QuoraRetrievalHardNegatives.v2",
+        dataset={
+            "path": "mteb/QuoraRetrieval_test_top_250_only_w_correct-v2",
+            "revision": "907a33577e9506221d3ba20f5a851b7c3f8dc6d3",
+        },
+        description=(
+            "QuoraRetrieval is based on questions that are marked as duplicates on the Quora platform. Given a "
+            "question, find other (duplicate) questions. The hard negative version has been created by pooling the 250 top documents per query from BM25, e5-multilingual-large and e5-mistral-instruct."
+            "V2 uses a more appropriate prompt rather than the default prompt for retrieval. You can get more information on the effect of different prompt in the [PR](https://github.com/embeddings-benchmark/mteb/pull/3469#issuecomment-3436467106)"
+        ),
+        adapted_from=["QuoraRetrieval"],
+        prompt={
+            "query": "Given a question, retrieve questions that are semantically equivalent to the given question"
+        },
+        **_quora_metadata,
     )
```
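Across all four files the `.v2` tasks reuse the exact dataset path and revision of their predecessors; what changes is the metadata: a task-specific `prompt`, an `adapted_from` lineage, and the `superseded_by` marker on the old task. A sketch of evaluating a model on one of the new tasks (assuming mteb 2.x's `get_model`, `get_tasks`, and `evaluate` entry points; the checkpoint name is just an example):

```python
import mteb

model = mteb.get_model("sentence-transformers/all-MiniLM-L6-v2")
tasks = mteb.get_tasks(tasks=["QuoraRetrievalHardNegatives.v2"])
# Prompt-aware models pick up the task's query prompt from its metadata.
results = mteb.evaluate(model, tasks=tasks)
```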