mteb 2.0.4__py3-none-any.whl → 2.0.5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (59) hide show
  1. mteb/descriptive_stats/BitextMining/BUCC.json +70 -40
  2. mteb/descriptive_stats/Classification/DKHateClassification.json +40 -24
  3. mteb/descriptive_stats/Classification/FinancialPhrasebankClassification.json +23 -15
  4. mteb/descriptive_stats/Classification/ImdbClassification.json +40 -24
  5. mteb/descriptive_stats/Classification/KorHateClassification.json +23 -15
  6. mteb/descriptive_stats/Clustering/ArxivClusteringP2P.json +555 -550
  7. mteb/descriptive_stats/Clustering/ArxivClusteringP2P.v2.json +546 -541
  8. mteb/descriptive_stats/Clustering/ArxivClusteringS2S.json +555 -550
  9. mteb/descriptive_stats/Clustering/MLSUMClusteringP2P.json +2466 -2416
  10. mteb/descriptive_stats/Clustering/RedditClusteringP2P.json +1365 -1360
  11. mteb/descriptive_stats/Clustering/SNLClustering.json +378 -373
  12. mteb/descriptive_stats/Clustering/SwednClustering.json +28 -23
  13. mteb/descriptive_stats/Clustering/VGClustering.json +54 -49
  14. mteb/descriptive_stats/Image/Any2AnyMultilingualRetrieval/WITT2IRetrieval.json +324 -204
  15. mteb/descriptive_stats/Image/Any2AnyRetrieval/MemotionI2TRetrieval.json +28 -18
  16. mteb/descriptive_stats/Image/DocumentUnderstanding/JinaVDRAirbnbSyntheticRetrieval.json +334 -0
  17. mteb/descriptive_stats/Image/DocumentUnderstanding/JinaVDRGitHubReadmeRetrieval.json +544 -0
  18. mteb/descriptive_stats/Image/DocumentUnderstanding/JinaVDRTweetStockSyntheticsRetrieval.json +334 -0
  19. mteb/descriptive_stats/Image/DocumentUnderstanding/JinaVDRWikimediaCommonsDocumentsRetrieval.json +634 -0
  20. mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore2ESGReportsRetrieval.json +154 -0
  21. mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore2EconomicsReportsRetrieval.json +154 -0
  22. mteb/descriptive_stats/Image/ImageClassification/Imagenet1k.json +6039 -3007
  23. mteb/descriptive_stats/Image/ZeroShotClassification/Imagenet1kZeroShot.json +3024 -3010
  24. mteb/descriptive_stats/Image/ZeroShotClassification/PatchCamelyonZeroShot.json +30 -16
  25. mteb/descriptive_stats/Reranking/MIRACLReranking.json +555 -479
  26. mteb/descriptive_stats/Reranking/MindSmallReranking.json +29 -25
  27. mteb/descriptive_stats/Retrieval/AlloprofRetrieval.json +25 -26
  28. mteb/descriptive_stats/Retrieval/Code1Retrieval.json +30 -0
  29. mteb/descriptive_stats/Retrieval/DanFEVER.json +25 -26
  30. mteb/descriptive_stats/Retrieval/EnglishFinance1Retrieval.json +30 -0
  31. mteb/descriptive_stats/Retrieval/EnglishFinance2Retrieval.json +30 -0
  32. mteb/descriptive_stats/Retrieval/EnglishFinance3Retrieval.json +30 -0
  33. mteb/descriptive_stats/Retrieval/EnglishFinance4Retrieval.json +30 -0
  34. mteb/descriptive_stats/Retrieval/EnglishHealthcare1Retrieval.json +30 -0
  35. mteb/descriptive_stats/Retrieval/French1Retrieval.json +30 -0
  36. mteb/descriptive_stats/Retrieval/FrenchLegal1Retrieval.json +30 -0
  37. mteb/descriptive_stats/Retrieval/German1Retrieval.json +30 -0
  38. mteb/descriptive_stats/Retrieval/GermanHealthcare1Retrieval.json +30 -0
  39. mteb/descriptive_stats/Retrieval/GermanLegal1Retrieval.json +30 -0
  40. mteb/descriptive_stats/Retrieval/JapaneseCode1Retrieval.json +30 -0
  41. mteb/descriptive_stats/Retrieval/JapaneseLegal1Retrieval.json +30 -0
  42. mteb/descriptive_stats/Retrieval/MIRACLRetrieval.json +475 -494
  43. mteb/descriptive_stats/Retrieval/MSMARCO-Fa.json +25 -26
  44. mteb/descriptive_stats/Retrieval/MSMARCO.json +25 -84
  45. mteb/descriptive_stats/Retrieval/Touche2020.json +25 -26
  46. mteb/descriptive_stats/Summarization/SummEval.json +27 -50
  47. mteb/descriptive_stats/Summarization/SummEvalFr.json +27 -50
  48. mteb/models/model_implementations/kalm_models.py +29 -0
  49. mteb/tasks/bitext_mining/multilingual/bucc_bitext_mining.py +1 -1
  50. mteb/tasks/classification/eng/financial_phrasebank_classification.py +0 -3
  51. mteb/tasks/classification/kor/kor_hate_classification.py +0 -12
  52. mteb/tasks/clustering/swe/swedn_clustering.py +2 -2
  53. mteb/tasks/retrieval/multilingual/vdr_multilingual_retrieval.py +1 -1
  54. {mteb-2.0.4.dist-info → mteb-2.0.5.dist-info}/METADATA +1 -1
  55. {mteb-2.0.4.dist-info → mteb-2.0.5.dist-info}/RECORD +59 -40
  56. {mteb-2.0.4.dist-info → mteb-2.0.5.dist-info}/WHEEL +0 -0
  57. {mteb-2.0.4.dist-info → mteb-2.0.5.dist-info}/entry_points.txt +0 -0
  58. {mteb-2.0.4.dist-info → mteb-2.0.5.dist-info}/licenses/LICENSE +0 -0
  59. {mteb-2.0.4.dist-info → mteb-2.0.5.dist-info}/top_level.txt +0 -0
@@ -1,27 +1,32 @@
1
1
  {
2
- "all": {
3
- "num_samples": 4,
4
- "number_of_characters": 2048,
5
- "min_text_length": 512,
6
- "average_text_length": 512.0,
7
- "max_text_length": 512,
8
- "unique_texts": 2047,
9
- "min_labels_per_text": 234,
10
- "average_labels_per_text": 512.0,
11
- "max_labels_per_text": 1164,
12
- "unique_labels": 4,
13
- "labels": {
14
- "culture": {
15
- "count": 294
16
- },
17
- "domestic news": {
18
- "count": 1164
19
- },
20
- "economy": {
21
- "count": 234
22
- },
23
- "sports": {
24
- "count": 356
2
+ "test": {
3
+ "num_samples": 2048,
4
+ "text_statistics": {
5
+ "total_text_length": 3317163,
6
+ "min_text_length": 64,
7
+ "average_text_length": 1619.70849609375,
8
+ "max_text_length": 28913,
9
+ "unique_texts": 2047
10
+ },
11
+ "image_statistics": null,
12
+ "label_statistics": {
13
+ "min_labels_per_text": 1,
14
+ "average_label_per_text": 1.0,
15
+ "max_labels_per_text": 1,
16
+ "unique_labels": 4,
17
+ "labels": {
18
+ "culture": {
19
+ "count": 294
20
+ },
21
+ "domestic news": {
22
+ "count": 1164
23
+ },
24
+ "economy": {
25
+ "count": 234
26
+ },
27
+ "sports": {
28
+ "count": 356
29
+ }
25
30
  }
26
31
  }
27
32
  }
@@ -1,54 +1,59 @@
1
1
  {
2
2
  "test": {
3
- "num_samples": 4,
4
- "number_of_characters": 2048,
5
- "min_text_length": 512,
6
- "average_text_length": 512.0,
7
- "max_text_length": 512,
8
- "unique_texts": 2048,
9
- "min_labels_per_text": 2,
10
- "average_labels_per_text": 512.0,
11
- "max_labels_per_text": 1070,
12
- "unique_labels": 13,
13
- "labels": {
14
- "nyheter": {
15
- "count": 1070
16
- },
17
- "rampelys": {
18
- "count": 242
19
- },
20
- "musikk": {
21
- "count": 32
22
- },
23
- "sport": {
24
- "count": 596
25
- },
26
- "reise": {
27
- "count": 19
28
- },
29
- "forbruker": {
30
- "count": 47
31
- },
32
- "mat-og-drikke": {
33
- "count": 4
34
- },
35
- "helse": {
36
- "count": 9
37
- },
38
- "bil-og-motor": {
39
- "count": 9
40
- },
41
- "film": {
42
- "count": 9
43
- },
44
- "teknologi": {
45
- "count": 6
46
- },
47
- "dinepenger": {
48
- "count": 2
49
- },
50
- "spill": {
51
- "count": 3
3
+ "num_samples": 2048,
4
+ "text_statistics": {
5
+ "total_text_length": 2067767,
6
+ "min_text_length": 10,
7
+ "average_text_length": 1009.65185546875,
8
+ "max_text_length": 13082,
9
+ "unique_texts": 2048
10
+ },
11
+ "image_statistics": null,
12
+ "label_statistics": {
13
+ "min_labels_per_text": 1,
14
+ "average_label_per_text": 1.0,
15
+ "max_labels_per_text": 1,
16
+ "unique_labels": 13,
17
+ "labels": {
18
+ "nyheter": {
19
+ "count": 1070
20
+ },
21
+ "rampelys": {
22
+ "count": 242
23
+ },
24
+ "musikk": {
25
+ "count": 32
26
+ },
27
+ "sport": {
28
+ "count": 596
29
+ },
30
+ "reise": {
31
+ "count": 19
32
+ },
33
+ "forbruker": {
34
+ "count": 47
35
+ },
36
+ "mat-og-drikke": {
37
+ "count": 4
38
+ },
39
+ "helse": {
40
+ "count": 9
41
+ },
42
+ "bil-og-motor": {
43
+ "count": 9
44
+ },
45
+ "film": {
46
+ "count": 9
47
+ },
48
+ "teknologi": {
49
+ "count": 6
50
+ },
51
+ "dinepenger": {
52
+ "count": 2
53
+ },
54
+ "spill": {
55
+ "count": 3
56
+ }
52
57
  }
53
58
  }
54
59
  }