mteb 2.1.4__py3-none-any.whl → 2.7.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (527) hide show
  1. mteb/__init__.py +6 -0
  2. mteb/_create_dataloaders.py +22 -20
  3. mteb/_evaluators/any_sts_evaluator.py +23 -14
  4. mteb/_evaluators/classification_metrics.py +54 -0
  5. mteb/_evaluators/clustering_evaluator.py +3 -3
  6. mteb/_evaluators/evaluator.py +4 -2
  7. mteb/_evaluators/image/imagetext_pairclassification_evaluator.py +18 -11
  8. mteb/_evaluators/pair_classification_evaluator.py +34 -40
  9. mteb/_evaluators/retrieval_evaluator.py +2 -2
  10. mteb/_evaluators/retrieval_metrics.py +18 -17
  11. mteb/_evaluators/sklearn_evaluator.py +25 -37
  12. mteb/_evaluators/text/bitext_mining_evaluator.py +31 -19
  13. mteb/_evaluators/text/summarization_evaluator.py +27 -20
  14. mteb/_evaluators/zeroshot_classification_evaluator.py +7 -5
  15. mteb/abstasks/_data_filter/__init__.py +0 -0
  16. mteb/abstasks/_data_filter/filters.py +125 -0
  17. mteb/abstasks/_data_filter/task_pipelines.py +105 -0
  18. mteb/abstasks/_statistics_calculation.py +23 -11
  19. mteb/abstasks/_stratification.py +18 -18
  20. mteb/abstasks/abstask.py +35 -28
  21. mteb/abstasks/aggregate_task_metadata.py +1 -9
  22. mteb/abstasks/aggregated_task.py +10 -29
  23. mteb/abstasks/classification.py +15 -12
  24. mteb/abstasks/clustering.py +20 -16
  25. mteb/abstasks/clustering_legacy.py +13 -10
  26. mteb/abstasks/image/image_text_pair_classification.py +7 -4
  27. mteb/abstasks/multilabel_classification.py +33 -22
  28. mteb/abstasks/pair_classification.py +27 -11
  29. mteb/abstasks/regression.py +4 -4
  30. mteb/abstasks/retrieval.py +28 -24
  31. mteb/abstasks/retrieval_dataset_loaders.py +2 -2
  32. mteb/abstasks/sts.py +14 -4
  33. mteb/abstasks/task_metadata.py +32 -33
  34. mteb/abstasks/text/bitext_mining.py +39 -28
  35. mteb/abstasks/text/reranking.py +8 -6
  36. mteb/abstasks/text/summarization.py +10 -5
  37. mteb/abstasks/zeroshot_classification.py +8 -4
  38. mteb/benchmarks/_create_table.py +84 -37
  39. mteb/benchmarks/benchmark.py +77 -16
  40. mteb/benchmarks/benchmarks/__init__.py +12 -0
  41. mteb/benchmarks/benchmarks/benchmarks.py +361 -16
  42. mteb/benchmarks/get_benchmark.py +14 -53
  43. mteb/cache.py +227 -37
  44. mteb/cli/_display_tasks.py +2 -2
  45. mteb/cli/build_cli.py +110 -14
  46. mteb/cli/generate_model_card.py +43 -23
  47. mteb/deprecated_evaluator.py +71 -62
  48. mteb/descriptive_stats/BitextMining/RuSciBenchBitextMining.v2.json +61 -0
  49. mteb/descriptive_stats/Classification/HebrewSentimentAnalysis.v3.json +60 -0
  50. mteb/descriptive_stats/Classification/TurkishConstitutionalCourtViolation.json +54 -0
  51. mteb/descriptive_stats/Image/DocumentUnderstanding/KoVidore2CybersecurityRetrieval.json +32 -0
  52. mteb/descriptive_stats/Image/DocumentUnderstanding/KoVidore2EconomicRetrieval.json +32 -0
  53. mteb/descriptive_stats/Image/DocumentUnderstanding/KoVidore2EnergyRetrieval.json +32 -0
  54. mteb/descriptive_stats/Image/DocumentUnderstanding/KoVidore2HrRetrieval.json +32 -0
  55. mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3ComputerScienceRetrieval.json +214 -0
  56. mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3EnergyRetrieval.json +214 -0
  57. mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3FinanceEnRetrieval.json +214 -0
  58. mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3FinanceFrRetrieval.json +214 -0
  59. mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3HrRetrieval.json +214 -0
  60. mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3IndustrialRetrieval.json +214 -0
  61. mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3NuclearRetrieval.json +214 -0
  62. mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3PharmaceuticalsRetrieval.json +214 -0
  63. mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3PhysicsRetrieval.json +214 -0
  64. mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3TelecomRetrieval.json +214 -0
  65. mteb/descriptive_stats/PairClassification/TERRa.V2.json +35 -0
  66. mteb/descriptive_stats/Reranking/JQaRARerankingLite.json +35 -0
  67. mteb/descriptive_stats/Reranking/JaCWIRRerankingLite.json +35 -0
  68. mteb/descriptive_stats/Reranking/MultiLongDocReranking.json +466 -0
  69. mteb/descriptive_stats/Retrieval/ArguAna-NL.v2.json +30 -0
  70. mteb/descriptive_stats/Retrieval/ChemRxivRetrieval.json +30 -0
  71. mteb/descriptive_stats/Retrieval/EuroPIRQRetrieval.json +116 -0
  72. mteb/descriptive_stats/Retrieval/JaCWIRRetrievalLite.json +30 -0
  73. mteb/descriptive_stats/Retrieval/JaqketRetrievalLite.json +30 -0
  74. mteb/descriptive_stats/Retrieval/MIRACLJaRetrievalLite.json +30 -0
  75. mteb/descriptive_stats/Retrieval/MrTyDiJaRetrievalLite.json +30 -0
  76. mteb/descriptive_stats/Retrieval/NFCorpus-NL.v2.json +30 -0
  77. mteb/descriptive_stats/Retrieval/NanoClimateFEVER-VN.json +30 -0
  78. mteb/descriptive_stats/Retrieval/NanoDBPedia-VN.json +30 -0
  79. mteb/descriptive_stats/Retrieval/NanoFEVER-VN.json +30 -0
  80. mteb/descriptive_stats/Retrieval/NanoHotpotQA-VN.json +30 -0
  81. mteb/descriptive_stats/Retrieval/NanoMSMARCO-VN.json +30 -0
  82. mteb/descriptive_stats/Retrieval/NanoNQ-VN.json +30 -0
  83. mteb/descriptive_stats/Retrieval/SCIDOCS-NL.v2.json +30 -0
  84. mteb/descriptive_stats/Retrieval/SQuADKorV1Retrieval.json +30 -0
  85. mteb/descriptive_stats/Retrieval/SciFact-NL.v2.json +30 -0
  86. mteb/descriptive_stats/Retrieval/TVPLRetrieval.json +30 -0
  87. mteb/evaluate.py +106 -75
  88. mteb/filter_tasks.py +25 -26
  89. mteb/get_tasks.py +29 -30
  90. mteb/languages/language_scripts.py +5 -3
  91. mteb/leaderboard/app.py +414 -151
  92. mteb/leaderboard/benchmark_selector.py +14 -5
  93. mteb/leaderboard/figures.py +13 -15
  94. mteb/leaderboard/table.py +82 -17
  95. mteb/load_results.py +12 -12
  96. mteb/models/__init__.py +4 -1
  97. mteb/models/abs_encoder.py +31 -23
  98. mteb/models/cache_wrappers/__init__.py +2 -1
  99. mteb/models/cache_wrappers/cache_backend_protocol.py +3 -5
  100. mteb/models/cache_wrappers/cache_backends/_hash_utils.py +7 -6
  101. mteb/models/cache_wrappers/cache_backends/faiss_cache.py +6 -2
  102. mteb/models/cache_wrappers/cache_backends/numpy_cache.py +43 -25
  103. mteb/models/cache_wrappers/cache_wrapper.py +3 -3
  104. mteb/models/get_model_meta.py +25 -118
  105. mteb/models/instruct_wrapper.py +33 -9
  106. mteb/models/model_implementations/align_models.py +8 -1
  107. mteb/models/model_implementations/amazon_models.py +1 -0
  108. mteb/models/model_implementations/andersborges.py +65 -0
  109. mteb/models/model_implementations/ara_models.py +9 -1
  110. mteb/models/model_implementations/arctic_models.py +16 -8
  111. mteb/models/model_implementations/b1ade_models.py +2 -1
  112. mteb/models/model_implementations/bedrock_models.py +4 -0
  113. mteb/models/model_implementations/bge_models.py +101 -17
  114. mteb/models/model_implementations/bica_model.py +35 -0
  115. mteb/models/model_implementations/blip2_models.py +13 -2
  116. mteb/models/model_implementations/blip_models.py +43 -16
  117. mteb/models/model_implementations/bm25.py +5 -4
  118. mteb/models/model_implementations/bmretriever_models.py +10 -4
  119. mteb/models/model_implementations/cadet_models.py +10 -1
  120. mteb/models/model_implementations/cde_models.py +25 -4
  121. mteb/models/model_implementations/clip_models.py +9 -6
  122. mteb/models/model_implementations/clips_models.py +100 -0
  123. mteb/models/model_implementations/codefuse_models.py +165 -3
  124. mteb/models/model_implementations/codesage_models.py +18 -3
  125. mteb/models/model_implementations/cohere_models.py +13 -6
  126. mteb/models/model_implementations/cohere_v.py +7 -2
  127. mteb/models/model_implementations/colpali_models.py +17 -9
  128. mteb/models/model_implementations/colqwen_models.py +275 -5
  129. mteb/models/model_implementations/colsmol_models.py +4 -2
  130. mteb/models/model_implementations/conan_models.py +2 -1
  131. mteb/models/model_implementations/dino_models.py +194 -23
  132. mteb/models/model_implementations/e5_instruct.py +27 -4
  133. mteb/models/model_implementations/e5_models.py +21 -110
  134. mteb/models/model_implementations/e5_v.py +7 -6
  135. mteb/models/model_implementations/eagerworks_models.py +164 -0
  136. mteb/models/model_implementations/emillykkejensen_models.py +91 -0
  137. mteb/models/model_implementations/en_code_retriever.py +2 -1
  138. mteb/models/model_implementations/euler_models.py +32 -0
  139. mteb/models/model_implementations/evaclip_models.py +4 -0
  140. mteb/models/model_implementations/fa_models.py +67 -9
  141. mteb/models/model_implementations/facebookai.py +205 -0
  142. mteb/models/model_implementations/geogpt_models.py +2 -1
  143. mteb/models/model_implementations/gme_v_models.py +17 -10
  144. mteb/models/model_implementations/google_models.py +17 -6
  145. mteb/models/model_implementations/granite_vision_embedding_models.py +8 -3
  146. mteb/models/model_implementations/gritlm_models.py +4 -2
  147. mteb/models/model_implementations/gte_models.py +99 -9
  148. mteb/models/model_implementations/hinvec_models.py +2 -1
  149. mteb/models/model_implementations/human.py +1 -0
  150. mteb/models/model_implementations/ibm_granite_models.py +36 -6
  151. mteb/models/model_implementations/inf_models.py +4 -2
  152. mteb/models/model_implementations/jasper_models.py +256 -3
  153. mteb/models/model_implementations/jina_clip.py +49 -10
  154. mteb/models/model_implementations/jina_models.py +222 -11
  155. mteb/models/model_implementations/kalm_models.py +203 -25
  156. mteb/models/model_implementations/kblab.py +37 -0
  157. mteb/models/model_implementations/kennethenevoldsen_models.py +74 -0
  158. mteb/models/model_implementations/kfst.py +25 -0
  159. mteb/models/model_implementations/kowshik24_models.py +32 -0
  160. mteb/models/model_implementations/lens_models.py +2 -0
  161. mteb/models/model_implementations/lgai_embedding_models.py +2 -1
  162. mteb/models/model_implementations/linq_models.py +4 -3
  163. mteb/models/model_implementations/listconranker.py +2 -2
  164. mteb/models/model_implementations/llm2clip_models.py +9 -6
  165. mteb/models/model_implementations/llm2vec_models.py +16 -8
  166. mteb/models/model_implementations/mcinext_models.py +7 -1
  167. mteb/models/model_implementations/mdbr_models.py +19 -3
  168. mteb/models/model_implementations/misc_models.py +422 -60
  169. mteb/models/model_implementations/mixedbread_ai_models.py +332 -0
  170. mteb/models/model_implementations/mme5_models.py +2 -1
  171. mteb/models/model_implementations/moco_models.py +15 -4
  172. mteb/models/model_implementations/mod_models.py +191 -0
  173. mteb/models/model_implementations/model2vec_models.py +27 -14
  174. mteb/models/model_implementations/moka_models.py +4 -1
  175. mteb/models/model_implementations/nbailab.py +70 -0
  176. mteb/models/model_implementations/no_instruct_sentence_models.py +3 -2
  177. mteb/models/model_implementations/nomic_models.py +173 -6
  178. mteb/models/model_implementations/nomic_models_vision.py +8 -3
  179. mteb/models/model_implementations/nvidia_llama_nemoretriever_colemb.py +32 -19
  180. mteb/models/model_implementations/nvidia_models.py +155 -20
  181. mteb/models/model_implementations/octen_models.py +254 -0
  182. mteb/models/model_implementations/openai_models.py +20 -16
  183. mteb/models/model_implementations/openclip_models.py +37 -13
  184. mteb/models/model_implementations/opensearch_neural_sparse_models.py +10 -5
  185. mteb/models/model_implementations/ops_moa_models.py +5 -3
  186. mteb/models/model_implementations/ordalietech_solon_embeddings_mini_beta_1_1.py +1 -1
  187. mteb/models/model_implementations/pawan_models.py +39 -0
  188. mteb/models/model_implementations/piccolo_models.py +9 -1
  189. mteb/models/model_implementations/pixie_models.py +56 -0
  190. mteb/models/model_implementations/promptriever_models.py +12 -8
  191. mteb/models/model_implementations/pylate_models.py +46 -12
  192. mteb/models/model_implementations/qodo_models.py +4 -2
  193. mteb/models/model_implementations/qtack_models.py +2 -1
  194. mteb/models/model_implementations/qwen3_models.py +9 -6
  195. mteb/models/model_implementations/qzhou_models.py +5 -3
  196. mteb/models/model_implementations/random_baseline.py +19 -24
  197. mteb/models/model_implementations/rasgaard_models.py +34 -0
  198. mteb/models/model_implementations/reasonir_model.py +2 -1
  199. mteb/models/model_implementations/repllama_models.py +5 -3
  200. mteb/models/model_implementations/rerankers_custom.py +15 -9
  201. mteb/models/model_implementations/rerankers_monot5_based.py +31 -31
  202. mteb/models/model_implementations/richinfoai_models.py +2 -1
  203. mteb/models/model_implementations/ru_sentence_models.py +71 -20
  204. mteb/models/model_implementations/ruri_models.py +322 -0
  205. mteb/models/model_implementations/salesforce_models.py +6 -3
  206. mteb/models/model_implementations/samilpwc_models.py +2 -1
  207. mteb/models/model_implementations/sarashina_embedding_models.py +168 -0
  208. mteb/models/model_implementations/searchmap_models.py +2 -1
  209. mteb/models/model_implementations/seed_1_6_embedding_models.py +8 -2
  210. mteb/models/model_implementations/seed_1_6_embedding_models_1215.py +625 -0
  211. mteb/models/model_implementations/seed_models.py +1 -0
  212. mteb/models/model_implementations/sentence_transformers_models.py +177 -18
  213. mteb/models/model_implementations/shuu_model.py +32 -31
  214. mteb/models/model_implementations/siglip_models.py +30 -20
  215. mteb/models/model_implementations/slm_models.py +416 -0
  216. mteb/models/model_implementations/sonar_models.py +1 -0
  217. mteb/models/model_implementations/spartan8806_atles_champion.py +34 -0
  218. mteb/models/model_implementations/stella_models.py +23 -4
  219. mteb/models/model_implementations/tarka_models.py +376 -0
  220. mteb/models/model_implementations/text2vec_models.py +9 -3
  221. mteb/models/model_implementations/ua_sentence_models.py +11 -1
  222. mteb/models/model_implementations/uae_models.py +8 -1
  223. mteb/models/model_implementations/vdr_models.py +3 -1
  224. mteb/models/model_implementations/vi_vn_models.py +45 -6
  225. mteb/models/model_implementations/vista_models.py +2 -0
  226. mteb/models/model_implementations/vlm2vec_models.py +5 -3
  227. mteb/models/model_implementations/voyage_models.py +99 -0
  228. mteb/models/model_implementations/voyage_v.py +17 -9
  229. mteb/models/model_implementations/xyz_models.py +1 -0
  230. mteb/models/model_implementations/youtu_models.py +2 -1
  231. mteb/models/model_implementations/yuan_models.py +34 -0
  232. mteb/models/model_implementations/yuan_models_en.py +58 -0
  233. mteb/models/model_meta.py +498 -29
  234. mteb/models/models_protocols.py +22 -6
  235. mteb/models/search_encoder_index/__init__.py +7 -0
  236. mteb/models/search_encoder_index/search_backend_protocol.py +50 -0
  237. mteb/models/search_encoder_index/search_indexes/__init__.py +5 -0
  238. mteb/models/search_encoder_index/search_indexes/faiss_search_index.py +160 -0
  239. mteb/models/search_wrappers.py +197 -65
  240. mteb/models/sentence_transformer_wrapper.py +52 -32
  241. mteb/models/vllm_wrapper.py +327 -0
  242. mteb/py.typed +0 -0
  243. mteb/results/benchmark_results.py +114 -65
  244. mteb/results/model_result.py +63 -26
  245. mteb/results/task_result.py +117 -77
  246. mteb/similarity_functions.py +60 -7
  247. mteb/tasks/bitext_mining/multilingual/__init__.py +2 -1
  248. mteb/tasks/bitext_mining/multilingual/bucc_bitext_mining.py +4 -2
  249. mteb/tasks/bitext_mining/multilingual/bucc_bitext_mining_fast.py +1 -1
  250. mteb/tasks/bitext_mining/multilingual/ru_sci_bench_bitext_mining.py +47 -5
  251. mteb/tasks/bitext_mining/multilingual/web_faq_bitext_mining.py +2 -6
  252. mteb/tasks/classification/ara/ajgt.py +1 -2
  253. mteb/tasks/classification/ara/hotel_review_sentiment_classification.py +1 -2
  254. mteb/tasks/classification/ara/online_store_review_sentiment_classification.py +1 -2
  255. mteb/tasks/classification/ara/restaurant_review_sentiment_classification.py +1 -2
  256. mteb/tasks/classification/ara/tweet_emotion_classification.py +1 -2
  257. mteb/tasks/classification/ara/tweet_sarcasm_classification.py +1 -2
  258. mteb/tasks/classification/ben/bengali_document_classification.py +1 -2
  259. mteb/tasks/classification/ben/bengali_hate_speech_classification.py +1 -2
  260. mteb/tasks/classification/ben/bengali_sentiment_analysis.py +1 -2
  261. mteb/tasks/classification/ces/csfdcz_movie_review_sentiment_classification.py +1 -2
  262. mteb/tasks/classification/ces/czech_product_review_sentiment_classification.py +1 -2
  263. mteb/tasks/classification/ces/czech_so_me_sentiment_classification.py +1 -2
  264. mteb/tasks/classification/dan/angry_tweets_classification.py +1 -2
  265. mteb/tasks/classification/dan/danish_political_comments_classification.py +1 -2
  266. mteb/tasks/classification/dan/ddisco_cohesion_classification.py +1 -2
  267. mteb/tasks/classification/dan/dk_hate_classification.py +2 -3
  268. mteb/tasks/classification/deu/german_politicians_twitter_sentiment_classification.py +1 -2
  269. mteb/tasks/classification/deu/ten_k_gnad_classification.py +1 -2
  270. mteb/tasks/classification/eng/amazon_polarity_classification.py +1 -2
  271. mteb/tasks/classification/eng/arxiv_classification.py +1 -2
  272. mteb/tasks/classification/eng/banking77_classification.py +1 -2
  273. mteb/tasks/classification/eng/dbpedia_classification.py +1 -2
  274. mteb/tasks/classification/eng/emotion_classification.py +1 -2
  275. mteb/tasks/classification/eng/financial_phrasebank_classification.py +1 -2
  276. mteb/tasks/classification/eng/frenk_en_classification.py +1 -2
  277. mteb/tasks/classification/eng/gtsrb_classification.py +1 -1
  278. mteb/tasks/classification/eng/imdb_classification.py +1 -2
  279. mteb/tasks/classification/eng/legal_bench_classification.py +14 -120
  280. mteb/tasks/classification/eng/news_classification.py +1 -2
  281. mteb/tasks/classification/eng/patch_camelyon_classification.py +1 -1
  282. mteb/tasks/classification/eng/patent_classification.py +1 -2
  283. mteb/tasks/classification/eng/poem_sentiment_classification.py +1 -2
  284. mteb/tasks/classification/eng/sds_eye_protection_classification.py +1 -2
  285. mteb/tasks/classification/eng/sds_gloves_classification.py +1 -2
  286. mteb/tasks/classification/eng/toxic_chat_classification.py +2 -19
  287. mteb/tasks/classification/eng/toxic_conversations_classification.py +1 -2
  288. mteb/tasks/classification/eng/tweet_sentiment_extraction_classification.py +1 -2
  289. mteb/tasks/classification/eng/tweet_topic_single_classification.py +2 -13
  290. mteb/tasks/classification/eng/ucf101_classification.py +1 -5
  291. mteb/tasks/classification/eng/wikipedia_bio_met_chem_classification.py +1 -2
  292. mteb/tasks/classification/eng/wikipedia_chem_fields_classification.py +1 -2
  293. mteb/tasks/classification/eng/wikipedia_comp_chem_spectroscopy_classification.py +1 -2
  294. mteb/tasks/classification/eng/wikipedia_crystallography_analytical_classification.py +1 -2
  295. mteb/tasks/classification/eng/wikipedia_theoretical_applied_classification.py +1 -2
  296. mteb/tasks/classification/eng/yahoo_answers_topics_classification.py +1 -2
  297. mteb/tasks/classification/eng/yelp_review_full_classification.py +1 -2
  298. mteb/tasks/classification/est/estonian_valence.py +2 -3
  299. mteb/tasks/classification/fas/fa_mteb_classification.py +7 -14
  300. mteb/tasks/classification/fil/filipino_hate_speech_classification.py +1 -2
  301. mteb/tasks/classification/fin/fin_toxicity_classification.py +2 -11
  302. mteb/tasks/classification/fra/french_book_reviews.py +1 -2
  303. mteb/tasks/classification/fra/movie_review_sentiment_classification.py +1 -2
  304. mteb/tasks/classification/guj/gujarati_news_classification.py +1 -2
  305. mteb/tasks/classification/heb/__init__.py +6 -1
  306. mteb/tasks/classification/heb/hebrew_sentiment_analysis.py +62 -4
  307. mteb/tasks/classification/hin/hindi_discourse_classification.py +1 -2
  308. mteb/tasks/classification/hin/sentiment_analysis_hindi.py +1 -2
  309. mteb/tasks/classification/hrv/frenk_hr_classification.py +1 -2
  310. mteb/tasks/classification/ind/indonesian_id_clickbait_classification.py +1 -2
  311. mteb/tasks/classification/ind/indonesian_mongabay_conservation_classification.py +1 -2
  312. mteb/tasks/classification/ita/italian_linguist_acceptability_classification.py +1 -2
  313. mteb/tasks/classification/jav/javanese_imdb_classification.py +1 -2
  314. mteb/tasks/classification/jpn/wrime_classification.py +1 -2
  315. mteb/tasks/classification/kan/kannada_news_classification.py +1 -2
  316. mteb/tasks/classification/kor/klue_tc.py +1 -2
  317. mteb/tasks/classification/kor/kor_hate_classification.py +2 -17
  318. mteb/tasks/classification/kor/kor_sarcasm_classification.py +2 -19
  319. mteb/tasks/classification/kur/kurdish_sentiment_classification.py +3 -4
  320. mteb/tasks/classification/mal/malayalam_news_classification.py +1 -2
  321. mteb/tasks/classification/mar/marathi_news_classification.py +1 -2
  322. mteb/tasks/classification/mkd/macedonian_tweet_sentiment_classification.py +1 -2
  323. mteb/tasks/classification/multilingual/catalonia_tweet_classification.py +1 -6
  324. mteb/tasks/classification/multilingual/multi_hate_classification.py +1 -4
  325. mteb/tasks/classification/multilingual/ru_sci_bench_classification.py +4 -23
  326. mteb/tasks/classification/multilingual/scala_classification.py +2 -3
  327. mteb/tasks/classification/multilingual/sib200_classification.py +1 -6
  328. mteb/tasks/classification/mya/myanmar_news.py +1 -2
  329. mteb/tasks/classification/nep/nepali_news_classification.py +1 -2
  330. mteb/tasks/classification/nld/dutch_book_review_sentiment_classification.py +4 -2
  331. mteb/tasks/classification/nld/dutch_cola_classification.py +3 -0
  332. mteb/tasks/classification/nld/dutch_government_bias_classification.py +3 -0
  333. mteb/tasks/classification/nld/dutch_news_articles_classification.py +3 -0
  334. mteb/tasks/classification/nld/dutch_sarcastic_headlines_classification.py +3 -0
  335. mteb/tasks/classification/nld/iconclass_classification.py +3 -0
  336. mteb/tasks/classification/nld/open_tender_classification.py +3 -0
  337. mteb/tasks/classification/nld/vaccin_chat_nl_classification.py +3 -0
  338. mteb/tasks/classification/nob/no_rec_classification.py +1 -2
  339. mteb/tasks/classification/nob/norwegian_parliament_classification.py +1 -2
  340. mteb/tasks/classification/ory/odia_news_classification.py +1 -2
  341. mteb/tasks/classification/pol/polish_classification.py +3 -6
  342. mteb/tasks/classification/ron/moroco.py +1 -2
  343. mteb/tasks/classification/ron/romanian_reviews_sentiment.py +1 -2
  344. mteb/tasks/classification/ron/romanian_sentiment_classification.py +1 -2
  345. mteb/tasks/classification/rus/georeview_classification.py +1 -2
  346. mteb/tasks/classification/rus/headline_classification.py +1 -2
  347. mteb/tasks/classification/rus/inappropriateness_classification.py +1 -2
  348. mteb/tasks/classification/rus/ru_reviews_classification.py +1 -2
  349. mteb/tasks/classification/rus/ru_toixic_classification_okmlcup.py +1 -2
  350. mteb/tasks/classification/rus/senti_ru_eval.py +1 -2
  351. mteb/tasks/classification/sin/sinhala_news_classification.py +1 -2
  352. mteb/tasks/classification/sin/sinhala_news_source_classification.py +1 -2
  353. mteb/tasks/classification/slk/csfdsk_movie_review_sentiment_classification.py +1 -2
  354. mteb/tasks/classification/slk/slovak_hate_speech_classification.py +1 -2
  355. mteb/tasks/classification/slk/slovak_movie_review_sentiment_classification.py +1 -2
  356. mteb/tasks/classification/slv/frenk_sl_classification.py +1 -2
  357. mteb/tasks/classification/spa/spanish_news_classification.py +1 -2
  358. mteb/tasks/classification/spa/spanish_sentiment_classification.py +1 -2
  359. mteb/tasks/classification/ssw/siswati_news_classification.py +1 -2
  360. mteb/tasks/classification/swa/swahili_news_classification.py +1 -2
  361. mteb/tasks/classification/swe/dalaj_classification.py +1 -2
  362. mteb/tasks/classification/swe/swe_rec_classification.py +1 -2
  363. mteb/tasks/classification/swe/swedish_sentiment_classification.py +1 -2
  364. mteb/tasks/classification/tam/tamil_news_classification.py +1 -2
  365. mteb/tasks/classification/tel/telugu_andhra_jyoti_news_classification.py +1 -2
  366. mteb/tasks/classification/tha/wisesight_sentiment_classification.py +1 -2
  367. mteb/tasks/classification/tsn/tswana_news_classification.py +1 -2
  368. mteb/tasks/classification/tur/__init__.py +4 -0
  369. mteb/tasks/classification/tur/turkish_constitutional_court.py +41 -0
  370. mteb/tasks/classification/tur/turkish_movie_sentiment_classification.py +1 -2
  371. mteb/tasks/classification/tur/turkish_product_sentiment_classification.py +1 -2
  372. mteb/tasks/classification/ukr/ukr_formality_classification.py +2 -15
  373. mteb/tasks/classification/urd/urdu_roman_sentiment_classification.py +1 -2
  374. mteb/tasks/classification/vie/amazon_counterfactual_vn_classification.py +1 -6
  375. mteb/tasks/classification/vie/amazon_polarity_vn_classification.py +1 -6
  376. mteb/tasks/classification/vie/amazon_reviews_vn_classification.py +1 -5
  377. mteb/tasks/classification/vie/banking77_vn_classification.py +1 -5
  378. mteb/tasks/classification/vie/emotion_vn_classification.py +1 -5
  379. mteb/tasks/classification/vie/imdb_vn_classification.py +1 -5
  380. mteb/tasks/classification/vie/massive_intent_vn_classification.py +1 -5
  381. mteb/tasks/classification/vie/massive_scenario_vn_classification.py +1 -5
  382. mteb/tasks/classification/vie/mtop_domain_vn_classification.py +1 -5
  383. mteb/tasks/classification/vie/mtop_intent_vn_classification.py +1 -5
  384. mteb/tasks/classification/vie/toxic_conversations_vn_classification.py +1 -5
  385. mteb/tasks/classification/vie/tweet_sentiment_extraction_vn_classification.py +1 -5
  386. mteb/tasks/classification/vie/vie_student_feedback_classification.py +1 -2
  387. mteb/tasks/classification/zho/cmteb_classification.py +5 -10
  388. mteb/tasks/classification/zho/yue_openrice_review_classification.py +1 -2
  389. mteb/tasks/classification/zul/isi_zulu_news_classification.py +1 -2
  390. mteb/tasks/clustering/eng/hume_wiki_cities_clustering.py +1 -1
  391. mteb/tasks/clustering/eng/wiki_cities_clustering.py +1 -1
  392. mteb/tasks/clustering/jpn/mews_c16_ja_clustering.py +1 -3
  393. mteb/tasks/clustering/multilingual/sib200_clustering_s2s.py +1 -6
  394. mteb/tasks/clustering/nld/dutch_news_articles_clustering_p2p.py +3 -0
  395. mteb/tasks/clustering/nld/dutch_news_articles_clustering_s2s.py +3 -0
  396. mteb/tasks/clustering/nld/iconclass_clustering_s2s.py +3 -0
  397. mteb/tasks/clustering/nld/open_tender_clustering_p2p.py +3 -0
  398. mteb/tasks/clustering/nld/open_tender_clustering_s2s.py +3 -0
  399. mteb/tasks/clustering/nld/vabb_clustering_p2p.py +3 -0
  400. mteb/tasks/clustering/nld/vabb_clustering_s2s.py +3 -0
  401. mteb/tasks/clustering/vie/reddit_clustering_p2p_vn.py +1 -5
  402. mteb/tasks/clustering/vie/reddit_clustering_vn.py +1 -5
  403. mteb/tasks/clustering/vie/stack_exchange_clustering_p2p_vn.py +1 -5
  404. mteb/tasks/clustering/vie/stack_exchange_clustering_vn.py +1 -5
  405. mteb/tasks/clustering/vie/twenty_newsgroups_clustering_vn.py +1 -5
  406. mteb/tasks/clustering/zho/cmteb_clustering.py +2 -2
  407. mteb/tasks/image_text_pair_classification/eng/sugar_crepe.py +1 -1
  408. mteb/tasks/multilabel_classification/ita/emit_classification.py +1 -5
  409. mteb/tasks/multilabel_classification/kor/kor_hate_speech_ml_classification.py +1 -9
  410. mteb/tasks/multilabel_classification/mlt/maltese_news_classification.py +1 -6
  411. mteb/tasks/multilabel_classification/nld/covid_disinformation_nl_multi_label_classification.py +3 -0
  412. mteb/tasks/multilabel_classification/nld/vabb_multi_label_classification.py +3 -0
  413. mteb/tasks/multilabel_classification/por/brazilian_toxic_tweets_classification.py +1 -6
  414. mteb/tasks/multilabel_classification/swe/swedish_patent_cpc_group_classification.py +1 -1
  415. mteb/tasks/multilabel_classification/swe/swedish_patent_cpc_subclass_classification.py +1 -2
  416. mteb/tasks/pair_classification/dan/talemaader_pc.py +1 -6
  417. mteb/tasks/pair_classification/eng/legal_bench_pc.py +1 -9
  418. mteb/tasks/pair_classification/nld/sick_nl_pair_classification.py +3 -0
  419. mteb/tasks/pair_classification/nld/xlwic_nl_pair_classification.py +3 -0
  420. mteb/tasks/pair_classification/rus/__init__.py +2 -2
  421. mteb/tasks/pair_classification/rus/terra.py +51 -25
  422. mteb/tasks/pair_classification/vie/sprint_duplicate_questions_pcvn.py +1 -5
  423. mteb/tasks/pair_classification/vie/twitter_sem_eval2015_pcvn.py +1 -5
  424. mteb/tasks/pair_classification/vie/twitter_url_corpus_pcvn.py +1 -5
  425. mteb/tasks/regression/multilingual/ru_sci_bench_regression.py +2 -6
  426. mteb/tasks/reranking/jpn/__init__.py +9 -1
  427. mteb/tasks/reranking/jpn/j_qa_ra_reranking_lite.py +49 -0
  428. mteb/tasks/reranking/jpn/ja_cwir_reranking_lite.py +47 -0
  429. mteb/tasks/reranking/multilingual/__init__.py +2 -0
  430. mteb/tasks/reranking/multilingual/multi_long_doc_reranking.py +70 -0
  431. mteb/tasks/reranking/multilingual/wikipedia_reranking_multilingual.py +1 -1
  432. mteb/tasks/reranking/multilingual/x_glue_wpr_reranking.py +1 -2
  433. mteb/tasks/reranking/vie/ask_ubuntu_dup_questions_vn.py +1 -5
  434. mteb/tasks/reranking/vie/sci_docs_reranking_vn.py +1 -5
  435. mteb/tasks/reranking/vie/stack_overflow_dup_questions_vn.py +1 -5
  436. mteb/tasks/retrieval/code/code_rag.py +12 -12
  437. mteb/tasks/retrieval/code/fresh_stack_retrieval.py +8 -5
  438. mteb/tasks/retrieval/dan/dan_fever_retrieval.py +1 -1
  439. mteb/tasks/retrieval/dan/tv2_nordretrieval.py +2 -2
  440. mteb/tasks/retrieval/dan/twitter_hjerne_retrieval.py +2 -2
  441. mteb/tasks/retrieval/eng/__init__.py +2 -0
  442. mteb/tasks/retrieval/eng/chemrxiv.py +33 -0
  443. mteb/tasks/retrieval/eng/cub200_i2i_retrieval.py +1 -1
  444. mteb/tasks/retrieval/eng/lit_search_retrieval.py +1 -8
  445. mteb/tasks/retrieval/eng/vidore_bench_retrieval.py +4 -0
  446. mteb/tasks/retrieval/jpn/__init__.py +8 -0
  447. mteb/tasks/retrieval/jpn/ja_cwir_retrieval.py +1 -4
  448. mteb/tasks/retrieval/jpn/ja_cwir_retrieval_lite.py +47 -0
  449. mteb/tasks/retrieval/jpn/jaqket_retrieval_lite.py +50 -0
  450. mteb/tasks/retrieval/jpn/miracl_ja_retrieval_lite.py +52 -0
  451. mteb/tasks/retrieval/jpn/mr_tydi_ja_retrieval_lite.py +48 -0
  452. mteb/tasks/retrieval/kat/georgian_faq_retrieval.py +11 -4
  453. mteb/tasks/retrieval/kor/__init__.py +16 -1
  454. mteb/tasks/retrieval/kor/kovidore2_bench_retrieval.py +142 -0
  455. mteb/tasks/retrieval/kor/squad_kor_v1_retrieval.py +47 -0
  456. mteb/tasks/retrieval/multilingual/__init__.py +24 -0
  457. mteb/tasks/retrieval/multilingual/belebele_retrieval.py +5 -4
  458. mteb/tasks/retrieval/multilingual/euro_pirq_retrieval.py +43 -0
  459. mteb/tasks/retrieval/multilingual/jina_vdr_bench_retrieval.py +56 -42
  460. mteb/tasks/retrieval/multilingual/mkqa_retrieval.py +1 -2
  461. mteb/tasks/retrieval/multilingual/mlqa_retrieval.py +1 -4
  462. mteb/tasks/retrieval/multilingual/multi_long_doc_retrieval.py +1 -2
  463. mteb/tasks/retrieval/multilingual/public_health_qa_retrieval.py +9 -4
  464. mteb/tasks/retrieval/multilingual/ru_sci_bench_retrieval.py +2 -12
  465. mteb/tasks/retrieval/multilingual/vidore2_bench_retrieval.py +4 -2
  466. mteb/tasks/retrieval/multilingual/vidore3_bench_retrieval.py +389 -0
  467. mteb/tasks/retrieval/nld/__init__.py +8 -4
  468. mteb/tasks/retrieval/nld/argu_ana_nl_retrieval.py +46 -27
  469. mteb/tasks/retrieval/nld/bbsard_nl_retrieval.py +3 -0
  470. mteb/tasks/retrieval/nld/dutch_news_articles_retrieval.py +3 -0
  471. mteb/tasks/retrieval/nld/legal_qa_nl_retrieval.py +3 -0
  472. mteb/tasks/retrieval/nld/nf_corpus_nl_retrieval.py +42 -25
  473. mteb/tasks/retrieval/nld/open_tender_retrieval.py +3 -0
  474. mteb/tasks/retrieval/nld/sci_fact_nl_retrieval.py +42 -24
  475. mteb/tasks/retrieval/nld/scidocsnl_retrieval.py +44 -27
  476. mteb/tasks/retrieval/nld/vabb_retrieval.py +3 -0
  477. mteb/tasks/retrieval/nob/norquad.py +2 -2
  478. mteb/tasks/retrieval/nob/snl_retrieval.py +2 -2
  479. mteb/tasks/retrieval/slk/slovak_sum_retrieval.py +1 -7
  480. mteb/tasks/retrieval/tur/tur_hist_quad.py +1 -1
  481. mteb/tasks/retrieval/vie/__init__.py +14 -6
  482. mteb/tasks/retrieval/vie/argu_ana_vn_retrieval.py +1 -5
  483. mteb/tasks/retrieval/vie/climate_fevervn_retrieval.py +40 -5
  484. mteb/tasks/retrieval/vie/cqa_dupstack_android_vn_retrieval.py +1 -5
  485. mteb/tasks/retrieval/vie/cqa_dupstack_gis_vn_retrieval.py +1 -5
  486. mteb/tasks/retrieval/vie/cqa_dupstack_mathematica_vn_retrieval.py +1 -5
  487. mteb/tasks/retrieval/vie/cqa_dupstack_physics_vn_retrieval.py +1 -5
  488. mteb/tasks/retrieval/vie/cqa_dupstack_programmers_vn_retrieval.py +1 -5
  489. mteb/tasks/retrieval/vie/cqa_dupstack_stats_vn_retrieval.py +1 -5
  490. mteb/tasks/retrieval/vie/cqa_dupstack_tex_vn_retrieval.py +1 -5
  491. mteb/tasks/retrieval/vie/cqa_dupstack_unix_vn_retrieval.py +1 -5
  492. mteb/tasks/retrieval/vie/cqa_dupstack_webmasters_vn_retrieval.py +1 -5
  493. mteb/tasks/retrieval/vie/cqa_dupstack_wordpress_vn_retrieval.py +1 -5
  494. mteb/tasks/retrieval/vie/db_pedia_vn_retrieval.py +40 -5
  495. mteb/tasks/retrieval/vie/fevervn_retrieval.py +40 -7
  496. mteb/tasks/retrieval/vie/fi_qa2018_vn_retrieval.py +1 -5
  497. mteb/tasks/retrieval/vie/green_node_table_markdown_retrieval.py +16 -1
  498. mteb/tasks/retrieval/vie/hotpot_qavn_retrieval.py +40 -6
  499. mteb/tasks/retrieval/vie/msmarcovn_retrieval.py +49 -5
  500. mteb/tasks/retrieval/vie/nf_corpus_vn_retrieval.py +1 -5
  501. mteb/tasks/retrieval/vie/nqvn_retrieval.py +40 -5
  502. mteb/tasks/retrieval/vie/quora_vn_retrieval.py +1 -6
  503. mteb/tasks/retrieval/vie/sci_fact_vn_retrieval.py +1 -5
  504. mteb/tasks/retrieval/vie/scidocsvn_retrieval.py +1 -6
  505. mteb/tasks/retrieval/vie/touche2020_vn_retrieval.py +1 -5
  506. mteb/tasks/retrieval/vie/treccovidvn_retrieval.py +1 -5
  507. mteb/tasks/retrieval/vie/tvpl_retrieval.py +42 -0
  508. mteb/tasks/retrieval/vie/zac_legal_text_retrieval.py +15 -1
  509. mteb/tasks/sts/nld/sick_nl_sts.py +1 -0
  510. mteb/tasks/sts/vie/biosses_stsvn.py +1 -5
  511. mteb/tasks/sts/vie/sickr_stsvn.py +1 -5
  512. mteb/tasks/sts/vie/sts_benchmark_stsvn.py +1 -5
  513. mteb/tasks/zeroshot_classification/eng/gtsrb.py +1 -1
  514. mteb/tasks/zeroshot_classification/eng/patch_camelyon.py +1 -1
  515. mteb/tasks/zeroshot_classification/eng/ucf101.py +1 -5
  516. mteb/types/__init__.py +2 -0
  517. mteb/types/_encoder_io.py +19 -2
  518. mteb/types/_result.py +2 -1
  519. mteb/types/statistics.py +9 -3
  520. {mteb-2.1.4.dist-info → mteb-2.7.2.dist-info}/METADATA +25 -8
  521. {mteb-2.1.4.dist-info → mteb-2.7.2.dist-info}/RECORD +525 -438
  522. mteb/models/model_implementations/mxbai_models.py +0 -102
  523. mteb/models/model_implementations/nb_sbert.py +0 -25
  524. {mteb-2.1.4.dist-info → mteb-2.7.2.dist-info}/WHEEL +0 -0
  525. {mteb-2.1.4.dist-info → mteb-2.7.2.dist-info}/entry_points.txt +0 -0
  526. {mteb-2.1.4.dist-info → mteb-2.7.2.dist-info}/licenses/LICENSE +0 -0
  527. {mteb-2.1.4.dist-info → mteb-2.7.2.dist-info}/top_level.txt +0 -0
@@ -104,8 +104,9 @@ dinov2_training_datasets = set(
104
104
 
105
105
 
106
106
  dinov2_small = ModelMeta(
107
- loader=DINOModel, # type: ignore
107
+ loader=DINOModel,
108
108
  name="facebook/dinov2-small",
109
+ model_type=["dense"],
109
110
  languages=["eng-Latn"],
110
111
  revision="ed25f3a31f01632728cabb09d1542f84ab7b0056",
111
112
  release_date="2023-07-18",
@@ -118,16 +119,25 @@ dinov2_small = ModelMeta(
118
119
  open_weights=True,
119
120
  public_training_code="https://github.com/facebookresearch/dinov2",
120
121
  public_training_data=None,
121
- framework=["PyTorch"],
122
+ framework=["PyTorch", "Transformers", "safetensors"],
122
123
  reference="https://huggingface.co/facebook/dinov2-small",
123
124
  similarity_fn_name=ScoringFunction.COSINE,
124
125
  use_instructions=False,
125
126
  training_datasets=dinov2_training_datasets,
127
+ citation="""@misc{oquab2023dinov2,
128
+ title={DINOv2: Learning Robust Visual Features without Supervision},
129
+ author={Maxime Oquab and Timothée Darcet and Théo Moutakanni and Huy Vo and Marc Szafraniec and Vasil Khalidov and Pierre Fernandez and Daniel Haziza and Francisco Massa and Alaaeldin El-Nouby and Mahmoud Assran and Nicolas Ballas and Wojciech Galuba and Russell Howes and Po-Yao Huang and Shang-Wen Li and Ishan Misra and Michael Rabbat and Vasu Sharma and Gabriel Synnaeve and Hu Xu and Hervé Jegou and Julien Mairal and Patrick Labatut and Armand Joulin and Piotr Bojanowski},
130
+ year={2023},
131
+ eprint={2304.07193},
132
+ archivePrefix={arXiv},
133
+ primaryClass={cs.CV}
134
+ }""",
126
135
  )
127
136
 
128
137
  dinov2_base = ModelMeta(
129
- loader=DINOModel, # type: ignore
138
+ loader=DINOModel,
130
139
  name="facebook/dinov2-base",
140
+ model_type=["dense"],
131
141
  languages=["eng-Latn"],
132
142
  revision="f9e44c814b77203eaa57a6bdbbd535f21ede1415",
133
143
  release_date="2023-07-18",
@@ -140,16 +150,25 @@ dinov2_base = ModelMeta(
140
150
  open_weights=True,
141
151
  public_training_code="https://github.com/facebookresearch/dinov2",
142
152
  public_training_data=None,
143
- framework=["PyTorch"],
153
+ framework=["PyTorch", "Transformers", "safetensors"],
144
154
  reference="https://huggingface.co/facebook/dinov2-base",
145
155
  similarity_fn_name=ScoringFunction.COSINE,
146
156
  use_instructions=False,
147
157
  training_datasets=dinov2_training_datasets,
158
+ citation="""@misc{oquab2023dinov2,
159
+ title={DINOv2: Learning Robust Visual Features without Supervision},
160
+ author={Maxime Oquab and Timothée Darcet and Théo Moutakanni and Huy Vo and Marc Szafraniec and Vasil Khalidov and Pierre Fernandez and Daniel Haziza and Francisco Massa and Alaaeldin El-Nouby and Mahmoud Assran and Nicolas Ballas and Wojciech Galuba and Russell Howes and Po-Yao Huang and Shang-Wen Li and Ishan Misra and Michael Rabbat and Vasu Sharma and Gabriel Synnaeve and Hu Xu and Hervé Jegou and Julien Mairal and Patrick Labatut and Armand Joulin and Piotr Bojanowski},
161
+ year={2023},
162
+ eprint={2304.07193},
163
+ archivePrefix={arXiv},
164
+ primaryClass={cs.CV}
165
+ }""",
148
166
  )
149
167
 
150
168
  dinov2_large = ModelMeta(
151
- loader=DINOModel, # type: ignore
169
+ loader=DINOModel,
152
170
  name="facebook/dinov2-large",
171
+ model_type=["dense"],
153
172
  languages=["eng-Latn"],
154
173
  revision="47b73eefe95e8d44ec3623f8890bd894b6ea2d6c",
155
174
  release_date="2023-07-18",
@@ -162,16 +181,25 @@ dinov2_large = ModelMeta(
162
181
  open_weights=True,
163
182
  public_training_code="https://github.com/facebookresearch/dinov2",
164
183
  public_training_data=None,
165
- framework=["PyTorch"],
184
+ framework=["PyTorch", "Transformers", "safetensors"],
166
185
  reference="https://huggingface.co/facebook/dinov2-large",
167
186
  similarity_fn_name=ScoringFunction.COSINE,
168
187
  use_instructions=False,
169
188
  training_datasets=dinov2_training_datasets,
189
+ citation="""@misc{oquab2023dinov2,
190
+ title={DINOv2: Learning Robust Visual Features without Supervision},
191
+ author={Maxime Oquab and Timothée Darcet and Théo Moutakanni and Huy Vo and Marc Szafraniec and Vasil Khalidov and Pierre Fernandez and Daniel Haziza and Francisco Massa and Alaaeldin El-Nouby and Mahmoud Assran and Nicolas Ballas and Wojciech Galuba and Russell Howes and Po-Yao Huang and Shang-Wen Li and Ishan Misra and Michael Rabbat and Vasu Sharma and Gabriel Synnaeve and Hu Xu and Hervé Jegou and Julien Mairal and Patrick Labatut and Armand Joulin and Piotr Bojanowski},
192
+ year={2023},
193
+ eprint={2304.07193},
194
+ archivePrefix={arXiv},
195
+ primaryClass={cs.CV}
196
+ }""",
170
197
  )
171
198
 
172
199
  dinov2_giant = ModelMeta(
173
- loader=DINOModel, # type: ignore
200
+ loader=DINOModel,
174
201
  name="facebook/dinov2-giant",
202
+ model_type=["dense"],
175
203
  languages=["eng-Latn"],
176
204
  revision="611a9d42f2335e0f921f1e313ad3c1b7178d206d",
177
205
  release_date="2023-07-18",
@@ -184,11 +212,19 @@ dinov2_giant = ModelMeta(
184
212
  open_weights=True,
185
213
  public_training_code="https://github.com/facebookresearch/dinov2",
186
214
  public_training_data=None,
187
- framework=["PyTorch"],
215
+ framework=["PyTorch", "Transformers", "safetensors"],
188
216
  reference="https://huggingface.co/facebook/dinov2-giant",
189
217
  similarity_fn_name=ScoringFunction.COSINE,
190
218
  use_instructions=False,
191
219
  training_datasets=dinov2_training_datasets,
220
+ citation="""@misc{oquab2023dinov2,
221
+ title={DINOv2: Learning Robust Visual Features without Supervision},
222
+ author={Maxime Oquab and Timothée Darcet and Théo Moutakanni and Huy Vo and Marc Szafraniec and Vasil Khalidov and Pierre Fernandez and Daniel Haziza and Francisco Massa and Alaaeldin El-Nouby and Mahmoud Assran and Nicolas Ballas and Wojciech Galuba and Russell Howes and Po-Yao Huang and Shang-Wen Li and Ishan Misra and Michael Rabbat and Vasu Sharma and Gabriel Synnaeve and Hu Xu and Hervé Jegou and Julien Mairal and Patrick Labatut and Armand Joulin and Piotr Bojanowski},
223
+ year={2023},
224
+ eprint={2304.07193},
225
+ archivePrefix={arXiv},
226
+ primaryClass={cs.CV}
227
+ }""",
192
228
  )
193
229
 
194
230
  webssl_dino_training_datasets = set(
@@ -198,6 +234,7 @@ webssl_dino_training_datasets = set(
198
234
  webssl_dino300m_full2b = ModelMeta(
199
235
  loader=DINOModel,
200
236
  name="facebook/webssl-dino300m-full2b-224",
237
+ model_type=["dense"],
201
238
  languages=["eng-Latn"],
202
239
  revision="8529cdb3fb75014932af3b896455fc21c386168e",
203
240
  release_date="2025-04-24",
@@ -210,16 +247,25 @@ webssl_dino300m_full2b = ModelMeta(
210
247
  open_weights=True,
211
248
  public_training_code="",
212
249
  public_training_data=None,
213
- framework=["PyTorch"],
250
+ framework=["PyTorch", "Transformers", "safetensors"],
214
251
  reference="https://huggingface.co/facebook/webssl-dino300m-full2b-224",
215
252
  similarity_fn_name=None,
216
253
  use_instructions=False,
217
254
  training_datasets=webssl_dino_training_datasets,
255
+ citation="""@article{fan2025scaling,
256
+ title={Scaling Language-Free Visual Representation Learning},
257
+ author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
258
+ year={2025},
259
+ eprint={2504.01017},
260
+ archivePrefix={arXiv},
261
+ primaryClass={cs.CV}
262
+ }""",
218
263
  )
219
264
 
220
265
  webssl_dino1b_full2b = ModelMeta(
221
266
  loader=DINOModel,
222
267
  name="facebook/webssl-dino1b-full2b-224",
268
+ model_type=["dense"],
223
269
  languages=["eng-Latn"],
224
270
  revision="d3bf033d9c8cc62ea9e73c40956642cad2ec568a",
225
271
  release_date="2025-04-24",
@@ -232,16 +278,25 @@ webssl_dino1b_full2b = ModelMeta(
232
278
  open_weights=True,
233
279
  public_training_code="",
234
280
  public_training_data=None,
235
- framework=["PyTorch"],
281
+ framework=["PyTorch", "Transformers", "safetensors"],
236
282
  reference="https://huggingface.co/facebook/webssl-dino1b-full2b-224",
237
283
  similarity_fn_name=None,
238
284
  use_instructions=False,
239
285
  training_datasets=webssl_dino_training_datasets,
286
+ citation="""@article{fan2025scaling,
287
+ title={Scaling Language-Free Visual Representation Learning},
288
+ author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
289
+ year={2025},
290
+ eprint={2504.01017},
291
+ archivePrefix={arXiv},
292
+ primaryClass={cs.CV}
293
+ }""",
240
294
  )
241
295
 
242
296
  webssl_dino2b_full2b = ModelMeta(
243
297
  loader=DINOModel,
244
298
  name="facebook/webssl-dino2b-full2b-224",
299
+ model_type=["dense"],
245
300
  languages=["eng-Latn"],
246
301
  revision="cd5893e3fd2e988eb716792049b3dd53b3f1b68b",
247
302
  release_date="2025-04-24",
@@ -254,16 +309,25 @@ webssl_dino2b_full2b = ModelMeta(
254
309
  open_weights=True,
255
310
  public_training_code="",
256
311
  public_training_data=None,
257
- framework=["PyTorch"],
312
+ framework=["PyTorch", "Transformers", "safetensors"],
258
313
  reference="https://huggingface.co/facebook/webssl-dino2b-full2b-224",
259
314
  similarity_fn_name=None,
260
315
  use_instructions=False,
261
316
  training_datasets=webssl_dino_training_datasets,
317
+ citation="""@article{fan2025scaling,
318
+ title={Scaling Language-Free Visual Representation Learning},
319
+ author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
320
+ year={2025},
321
+ eprint={2504.01017},
322
+ archivePrefix={arXiv},
323
+ primaryClass={cs.CV}
324
+ }""",
262
325
  )
263
326
 
264
327
  webssl_dino3b_full2b = ModelMeta(
265
328
  loader=DINOModel,
266
329
  name="facebook/webssl-dino3b-full2b-224",
330
+ model_type=["dense"],
267
331
  languages=["eng-Latn"],
268
332
  revision="2d015c340b16bc47bc6557fcb4e6c83a9d4aa1d3",
269
333
  release_date="2025-04-24",
@@ -276,16 +340,25 @@ webssl_dino3b_full2b = ModelMeta(
276
340
  open_weights=True,
277
341
  public_training_code="",
278
342
  public_training_data=None,
279
- framework=["PyTorch"],
343
+ framework=["PyTorch", "Transformers", "safetensors"],
280
344
  reference="https://huggingface.co/facebook/webssl-dino3b-full2b-224",
281
345
  similarity_fn_name=None,
282
346
  use_instructions=False,
283
347
  training_datasets=webssl_dino_training_datasets,
348
+ citation="""@article{fan2025scaling,
349
+ title={Scaling Language-Free Visual Representation Learning},
350
+ author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
351
+ year={2025},
352
+ eprint={2504.01017},
353
+ archivePrefix={arXiv},
354
+ primaryClass={cs.CV}
355
+ }""",
284
356
  )
285
357
 
286
358
  webssl_dino5b_full2b = ModelMeta(
287
359
  loader=DINOModel,
288
360
  name="facebook/webssl-dino5b-full2b-224",
361
+ model_type=["dense"],
289
362
  languages=["eng-Latn"],
290
363
  revision="88006b18b9af369f6c611db7a64d908bde3714e0",
291
364
  release_date="2025-04-24",
@@ -298,16 +371,25 @@ webssl_dino5b_full2b = ModelMeta(
298
371
  open_weights=True,
299
372
  public_training_code="",
300
373
  public_training_data=None,
301
- framework=["PyTorch"],
374
+ framework=["PyTorch", "Transformers", "safetensors"],
302
375
  reference="https://huggingface.co/facebook/webssl-dino5b-full2b-224",
303
376
  similarity_fn_name=None,
304
377
  use_instructions=False,
305
378
  training_datasets=webssl_dino_training_datasets,
379
+ citation="""@article{fan2025scaling,
380
+ title={Scaling Language-Free Visual Representation Learning},
381
+ author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
382
+ year={2025},
383
+ eprint={2504.01017},
384
+ archivePrefix={arXiv},
385
+ primaryClass={cs.CV}
386
+ }""",
306
387
  )
307
388
 
308
389
  webssl_dino7b_full8b_224 = ModelMeta(
309
390
  loader=DINOModel,
310
391
  name="facebook/webssl-dino7b-full8b-224",
392
+ model_type=["dense"],
311
393
  languages=["eng-Latn"],
312
394
  revision="c6085463ea680043042a80c6d41db2c65e85f466",
313
395
  release_date="2025-04-24",
@@ -320,16 +402,25 @@ webssl_dino7b_full8b_224 = ModelMeta(
320
402
  open_weights=True,
321
403
  public_training_code="",
322
404
  public_training_data=None,
323
- framework=["PyTorch"],
405
+ framework=["PyTorch", "Transformers", "safetensors"],
324
406
  reference="https://huggingface.co/facebook/webssl-dino7b-full8b-224",
325
407
  similarity_fn_name=None,
326
408
  use_instructions=False,
327
409
  training_datasets=webssl_dino_training_datasets,
410
+ citation="""@article{fan2025scaling,
411
+ title={Scaling Language-Free Visual Representation Learning},
412
+ author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
413
+ year={2025},
414
+ eprint={2504.01017},
415
+ archivePrefix={arXiv},
416
+ primaryClass={cs.CV}
417
+ }""",
328
418
  )
329
419
 
330
420
  webssl_dino7b_full8b_378 = ModelMeta(
331
421
  loader=DINOModel,
332
422
  name="facebook/webssl-dino7b-full8b-378",
423
+ model_type=["dense"],
333
424
  languages=["eng-Latn"],
334
425
  revision="53c8c5b43070bd2ddb3f66161140408ce832301f",
335
426
  release_date="2025-04-24",
@@ -342,16 +433,25 @@ webssl_dino7b_full8b_378 = ModelMeta(
342
433
  open_weights=True,
343
434
  public_training_code="",
344
435
  public_training_data=None,
345
- framework=["PyTorch"],
436
+ framework=["PyTorch", "Transformers", "safetensors"],
346
437
  reference="https://huggingface.co/facebook/webssl-dino7b-full8b-378",
347
438
  similarity_fn_name=None,
348
439
  use_instructions=False,
349
440
  training_datasets=webssl_dino_training_datasets,
441
+ citation="""@article{fan2025scaling,
442
+ title={Scaling Language-Free Visual Representation Learning},
443
+ author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
444
+ year={2025},
445
+ eprint={2504.01017},
446
+ archivePrefix={arXiv},
447
+ primaryClass={cs.CV}
448
+ }""",
350
449
  )
351
450
 
352
451
  webssl_dino7b_full8b_518 = ModelMeta(
353
452
  loader=DINOModel,
354
453
  name="facebook/webssl-dino7b-full8b-518",
454
+ model_type=["dense"],
355
455
  languages=["eng-Latn"],
356
456
  revision="aee350d2c5e3e5fdb7ee6985291d808ea5eef431",
357
457
  release_date="2025-04-24",
@@ -364,17 +464,26 @@ webssl_dino7b_full8b_518 = ModelMeta(
364
464
  open_weights=True,
365
465
  public_training_code="",
366
466
  public_training_data=None,
367
- framework=["PyTorch"],
467
+ framework=["PyTorch", "Transformers", "safetensors"],
368
468
  reference="https://huggingface.co/facebook/webssl-dino7b-full8b-518",
369
469
  similarity_fn_name=None,
370
470
  use_instructions=False,
371
471
  training_datasets=webssl_dino_training_datasets,
472
+ citation="""@article{fan2025scaling,
473
+ title={Scaling Language-Free Visual Representation Learning},
474
+ author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
475
+ year={2025},
476
+ eprint={2504.01017},
477
+ archivePrefix={arXiv},
478
+ primaryClass={cs.CV}
479
+ }""",
372
480
  )
373
481
 
374
482
 
375
483
  webssl_dino2b_light2b = ModelMeta(
376
484
  loader=DINOModel,
377
485
  name="facebook/webssl-dino2b-light2b-224",
486
+ model_type=["dense"],
378
487
  languages=["eng-Latn"],
379
488
  revision="633a663f304e63cc3cbec3f7f9ca2fbc94736128",
380
489
  release_date="2025-04-24",
@@ -387,16 +496,25 @@ webssl_dino2b_light2b = ModelMeta(
387
496
  open_weights=True,
388
497
  public_training_code="",
389
498
  public_training_data=None,
390
- framework=["PyTorch"],
499
+ framework=["PyTorch", "Transformers", "safetensors"],
391
500
  reference="https://huggingface.co/facebook/webssl-dino2b-light2b-224",
392
501
  similarity_fn_name=None,
393
502
  use_instructions=False,
394
503
  training_datasets=webssl_dino_training_datasets,
504
+ citation="""@article{fan2025scaling,
505
+ title={Scaling Language-Free Visual Representation Learning},
506
+ author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
507
+ year={2025},
508
+ eprint={2504.01017},
509
+ archivePrefix={arXiv},
510
+ primaryClass={cs.CV}
511
+ }""",
395
512
  )
396
513
 
397
514
  webssl_dino2b_heavy2b = ModelMeta(
398
515
  loader=DINOModel,
399
516
  name="facebook/webssl-dino2b-heavy2b-224",
517
+ model_type=["dense"],
400
518
  languages=["eng-Latn"],
401
519
  revision="9f46eb0c0129656a1ef195fde072e3765abdb7c6",
402
520
  release_date="2025-04-24",
@@ -409,16 +527,25 @@ webssl_dino2b_heavy2b = ModelMeta(
409
527
  open_weights=True,
410
528
  public_training_code="",
411
529
  public_training_data=None,
412
- framework=["PyTorch"],
530
+ framework=["PyTorch", "Transformers", "safetensors"],
413
531
  reference="https://huggingface.co/facebook/webssl-dino2b-heavy2b-224",
414
532
  similarity_fn_name=None,
415
533
  use_instructions=False,
416
534
  training_datasets=webssl_dino_training_datasets,
535
+ citation="""@article{fan2025scaling,
536
+ title={Scaling Language-Free Visual Representation Learning},
537
+ author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
538
+ year={2025},
539
+ eprint={2504.01017},
540
+ archivePrefix={arXiv},
541
+ primaryClass={cs.CV}
542
+ }""",
417
543
  )
418
544
 
419
545
  webssl_dino3b_light2b = ModelMeta(
420
546
  loader=DINOModel,
421
547
  name="facebook/webssl-dino3b-light2b-224",
548
+ model_type=["dense"],
422
549
  languages=["eng-Latn"],
423
550
  revision="4d0160f60673805431f4ad14983e712ed88be5b8",
424
551
  release_date="2025-04-24",
@@ -431,16 +558,25 @@ webssl_dino3b_light2b = ModelMeta(
431
558
  open_weights=True,
432
559
  public_training_code="",
433
560
  public_training_data=None,
434
- framework=["PyTorch"],
561
+ framework=["PyTorch", "Transformers", "safetensors"],
435
562
  reference="https://huggingface.co/facebook/webssl-dino3b-light2b-224",
436
563
  similarity_fn_name=None,
437
564
  use_instructions=False,
438
565
  training_datasets=webssl_dino_training_datasets,
566
+ citation="""@article{fan2025scaling,
567
+ title={Scaling Language-Free Visual Representation Learning},
568
+ author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
569
+ year={2025},
570
+ eprint={2504.01017},
571
+ archivePrefix={arXiv},
572
+ primaryClass={cs.CV}
573
+ }""",
439
574
  )
440
575
 
441
576
  webssl_dino3b_heavy2b = ModelMeta(
442
577
  loader=DINOModel,
443
578
  name="facebook/webssl-dino3b-heavy2b-224",
579
+ model_type=["dense"],
444
580
  languages=["eng-Latn"],
445
581
  revision="dd39c2910747561b332285d96c4dce0bdb240775",
446
582
  release_date="2025-04-24",
@@ -453,16 +589,25 @@ webssl_dino3b_heavy2b = ModelMeta(
453
589
  open_weights=True,
454
590
  public_training_code="",
455
591
  public_training_data=None,
456
- framework=["PyTorch"],
592
+ framework=["PyTorch", "Transformers", "safetensors"],
457
593
  reference="https://huggingface.co/facebook/webssl-dino3b-heavy2b-224",
458
594
  similarity_fn_name=None,
459
595
  use_instructions=False,
460
596
  training_datasets=webssl_dino_training_datasets,
597
+ citation="""@article{fan2025scaling,
598
+ title={Scaling Language-Free Visual Representation Learning},
599
+ author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
600
+ year={2025},
601
+ eprint={2504.01017},
602
+ archivePrefix={arXiv},
603
+ primaryClass={cs.CV}
604
+ }""",
461
605
  )
462
606
 
463
607
  webssl_mae300m_full2b = ModelMeta(
464
608
  loader=DINOModel,
465
609
  name="facebook/webssl-mae300m-full2b-224",
610
+ model_type=["dense"],
466
611
  languages=["eng-Latn"],
467
612
  revision="4655a0ac1726c206ba14d5ccb26758c62a4d03b0",
468
613
  release_date="2025-04-24",
@@ -475,16 +620,25 @@ webssl_mae300m_full2b = ModelMeta(
475
620
  open_weights=True,
476
621
  public_training_code="",
477
622
  public_training_data=None,
478
- framework=["PyTorch"],
623
+ framework=["PyTorch", "Transformers", "safetensors"],
479
624
  reference="https://huggingface.co/facebook/webssl-mae300m-full2b-224",
480
625
  similarity_fn_name=None,
481
626
  use_instructions=False,
482
627
  training_datasets=webssl_dino_training_datasets,
628
+ citation="""@article{fan2025scaling,
629
+ title={Scaling Language-Free Visual Representation Learning},
630
+ author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
631
+ year={2025},
632
+ eprint={2504.01017},
633
+ archivePrefix={arXiv},
634
+ primaryClass={cs.CV}
635
+ }""",
483
636
  )
484
637
 
485
638
  webssl_mae700m_full2b = ModelMeta(
486
639
  loader=DINOModel,
487
640
  name="facebook/webssl-mae700m-full2b-224",
641
+ model_type=["dense"],
488
642
  languages=["eng-Latn"],
489
643
  revision="c32be382e757d73a178de1ead62c27391d4b4280",
490
644
  release_date="2025-04-24",
@@ -497,16 +651,25 @@ webssl_mae700m_full2b = ModelMeta(
497
651
  open_weights=True,
498
652
  public_training_code="",
499
653
  public_training_data=None,
500
- framework=["PyTorch"],
654
+ framework=["PyTorch", "Transformers", "safetensors"],
501
655
  reference="https://huggingface.co/facebook/webssl-mae700m-full2b-224",
502
656
  similarity_fn_name=None,
503
657
  use_instructions=False,
504
658
  training_datasets=webssl_dino_training_datasets,
659
+ citation="""@article{fan2025scaling,
660
+ title={Scaling Language-Free Visual Representation Learning},
661
+ author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
662
+ year={2025},
663
+ eprint={2504.01017},
664
+ archivePrefix={arXiv},
665
+ primaryClass={cs.CV}
666
+ }""",
505
667
  )
506
668
 
507
669
  webssl_mae1b_full2b = ModelMeta(
508
670
  loader=DINOModel,
509
671
  name="facebook/webssl-mae1b-full2b-224",
672
+ model_type=["dense"],
510
673
  languages=["eng-Latn"],
511
674
  revision="5880aefedbad8db0f44d27358f6f08e8576f70fc",
512
675
  release_date="2025-04-24",
@@ -519,9 +682,17 @@ webssl_mae1b_full2b = ModelMeta(
519
682
  open_weights=True,
520
683
  public_training_code="",
521
684
  public_training_data=None,
522
- framework=["PyTorch"],
685
+ framework=["PyTorch", "Transformers", "safetensors"],
523
686
  reference="https://huggingface.co/facebook/webssl-mae1b-full2b-224",
524
687
  similarity_fn_name=None,
525
688
  use_instructions=False,
526
689
  training_datasets=webssl_dino_training_datasets,
690
+ citation="""@article{fan2025scaling,
691
+ title={Scaling Language-Free Visual Representation Learning},
692
+ author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
693
+ year={2025},
694
+ eprint={2504.01017},
695
+ archivePrefix={arXiv},
696
+ primaryClass={cs.CV}
697
+ }""",
527
698
  )
@@ -40,11 +40,19 @@ e5_instruct = ModelMeta(
40
40
  normalized=True,
41
41
  ),
42
42
  name="intfloat/multilingual-e5-large-instruct",
43
+ model_type=["dense"],
43
44
  languages=XLMR_LANGUAGES,
44
45
  open_weights=True,
45
46
  revision="baa7be480a7de1539afce709c8f13f833a510e0a",
46
47
  release_date=E5_PAPER_RELEASE_DATE,
47
- framework=["GritLM", "PyTorch", "Sentence Transformers"],
48
+ framework=[
49
+ "GritLM",
50
+ "PyTorch",
51
+ "Sentence Transformers",
52
+ "ONNX",
53
+ "safetensors",
54
+ "Transformers",
55
+ ],
48
56
  similarity_fn_name=ScoringFunction.COSINE,
49
57
  use_instructions=True,
50
58
  reference="https://huggingface.co/intfloat/multilingual-e5-large-instruct",
@@ -78,11 +86,18 @@ e5_mistral = ModelMeta(
78
86
  normalized=True,
79
87
  ),
80
88
  name="intfloat/e5-mistral-7b-instruct",
89
+ model_type=["dense"],
81
90
  languages=MISTRAL_LANGUAGES,
82
91
  open_weights=True,
83
92
  revision="07163b72af1488142a360786df853f237b1a3ca1",
84
93
  release_date=E5_PAPER_RELEASE_DATE,
85
- framework=["GritLM", "PyTorch", "Sentence Transformers"],
94
+ framework=[
95
+ "GritLM",
96
+ "PyTorch",
97
+ "Sentence Transformers",
98
+ "safetensors",
99
+ "Transformers",
100
+ ],
86
101
  similarity_fn_name=ScoringFunction.COSINE,
87
102
  use_instructions=True,
88
103
  reference="https://huggingface.co/intfloat/e5-mistral-7b-instruct",
@@ -125,6 +140,7 @@ zeta_alpha_ai__zeta_alpha_e5_mistral = ModelMeta(
125
140
  normalized=True,
126
141
  ),
127
142
  name="zeta-alpha-ai/Zeta-Alpha-E5-Mistral",
143
+ model_type=["dense"],
128
144
  revision="c791d37474fa6a5c72eb3a2522be346bc21fbfc3",
129
145
  release_date="2024-08-30",
130
146
  languages=["eng-Latn"],
@@ -136,7 +152,13 @@ zeta_alpha_ai__zeta_alpha_e5_mistral = ModelMeta(
136
152
  open_weights=True,
137
153
  public_training_data=None,
138
154
  public_training_code=None,
139
- framework=["PyTorch", "Sentence Transformers", "GritLM"],
155
+ framework=[
156
+ "PyTorch",
157
+ "Sentence Transformers",
158
+ "GritLM",
159
+ "safetensors",
160
+ "Transformers",
161
+ ],
140
162
  reference="https://huggingface.co/zeta-alpha-ai/Zeta-Alpha-E5-Mistral",
141
163
  similarity_fn_name=ScoringFunction.COSINE,
142
164
  use_instructions=True,
@@ -201,6 +223,7 @@ BeastyZ__e5_R_mistral_7b = ModelMeta(
201
223
  tokenizer_kwargs={"pad_token": "</s>"},
202
224
  ),
203
225
  name="BeastyZ/e5-R-mistral-7b",
226
+ model_type=["dense"],
204
227
  revision="3f810a6a7fd220369ad248e3705cf13d71803602",
205
228
  release_date="2024-06-28",
206
229
  languages=["eng-Latn"],
@@ -212,7 +235,7 @@ BeastyZ__e5_R_mistral_7b = ModelMeta(
212
235
  open_weights=True,
213
236
  public_training_code="https://github.com/LeeSureman/E5-Retrieval-Reproduction",
214
237
  public_training_data="https://huggingface.co/datasets/BeastyZ/E5-R",
215
- framework=["PyTorch"],
238
+ framework=["PyTorch", "Transformers", "safetensors"],
216
239
  reference="https://huggingface.co/BeastyZ/e5-R-mistral-7b",
217
240
  similarity_fn_name="cosine",
218
241
  use_instructions=True,