mteb 2.1.4__py3-none-any.whl → 2.7.2__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- mteb/__init__.py +6 -0
- mteb/_create_dataloaders.py +22 -20
- mteb/_evaluators/any_sts_evaluator.py +23 -14
- mteb/_evaluators/classification_metrics.py +54 -0
- mteb/_evaluators/clustering_evaluator.py +3 -3
- mteb/_evaluators/evaluator.py +4 -2
- mteb/_evaluators/image/imagetext_pairclassification_evaluator.py +18 -11
- mteb/_evaluators/pair_classification_evaluator.py +34 -40
- mteb/_evaluators/retrieval_evaluator.py +2 -2
- mteb/_evaluators/retrieval_metrics.py +18 -17
- mteb/_evaluators/sklearn_evaluator.py +25 -37
- mteb/_evaluators/text/bitext_mining_evaluator.py +31 -19
- mteb/_evaluators/text/summarization_evaluator.py +27 -20
- mteb/_evaluators/zeroshot_classification_evaluator.py +7 -5
- mteb/abstasks/_data_filter/__init__.py +0 -0
- mteb/abstasks/_data_filter/filters.py +125 -0
- mteb/abstasks/_data_filter/task_pipelines.py +105 -0
- mteb/abstasks/_statistics_calculation.py +23 -11
- mteb/abstasks/_stratification.py +18 -18
- mteb/abstasks/abstask.py +35 -28
- mteb/abstasks/aggregate_task_metadata.py +1 -9
- mteb/abstasks/aggregated_task.py +10 -29
- mteb/abstasks/classification.py +15 -12
- mteb/abstasks/clustering.py +20 -16
- mteb/abstasks/clustering_legacy.py +13 -10
- mteb/abstasks/image/image_text_pair_classification.py +7 -4
- mteb/abstasks/multilabel_classification.py +33 -22
- mteb/abstasks/pair_classification.py +27 -11
- mteb/abstasks/regression.py +4 -4
- mteb/abstasks/retrieval.py +28 -24
- mteb/abstasks/retrieval_dataset_loaders.py +2 -2
- mteb/abstasks/sts.py +14 -4
- mteb/abstasks/task_metadata.py +32 -33
- mteb/abstasks/text/bitext_mining.py +39 -28
- mteb/abstasks/text/reranking.py +8 -6
- mteb/abstasks/text/summarization.py +10 -5
- mteb/abstasks/zeroshot_classification.py +8 -4
- mteb/benchmarks/_create_table.py +84 -37
- mteb/benchmarks/benchmark.py +77 -16
- mteb/benchmarks/benchmarks/__init__.py +12 -0
- mteb/benchmarks/benchmarks/benchmarks.py +361 -16
- mteb/benchmarks/get_benchmark.py +14 -53
- mteb/cache.py +227 -37
- mteb/cli/_display_tasks.py +2 -2
- mteb/cli/build_cli.py +110 -14
- mteb/cli/generate_model_card.py +43 -23
- mteb/deprecated_evaluator.py +71 -62
- mteb/descriptive_stats/BitextMining/RuSciBenchBitextMining.v2.json +61 -0
- mteb/descriptive_stats/Classification/HebrewSentimentAnalysis.v3.json +60 -0
- mteb/descriptive_stats/Classification/TurkishConstitutionalCourtViolation.json +54 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/KoVidore2CybersecurityRetrieval.json +32 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/KoVidore2EconomicRetrieval.json +32 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/KoVidore2EnergyRetrieval.json +32 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/KoVidore2HrRetrieval.json +32 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3ComputerScienceRetrieval.json +214 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3EnergyRetrieval.json +214 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3FinanceEnRetrieval.json +214 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3FinanceFrRetrieval.json +214 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3HrRetrieval.json +214 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3IndustrialRetrieval.json +214 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3NuclearRetrieval.json +214 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3PharmaceuticalsRetrieval.json +214 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3PhysicsRetrieval.json +214 -0
- mteb/descriptive_stats/Image/DocumentUnderstanding/Vidore3TelecomRetrieval.json +214 -0
- mteb/descriptive_stats/PairClassification/TERRa.V2.json +35 -0
- mteb/descriptive_stats/Reranking/JQaRARerankingLite.json +35 -0
- mteb/descriptive_stats/Reranking/JaCWIRRerankingLite.json +35 -0
- mteb/descriptive_stats/Reranking/MultiLongDocReranking.json +466 -0
- mteb/descriptive_stats/Retrieval/ArguAna-NL.v2.json +30 -0
- mteb/descriptive_stats/Retrieval/ChemRxivRetrieval.json +30 -0
- mteb/descriptive_stats/Retrieval/EuroPIRQRetrieval.json +116 -0
- mteb/descriptive_stats/Retrieval/JaCWIRRetrievalLite.json +30 -0
- mteb/descriptive_stats/Retrieval/JaqketRetrievalLite.json +30 -0
- mteb/descriptive_stats/Retrieval/MIRACLJaRetrievalLite.json +30 -0
- mteb/descriptive_stats/Retrieval/MrTyDiJaRetrievalLite.json +30 -0
- mteb/descriptive_stats/Retrieval/NFCorpus-NL.v2.json +30 -0
- mteb/descriptive_stats/Retrieval/NanoClimateFEVER-VN.json +30 -0
- mteb/descriptive_stats/Retrieval/NanoDBPedia-VN.json +30 -0
- mteb/descriptive_stats/Retrieval/NanoFEVER-VN.json +30 -0
- mteb/descriptive_stats/Retrieval/NanoHotpotQA-VN.json +30 -0
- mteb/descriptive_stats/Retrieval/NanoMSMARCO-VN.json +30 -0
- mteb/descriptive_stats/Retrieval/NanoNQ-VN.json +30 -0
- mteb/descriptive_stats/Retrieval/SCIDOCS-NL.v2.json +30 -0
- mteb/descriptive_stats/Retrieval/SQuADKorV1Retrieval.json +30 -0
- mteb/descriptive_stats/Retrieval/SciFact-NL.v2.json +30 -0
- mteb/descriptive_stats/Retrieval/TVPLRetrieval.json +30 -0
- mteb/evaluate.py +106 -75
- mteb/filter_tasks.py +25 -26
- mteb/get_tasks.py +29 -30
- mteb/languages/language_scripts.py +5 -3
- mteb/leaderboard/app.py +414 -151
- mteb/leaderboard/benchmark_selector.py +14 -5
- mteb/leaderboard/figures.py +13 -15
- mteb/leaderboard/table.py +82 -17
- mteb/load_results.py +12 -12
- mteb/models/__init__.py +4 -1
- mteb/models/abs_encoder.py +31 -23
- mteb/models/cache_wrappers/__init__.py +2 -1
- mteb/models/cache_wrappers/cache_backend_protocol.py +3 -5
- mteb/models/cache_wrappers/cache_backends/_hash_utils.py +7 -6
- mteb/models/cache_wrappers/cache_backends/faiss_cache.py +6 -2
- mteb/models/cache_wrappers/cache_backends/numpy_cache.py +43 -25
- mteb/models/cache_wrappers/cache_wrapper.py +3 -3
- mteb/models/get_model_meta.py +25 -118
- mteb/models/instruct_wrapper.py +33 -9
- mteb/models/model_implementations/align_models.py +8 -1
- mteb/models/model_implementations/amazon_models.py +1 -0
- mteb/models/model_implementations/andersborges.py +65 -0
- mteb/models/model_implementations/ara_models.py +9 -1
- mteb/models/model_implementations/arctic_models.py +16 -8
- mteb/models/model_implementations/b1ade_models.py +2 -1
- mteb/models/model_implementations/bedrock_models.py +4 -0
- mteb/models/model_implementations/bge_models.py +101 -17
- mteb/models/model_implementations/bica_model.py +35 -0
- mteb/models/model_implementations/blip2_models.py +13 -2
- mteb/models/model_implementations/blip_models.py +43 -16
- mteb/models/model_implementations/bm25.py +5 -4
- mteb/models/model_implementations/bmretriever_models.py +10 -4
- mteb/models/model_implementations/cadet_models.py +10 -1
- mteb/models/model_implementations/cde_models.py +25 -4
- mteb/models/model_implementations/clip_models.py +9 -6
- mteb/models/model_implementations/clips_models.py +100 -0
- mteb/models/model_implementations/codefuse_models.py +165 -3
- mteb/models/model_implementations/codesage_models.py +18 -3
- mteb/models/model_implementations/cohere_models.py +13 -6
- mteb/models/model_implementations/cohere_v.py +7 -2
- mteb/models/model_implementations/colpali_models.py +17 -9
- mteb/models/model_implementations/colqwen_models.py +275 -5
- mteb/models/model_implementations/colsmol_models.py +4 -2
- mteb/models/model_implementations/conan_models.py +2 -1
- mteb/models/model_implementations/dino_models.py +194 -23
- mteb/models/model_implementations/e5_instruct.py +27 -4
- mteb/models/model_implementations/e5_models.py +21 -110
- mteb/models/model_implementations/e5_v.py +7 -6
- mteb/models/model_implementations/eagerworks_models.py +164 -0
- mteb/models/model_implementations/emillykkejensen_models.py +91 -0
- mteb/models/model_implementations/en_code_retriever.py +2 -1
- mteb/models/model_implementations/euler_models.py +32 -0
- mteb/models/model_implementations/evaclip_models.py +4 -0
- mteb/models/model_implementations/fa_models.py +67 -9
- mteb/models/model_implementations/facebookai.py +205 -0
- mteb/models/model_implementations/geogpt_models.py +2 -1
- mteb/models/model_implementations/gme_v_models.py +17 -10
- mteb/models/model_implementations/google_models.py +17 -6
- mteb/models/model_implementations/granite_vision_embedding_models.py +8 -3
- mteb/models/model_implementations/gritlm_models.py +4 -2
- mteb/models/model_implementations/gte_models.py +99 -9
- mteb/models/model_implementations/hinvec_models.py +2 -1
- mteb/models/model_implementations/human.py +1 -0
- mteb/models/model_implementations/ibm_granite_models.py +36 -6
- mteb/models/model_implementations/inf_models.py +4 -2
- mteb/models/model_implementations/jasper_models.py +256 -3
- mteb/models/model_implementations/jina_clip.py +49 -10
- mteb/models/model_implementations/jina_models.py +222 -11
- mteb/models/model_implementations/kalm_models.py +203 -25
- mteb/models/model_implementations/kblab.py +37 -0
- mteb/models/model_implementations/kennethenevoldsen_models.py +74 -0
- mteb/models/model_implementations/kfst.py +25 -0
- mteb/models/model_implementations/kowshik24_models.py +32 -0
- mteb/models/model_implementations/lens_models.py +2 -0
- mteb/models/model_implementations/lgai_embedding_models.py +2 -1
- mteb/models/model_implementations/linq_models.py +4 -3
- mteb/models/model_implementations/listconranker.py +2 -2
- mteb/models/model_implementations/llm2clip_models.py +9 -6
- mteb/models/model_implementations/llm2vec_models.py +16 -8
- mteb/models/model_implementations/mcinext_models.py +7 -1
- mteb/models/model_implementations/mdbr_models.py +19 -3
- mteb/models/model_implementations/misc_models.py +422 -60
- mteb/models/model_implementations/mixedbread_ai_models.py +332 -0
- mteb/models/model_implementations/mme5_models.py +2 -1
- mteb/models/model_implementations/moco_models.py +15 -4
- mteb/models/model_implementations/mod_models.py +191 -0
- mteb/models/model_implementations/model2vec_models.py +27 -14
- mteb/models/model_implementations/moka_models.py +4 -1
- mteb/models/model_implementations/nbailab.py +70 -0
- mteb/models/model_implementations/no_instruct_sentence_models.py +3 -2
- mteb/models/model_implementations/nomic_models.py +173 -6
- mteb/models/model_implementations/nomic_models_vision.py +8 -3
- mteb/models/model_implementations/nvidia_llama_nemoretriever_colemb.py +32 -19
- mteb/models/model_implementations/nvidia_models.py +155 -20
- mteb/models/model_implementations/octen_models.py +254 -0
- mteb/models/model_implementations/openai_models.py +20 -16
- mteb/models/model_implementations/openclip_models.py +37 -13
- mteb/models/model_implementations/opensearch_neural_sparse_models.py +10 -5
- mteb/models/model_implementations/ops_moa_models.py +5 -3
- mteb/models/model_implementations/ordalietech_solon_embeddings_mini_beta_1_1.py +1 -1
- mteb/models/model_implementations/pawan_models.py +39 -0
- mteb/models/model_implementations/piccolo_models.py +9 -1
- mteb/models/model_implementations/pixie_models.py +56 -0
- mteb/models/model_implementations/promptriever_models.py +12 -8
- mteb/models/model_implementations/pylate_models.py +46 -12
- mteb/models/model_implementations/qodo_models.py +4 -2
- mteb/models/model_implementations/qtack_models.py +2 -1
- mteb/models/model_implementations/qwen3_models.py +9 -6
- mteb/models/model_implementations/qzhou_models.py +5 -3
- mteb/models/model_implementations/random_baseline.py +19 -24
- mteb/models/model_implementations/rasgaard_models.py +34 -0
- mteb/models/model_implementations/reasonir_model.py +2 -1
- mteb/models/model_implementations/repllama_models.py +5 -3
- mteb/models/model_implementations/rerankers_custom.py +15 -9
- mteb/models/model_implementations/rerankers_monot5_based.py +31 -31
- mteb/models/model_implementations/richinfoai_models.py +2 -1
- mteb/models/model_implementations/ru_sentence_models.py +71 -20
- mteb/models/model_implementations/ruri_models.py +322 -0
- mteb/models/model_implementations/salesforce_models.py +6 -3
- mteb/models/model_implementations/samilpwc_models.py +2 -1
- mteb/models/model_implementations/sarashina_embedding_models.py +168 -0
- mteb/models/model_implementations/searchmap_models.py +2 -1
- mteb/models/model_implementations/seed_1_6_embedding_models.py +8 -2
- mteb/models/model_implementations/seed_1_6_embedding_models_1215.py +625 -0
- mteb/models/model_implementations/seed_models.py +1 -0
- mteb/models/model_implementations/sentence_transformers_models.py +177 -18
- mteb/models/model_implementations/shuu_model.py +32 -31
- mteb/models/model_implementations/siglip_models.py +30 -20
- mteb/models/model_implementations/slm_models.py +416 -0
- mteb/models/model_implementations/sonar_models.py +1 -0
- mteb/models/model_implementations/spartan8806_atles_champion.py +34 -0
- mteb/models/model_implementations/stella_models.py +23 -4
- mteb/models/model_implementations/tarka_models.py +376 -0
- mteb/models/model_implementations/text2vec_models.py +9 -3
- mteb/models/model_implementations/ua_sentence_models.py +11 -1
- mteb/models/model_implementations/uae_models.py +8 -1
- mteb/models/model_implementations/vdr_models.py +3 -1
- mteb/models/model_implementations/vi_vn_models.py +45 -6
- mteb/models/model_implementations/vista_models.py +2 -0
- mteb/models/model_implementations/vlm2vec_models.py +5 -3
- mteb/models/model_implementations/voyage_models.py +99 -0
- mteb/models/model_implementations/voyage_v.py +17 -9
- mteb/models/model_implementations/xyz_models.py +1 -0
- mteb/models/model_implementations/youtu_models.py +2 -1
- mteb/models/model_implementations/yuan_models.py +34 -0
- mteb/models/model_implementations/yuan_models_en.py +58 -0
- mteb/models/model_meta.py +498 -29
- mteb/models/models_protocols.py +22 -6
- mteb/models/search_encoder_index/__init__.py +7 -0
- mteb/models/search_encoder_index/search_backend_protocol.py +50 -0
- mteb/models/search_encoder_index/search_indexes/__init__.py +5 -0
- mteb/models/search_encoder_index/search_indexes/faiss_search_index.py +160 -0
- mteb/models/search_wrappers.py +197 -65
- mteb/models/sentence_transformer_wrapper.py +52 -32
- mteb/models/vllm_wrapper.py +327 -0
- mteb/py.typed +0 -0
- mteb/results/benchmark_results.py +114 -65
- mteb/results/model_result.py +63 -26
- mteb/results/task_result.py +117 -77
- mteb/similarity_functions.py +60 -7
- mteb/tasks/bitext_mining/multilingual/__init__.py +2 -1
- mteb/tasks/bitext_mining/multilingual/bucc_bitext_mining.py +4 -2
- mteb/tasks/bitext_mining/multilingual/bucc_bitext_mining_fast.py +1 -1
- mteb/tasks/bitext_mining/multilingual/ru_sci_bench_bitext_mining.py +47 -5
- mteb/tasks/bitext_mining/multilingual/web_faq_bitext_mining.py +2 -6
- mteb/tasks/classification/ara/ajgt.py +1 -2
- mteb/tasks/classification/ara/hotel_review_sentiment_classification.py +1 -2
- mteb/tasks/classification/ara/online_store_review_sentiment_classification.py +1 -2
- mteb/tasks/classification/ara/restaurant_review_sentiment_classification.py +1 -2
- mteb/tasks/classification/ara/tweet_emotion_classification.py +1 -2
- mteb/tasks/classification/ara/tweet_sarcasm_classification.py +1 -2
- mteb/tasks/classification/ben/bengali_document_classification.py +1 -2
- mteb/tasks/classification/ben/bengali_hate_speech_classification.py +1 -2
- mteb/tasks/classification/ben/bengali_sentiment_analysis.py +1 -2
- mteb/tasks/classification/ces/csfdcz_movie_review_sentiment_classification.py +1 -2
- mteb/tasks/classification/ces/czech_product_review_sentiment_classification.py +1 -2
- mteb/tasks/classification/ces/czech_so_me_sentiment_classification.py +1 -2
- mteb/tasks/classification/dan/angry_tweets_classification.py +1 -2
- mteb/tasks/classification/dan/danish_political_comments_classification.py +1 -2
- mteb/tasks/classification/dan/ddisco_cohesion_classification.py +1 -2
- mteb/tasks/classification/dan/dk_hate_classification.py +2 -3
- mteb/tasks/classification/deu/german_politicians_twitter_sentiment_classification.py +1 -2
- mteb/tasks/classification/deu/ten_k_gnad_classification.py +1 -2
- mteb/tasks/classification/eng/amazon_polarity_classification.py +1 -2
- mteb/tasks/classification/eng/arxiv_classification.py +1 -2
- mteb/tasks/classification/eng/banking77_classification.py +1 -2
- mteb/tasks/classification/eng/dbpedia_classification.py +1 -2
- mteb/tasks/classification/eng/emotion_classification.py +1 -2
- mteb/tasks/classification/eng/financial_phrasebank_classification.py +1 -2
- mteb/tasks/classification/eng/frenk_en_classification.py +1 -2
- mteb/tasks/classification/eng/gtsrb_classification.py +1 -1
- mteb/tasks/classification/eng/imdb_classification.py +1 -2
- mteb/tasks/classification/eng/legal_bench_classification.py +14 -120
- mteb/tasks/classification/eng/news_classification.py +1 -2
- mteb/tasks/classification/eng/patch_camelyon_classification.py +1 -1
- mteb/tasks/classification/eng/patent_classification.py +1 -2
- mteb/tasks/classification/eng/poem_sentiment_classification.py +1 -2
- mteb/tasks/classification/eng/sds_eye_protection_classification.py +1 -2
- mteb/tasks/classification/eng/sds_gloves_classification.py +1 -2
- mteb/tasks/classification/eng/toxic_chat_classification.py +2 -19
- mteb/tasks/classification/eng/toxic_conversations_classification.py +1 -2
- mteb/tasks/classification/eng/tweet_sentiment_extraction_classification.py +1 -2
- mteb/tasks/classification/eng/tweet_topic_single_classification.py +2 -13
- mteb/tasks/classification/eng/ucf101_classification.py +1 -5
- mteb/tasks/classification/eng/wikipedia_bio_met_chem_classification.py +1 -2
- mteb/tasks/classification/eng/wikipedia_chem_fields_classification.py +1 -2
- mteb/tasks/classification/eng/wikipedia_comp_chem_spectroscopy_classification.py +1 -2
- mteb/tasks/classification/eng/wikipedia_crystallography_analytical_classification.py +1 -2
- mteb/tasks/classification/eng/wikipedia_theoretical_applied_classification.py +1 -2
- mteb/tasks/classification/eng/yahoo_answers_topics_classification.py +1 -2
- mteb/tasks/classification/eng/yelp_review_full_classification.py +1 -2
- mteb/tasks/classification/est/estonian_valence.py +2 -3
- mteb/tasks/classification/fas/fa_mteb_classification.py +7 -14
- mteb/tasks/classification/fil/filipino_hate_speech_classification.py +1 -2
- mteb/tasks/classification/fin/fin_toxicity_classification.py +2 -11
- mteb/tasks/classification/fra/french_book_reviews.py +1 -2
- mteb/tasks/classification/fra/movie_review_sentiment_classification.py +1 -2
- mteb/tasks/classification/guj/gujarati_news_classification.py +1 -2
- mteb/tasks/classification/heb/__init__.py +6 -1
- mteb/tasks/classification/heb/hebrew_sentiment_analysis.py +62 -4
- mteb/tasks/classification/hin/hindi_discourse_classification.py +1 -2
- mteb/tasks/classification/hin/sentiment_analysis_hindi.py +1 -2
- mteb/tasks/classification/hrv/frenk_hr_classification.py +1 -2
- mteb/tasks/classification/ind/indonesian_id_clickbait_classification.py +1 -2
- mteb/tasks/classification/ind/indonesian_mongabay_conservation_classification.py +1 -2
- mteb/tasks/classification/ita/italian_linguist_acceptability_classification.py +1 -2
- mteb/tasks/classification/jav/javanese_imdb_classification.py +1 -2
- mteb/tasks/classification/jpn/wrime_classification.py +1 -2
- mteb/tasks/classification/kan/kannada_news_classification.py +1 -2
- mteb/tasks/classification/kor/klue_tc.py +1 -2
- mteb/tasks/classification/kor/kor_hate_classification.py +2 -17
- mteb/tasks/classification/kor/kor_sarcasm_classification.py +2 -19
- mteb/tasks/classification/kur/kurdish_sentiment_classification.py +3 -4
- mteb/tasks/classification/mal/malayalam_news_classification.py +1 -2
- mteb/tasks/classification/mar/marathi_news_classification.py +1 -2
- mteb/tasks/classification/mkd/macedonian_tweet_sentiment_classification.py +1 -2
- mteb/tasks/classification/multilingual/catalonia_tweet_classification.py +1 -6
- mteb/tasks/classification/multilingual/multi_hate_classification.py +1 -4
- mteb/tasks/classification/multilingual/ru_sci_bench_classification.py +4 -23
- mteb/tasks/classification/multilingual/scala_classification.py +2 -3
- mteb/tasks/classification/multilingual/sib200_classification.py +1 -6
- mteb/tasks/classification/mya/myanmar_news.py +1 -2
- mteb/tasks/classification/nep/nepali_news_classification.py +1 -2
- mteb/tasks/classification/nld/dutch_book_review_sentiment_classification.py +4 -2
- mteb/tasks/classification/nld/dutch_cola_classification.py +3 -0
- mteb/tasks/classification/nld/dutch_government_bias_classification.py +3 -0
- mteb/tasks/classification/nld/dutch_news_articles_classification.py +3 -0
- mteb/tasks/classification/nld/dutch_sarcastic_headlines_classification.py +3 -0
- mteb/tasks/classification/nld/iconclass_classification.py +3 -0
- mteb/tasks/classification/nld/open_tender_classification.py +3 -0
- mteb/tasks/classification/nld/vaccin_chat_nl_classification.py +3 -0
- mteb/tasks/classification/nob/no_rec_classification.py +1 -2
- mteb/tasks/classification/nob/norwegian_parliament_classification.py +1 -2
- mteb/tasks/classification/ory/odia_news_classification.py +1 -2
- mteb/tasks/classification/pol/polish_classification.py +3 -6
- mteb/tasks/classification/ron/moroco.py +1 -2
- mteb/tasks/classification/ron/romanian_reviews_sentiment.py +1 -2
- mteb/tasks/classification/ron/romanian_sentiment_classification.py +1 -2
- mteb/tasks/classification/rus/georeview_classification.py +1 -2
- mteb/tasks/classification/rus/headline_classification.py +1 -2
- mteb/tasks/classification/rus/inappropriateness_classification.py +1 -2
- mteb/tasks/classification/rus/ru_reviews_classification.py +1 -2
- mteb/tasks/classification/rus/ru_toixic_classification_okmlcup.py +1 -2
- mteb/tasks/classification/rus/senti_ru_eval.py +1 -2
- mteb/tasks/classification/sin/sinhala_news_classification.py +1 -2
- mteb/tasks/classification/sin/sinhala_news_source_classification.py +1 -2
- mteb/tasks/classification/slk/csfdsk_movie_review_sentiment_classification.py +1 -2
- mteb/tasks/classification/slk/slovak_hate_speech_classification.py +1 -2
- mteb/tasks/classification/slk/slovak_movie_review_sentiment_classification.py +1 -2
- mteb/tasks/classification/slv/frenk_sl_classification.py +1 -2
- mteb/tasks/classification/spa/spanish_news_classification.py +1 -2
- mteb/tasks/classification/spa/spanish_sentiment_classification.py +1 -2
- mteb/tasks/classification/ssw/siswati_news_classification.py +1 -2
- mteb/tasks/classification/swa/swahili_news_classification.py +1 -2
- mteb/tasks/classification/swe/dalaj_classification.py +1 -2
- mteb/tasks/classification/swe/swe_rec_classification.py +1 -2
- mteb/tasks/classification/swe/swedish_sentiment_classification.py +1 -2
- mteb/tasks/classification/tam/tamil_news_classification.py +1 -2
- mteb/tasks/classification/tel/telugu_andhra_jyoti_news_classification.py +1 -2
- mteb/tasks/classification/tha/wisesight_sentiment_classification.py +1 -2
- mteb/tasks/classification/tsn/tswana_news_classification.py +1 -2
- mteb/tasks/classification/tur/__init__.py +4 -0
- mteb/tasks/classification/tur/turkish_constitutional_court.py +41 -0
- mteb/tasks/classification/tur/turkish_movie_sentiment_classification.py +1 -2
- mteb/tasks/classification/tur/turkish_product_sentiment_classification.py +1 -2
- mteb/tasks/classification/ukr/ukr_formality_classification.py +2 -15
- mteb/tasks/classification/urd/urdu_roman_sentiment_classification.py +1 -2
- mteb/tasks/classification/vie/amazon_counterfactual_vn_classification.py +1 -6
- mteb/tasks/classification/vie/amazon_polarity_vn_classification.py +1 -6
- mteb/tasks/classification/vie/amazon_reviews_vn_classification.py +1 -5
- mteb/tasks/classification/vie/banking77_vn_classification.py +1 -5
- mteb/tasks/classification/vie/emotion_vn_classification.py +1 -5
- mteb/tasks/classification/vie/imdb_vn_classification.py +1 -5
- mteb/tasks/classification/vie/massive_intent_vn_classification.py +1 -5
- mteb/tasks/classification/vie/massive_scenario_vn_classification.py +1 -5
- mteb/tasks/classification/vie/mtop_domain_vn_classification.py +1 -5
- mteb/tasks/classification/vie/mtop_intent_vn_classification.py +1 -5
- mteb/tasks/classification/vie/toxic_conversations_vn_classification.py +1 -5
- mteb/tasks/classification/vie/tweet_sentiment_extraction_vn_classification.py +1 -5
- mteb/tasks/classification/vie/vie_student_feedback_classification.py +1 -2
- mteb/tasks/classification/zho/cmteb_classification.py +5 -10
- mteb/tasks/classification/zho/yue_openrice_review_classification.py +1 -2
- mteb/tasks/classification/zul/isi_zulu_news_classification.py +1 -2
- mteb/tasks/clustering/eng/hume_wiki_cities_clustering.py +1 -1
- mteb/tasks/clustering/eng/wiki_cities_clustering.py +1 -1
- mteb/tasks/clustering/jpn/mews_c16_ja_clustering.py +1 -3
- mteb/tasks/clustering/multilingual/sib200_clustering_s2s.py +1 -6
- mteb/tasks/clustering/nld/dutch_news_articles_clustering_p2p.py +3 -0
- mteb/tasks/clustering/nld/dutch_news_articles_clustering_s2s.py +3 -0
- mteb/tasks/clustering/nld/iconclass_clustering_s2s.py +3 -0
- mteb/tasks/clustering/nld/open_tender_clustering_p2p.py +3 -0
- mteb/tasks/clustering/nld/open_tender_clustering_s2s.py +3 -0
- mteb/tasks/clustering/nld/vabb_clustering_p2p.py +3 -0
- mteb/tasks/clustering/nld/vabb_clustering_s2s.py +3 -0
- mteb/tasks/clustering/vie/reddit_clustering_p2p_vn.py +1 -5
- mteb/tasks/clustering/vie/reddit_clustering_vn.py +1 -5
- mteb/tasks/clustering/vie/stack_exchange_clustering_p2p_vn.py +1 -5
- mteb/tasks/clustering/vie/stack_exchange_clustering_vn.py +1 -5
- mteb/tasks/clustering/vie/twenty_newsgroups_clustering_vn.py +1 -5
- mteb/tasks/clustering/zho/cmteb_clustering.py +2 -2
- mteb/tasks/image_text_pair_classification/eng/sugar_crepe.py +1 -1
- mteb/tasks/multilabel_classification/ita/emit_classification.py +1 -5
- mteb/tasks/multilabel_classification/kor/kor_hate_speech_ml_classification.py +1 -9
- mteb/tasks/multilabel_classification/mlt/maltese_news_classification.py +1 -6
- mteb/tasks/multilabel_classification/nld/covid_disinformation_nl_multi_label_classification.py +3 -0
- mteb/tasks/multilabel_classification/nld/vabb_multi_label_classification.py +3 -0
- mteb/tasks/multilabel_classification/por/brazilian_toxic_tweets_classification.py +1 -6
- mteb/tasks/multilabel_classification/swe/swedish_patent_cpc_group_classification.py +1 -1
- mteb/tasks/multilabel_classification/swe/swedish_patent_cpc_subclass_classification.py +1 -2
- mteb/tasks/pair_classification/dan/talemaader_pc.py +1 -6
- mteb/tasks/pair_classification/eng/legal_bench_pc.py +1 -9
- mteb/tasks/pair_classification/nld/sick_nl_pair_classification.py +3 -0
- mteb/tasks/pair_classification/nld/xlwic_nl_pair_classification.py +3 -0
- mteb/tasks/pair_classification/rus/__init__.py +2 -2
- mteb/tasks/pair_classification/rus/terra.py +51 -25
- mteb/tasks/pair_classification/vie/sprint_duplicate_questions_pcvn.py +1 -5
- mteb/tasks/pair_classification/vie/twitter_sem_eval2015_pcvn.py +1 -5
- mteb/tasks/pair_classification/vie/twitter_url_corpus_pcvn.py +1 -5
- mteb/tasks/regression/multilingual/ru_sci_bench_regression.py +2 -6
- mteb/tasks/reranking/jpn/__init__.py +9 -1
- mteb/tasks/reranking/jpn/j_qa_ra_reranking_lite.py +49 -0
- mteb/tasks/reranking/jpn/ja_cwir_reranking_lite.py +47 -0
- mteb/tasks/reranking/multilingual/__init__.py +2 -0
- mteb/tasks/reranking/multilingual/multi_long_doc_reranking.py +70 -0
- mteb/tasks/reranking/multilingual/wikipedia_reranking_multilingual.py +1 -1
- mteb/tasks/reranking/multilingual/x_glue_wpr_reranking.py +1 -2
- mteb/tasks/reranking/vie/ask_ubuntu_dup_questions_vn.py +1 -5
- mteb/tasks/reranking/vie/sci_docs_reranking_vn.py +1 -5
- mteb/tasks/reranking/vie/stack_overflow_dup_questions_vn.py +1 -5
- mteb/tasks/retrieval/code/code_rag.py +12 -12
- mteb/tasks/retrieval/code/fresh_stack_retrieval.py +8 -5
- mteb/tasks/retrieval/dan/dan_fever_retrieval.py +1 -1
- mteb/tasks/retrieval/dan/tv2_nordretrieval.py +2 -2
- mteb/tasks/retrieval/dan/twitter_hjerne_retrieval.py +2 -2
- mteb/tasks/retrieval/eng/__init__.py +2 -0
- mteb/tasks/retrieval/eng/chemrxiv.py +33 -0
- mteb/tasks/retrieval/eng/cub200_i2i_retrieval.py +1 -1
- mteb/tasks/retrieval/eng/lit_search_retrieval.py +1 -8
- mteb/tasks/retrieval/eng/vidore_bench_retrieval.py +4 -0
- mteb/tasks/retrieval/jpn/__init__.py +8 -0
- mteb/tasks/retrieval/jpn/ja_cwir_retrieval.py +1 -4
- mteb/tasks/retrieval/jpn/ja_cwir_retrieval_lite.py +47 -0
- mteb/tasks/retrieval/jpn/jaqket_retrieval_lite.py +50 -0
- mteb/tasks/retrieval/jpn/miracl_ja_retrieval_lite.py +52 -0
- mteb/tasks/retrieval/jpn/mr_tydi_ja_retrieval_lite.py +48 -0
- mteb/tasks/retrieval/kat/georgian_faq_retrieval.py +11 -4
- mteb/tasks/retrieval/kor/__init__.py +16 -1
- mteb/tasks/retrieval/kor/kovidore2_bench_retrieval.py +142 -0
- mteb/tasks/retrieval/kor/squad_kor_v1_retrieval.py +47 -0
- mteb/tasks/retrieval/multilingual/__init__.py +24 -0
- mteb/tasks/retrieval/multilingual/belebele_retrieval.py +5 -4
- mteb/tasks/retrieval/multilingual/euro_pirq_retrieval.py +43 -0
- mteb/tasks/retrieval/multilingual/jina_vdr_bench_retrieval.py +56 -42
- mteb/tasks/retrieval/multilingual/mkqa_retrieval.py +1 -2
- mteb/tasks/retrieval/multilingual/mlqa_retrieval.py +1 -4
- mteb/tasks/retrieval/multilingual/multi_long_doc_retrieval.py +1 -2
- mteb/tasks/retrieval/multilingual/public_health_qa_retrieval.py +9 -4
- mteb/tasks/retrieval/multilingual/ru_sci_bench_retrieval.py +2 -12
- mteb/tasks/retrieval/multilingual/vidore2_bench_retrieval.py +4 -2
- mteb/tasks/retrieval/multilingual/vidore3_bench_retrieval.py +389 -0
- mteb/tasks/retrieval/nld/__init__.py +8 -4
- mteb/tasks/retrieval/nld/argu_ana_nl_retrieval.py +46 -27
- mteb/tasks/retrieval/nld/bbsard_nl_retrieval.py +3 -0
- mteb/tasks/retrieval/nld/dutch_news_articles_retrieval.py +3 -0
- mteb/tasks/retrieval/nld/legal_qa_nl_retrieval.py +3 -0
- mteb/tasks/retrieval/nld/nf_corpus_nl_retrieval.py +42 -25
- mteb/tasks/retrieval/nld/open_tender_retrieval.py +3 -0
- mteb/tasks/retrieval/nld/sci_fact_nl_retrieval.py +42 -24
- mteb/tasks/retrieval/nld/scidocsnl_retrieval.py +44 -27
- mteb/tasks/retrieval/nld/vabb_retrieval.py +3 -0
- mteb/tasks/retrieval/nob/norquad.py +2 -2
- mteb/tasks/retrieval/nob/snl_retrieval.py +2 -2
- mteb/tasks/retrieval/slk/slovak_sum_retrieval.py +1 -7
- mteb/tasks/retrieval/tur/tur_hist_quad.py +1 -1
- mteb/tasks/retrieval/vie/__init__.py +14 -6
- mteb/tasks/retrieval/vie/argu_ana_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/climate_fevervn_retrieval.py +40 -5
- mteb/tasks/retrieval/vie/cqa_dupstack_android_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/cqa_dupstack_gis_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/cqa_dupstack_mathematica_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/cqa_dupstack_physics_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/cqa_dupstack_programmers_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/cqa_dupstack_stats_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/cqa_dupstack_tex_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/cqa_dupstack_unix_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/cqa_dupstack_webmasters_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/cqa_dupstack_wordpress_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/db_pedia_vn_retrieval.py +40 -5
- mteb/tasks/retrieval/vie/fevervn_retrieval.py +40 -7
- mteb/tasks/retrieval/vie/fi_qa2018_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/green_node_table_markdown_retrieval.py +16 -1
- mteb/tasks/retrieval/vie/hotpot_qavn_retrieval.py +40 -6
- mteb/tasks/retrieval/vie/msmarcovn_retrieval.py +49 -5
- mteb/tasks/retrieval/vie/nf_corpus_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/nqvn_retrieval.py +40 -5
- mteb/tasks/retrieval/vie/quora_vn_retrieval.py +1 -6
- mteb/tasks/retrieval/vie/sci_fact_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/scidocsvn_retrieval.py +1 -6
- mteb/tasks/retrieval/vie/touche2020_vn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/treccovidvn_retrieval.py +1 -5
- mteb/tasks/retrieval/vie/tvpl_retrieval.py +42 -0
- mteb/tasks/retrieval/vie/zac_legal_text_retrieval.py +15 -1
- mteb/tasks/sts/nld/sick_nl_sts.py +1 -0
- mteb/tasks/sts/vie/biosses_stsvn.py +1 -5
- mteb/tasks/sts/vie/sickr_stsvn.py +1 -5
- mteb/tasks/sts/vie/sts_benchmark_stsvn.py +1 -5
- mteb/tasks/zeroshot_classification/eng/gtsrb.py +1 -1
- mteb/tasks/zeroshot_classification/eng/patch_camelyon.py +1 -1
- mteb/tasks/zeroshot_classification/eng/ucf101.py +1 -5
- mteb/types/__init__.py +2 -0
- mteb/types/_encoder_io.py +19 -2
- mteb/types/_result.py +2 -1
- mteb/types/statistics.py +9 -3
- {mteb-2.1.4.dist-info → mteb-2.7.2.dist-info}/METADATA +25 -8
- {mteb-2.1.4.dist-info → mteb-2.7.2.dist-info}/RECORD +525 -438
- mteb/models/model_implementations/mxbai_models.py +0 -102
- mteb/models/model_implementations/nb_sbert.py +0 -25
- {mteb-2.1.4.dist-info → mteb-2.7.2.dist-info}/WHEEL +0 -0
- {mteb-2.1.4.dist-info → mteb-2.7.2.dist-info}/entry_points.txt +0 -0
- {mteb-2.1.4.dist-info → mteb-2.7.2.dist-info}/licenses/LICENSE +0 -0
- {mteb-2.1.4.dist-info → mteb-2.7.2.dist-info}/top_level.txt +0 -0
|
@@ -104,8 +104,9 @@ dinov2_training_datasets = set(
|
|
|
104
104
|
|
|
105
105
|
|
|
106
106
|
dinov2_small = ModelMeta(
|
|
107
|
-
loader=DINOModel,
|
|
107
|
+
loader=DINOModel,
|
|
108
108
|
name="facebook/dinov2-small",
|
|
109
|
+
model_type=["dense"],
|
|
109
110
|
languages=["eng-Latn"],
|
|
110
111
|
revision="ed25f3a31f01632728cabb09d1542f84ab7b0056",
|
|
111
112
|
release_date="2023-07-18",
|
|
@@ -118,16 +119,25 @@ dinov2_small = ModelMeta(
|
|
|
118
119
|
open_weights=True,
|
|
119
120
|
public_training_code="https://github.com/facebookresearch/dinov2",
|
|
120
121
|
public_training_data=None,
|
|
121
|
-
framework=["PyTorch"],
|
|
122
|
+
framework=["PyTorch", "Transformers", "safetensors"],
|
|
122
123
|
reference="https://huggingface.co/facebook/dinov2-small",
|
|
123
124
|
similarity_fn_name=ScoringFunction.COSINE,
|
|
124
125
|
use_instructions=False,
|
|
125
126
|
training_datasets=dinov2_training_datasets,
|
|
127
|
+
citation="""@misc{oquab2023dinov2,
|
|
128
|
+
title={DINOv2: Learning Robust Visual Features without Supervision},
|
|
129
|
+
author={Maxime Oquab and Timothée Darcet and Théo Moutakanni and Huy Vo and Marc Szafraniec and Vasil Khalidov and Pierre Fernandez and Daniel Haziza and Francisco Massa and Alaaeldin El-Nouby and Mahmoud Assran and Nicolas Ballas and Wojciech Galuba and Russell Howes and Po-Yao Huang and Shang-Wen Li and Ishan Misra and Michael Rabbat and Vasu Sharma and Gabriel Synnaeve and Hu Xu and Hervé Jegou and Julien Mairal and Patrick Labatut and Armand Joulin and Piotr Bojanowski},
|
|
130
|
+
year={2023},
|
|
131
|
+
eprint={2304.07193},
|
|
132
|
+
archivePrefix={arXiv},
|
|
133
|
+
primaryClass={cs.CV}
|
|
134
|
+
}""",
|
|
126
135
|
)
|
|
127
136
|
|
|
128
137
|
dinov2_base = ModelMeta(
|
|
129
|
-
loader=DINOModel,
|
|
138
|
+
loader=DINOModel,
|
|
130
139
|
name="facebook/dinov2-base",
|
|
140
|
+
model_type=["dense"],
|
|
131
141
|
languages=["eng-Latn"],
|
|
132
142
|
revision="f9e44c814b77203eaa57a6bdbbd535f21ede1415",
|
|
133
143
|
release_date="2023-07-18",
|
|
@@ -140,16 +150,25 @@ dinov2_base = ModelMeta(
|
|
|
140
150
|
open_weights=True,
|
|
141
151
|
public_training_code="https://github.com/facebookresearch/dinov2",
|
|
142
152
|
public_training_data=None,
|
|
143
|
-
framework=["PyTorch"],
|
|
153
|
+
framework=["PyTorch", "Transformers", "safetensors"],
|
|
144
154
|
reference="https://huggingface.co/facebook/dinov2-base",
|
|
145
155
|
similarity_fn_name=ScoringFunction.COSINE,
|
|
146
156
|
use_instructions=False,
|
|
147
157
|
training_datasets=dinov2_training_datasets,
|
|
158
|
+
citation="""@misc{oquab2023dinov2,
|
|
159
|
+
title={DINOv2: Learning Robust Visual Features without Supervision},
|
|
160
|
+
author={Maxime Oquab and Timothée Darcet and Théo Moutakanni and Huy Vo and Marc Szafraniec and Vasil Khalidov and Pierre Fernandez and Daniel Haziza and Francisco Massa and Alaaeldin El-Nouby and Mahmoud Assran and Nicolas Ballas and Wojciech Galuba and Russell Howes and Po-Yao Huang and Shang-Wen Li and Ishan Misra and Michael Rabbat and Vasu Sharma and Gabriel Synnaeve and Hu Xu and Hervé Jegou and Julien Mairal and Patrick Labatut and Armand Joulin and Piotr Bojanowski},
|
|
161
|
+
year={2023},
|
|
162
|
+
eprint={2304.07193},
|
|
163
|
+
archivePrefix={arXiv},
|
|
164
|
+
primaryClass={cs.CV}
|
|
165
|
+
}""",
|
|
148
166
|
)
|
|
149
167
|
|
|
150
168
|
dinov2_large = ModelMeta(
|
|
151
|
-
loader=DINOModel,
|
|
169
|
+
loader=DINOModel,
|
|
152
170
|
name="facebook/dinov2-large",
|
|
171
|
+
model_type=["dense"],
|
|
153
172
|
languages=["eng-Latn"],
|
|
154
173
|
revision="47b73eefe95e8d44ec3623f8890bd894b6ea2d6c",
|
|
155
174
|
release_date="2023-07-18",
|
|
@@ -162,16 +181,25 @@ dinov2_large = ModelMeta(
|
|
|
162
181
|
open_weights=True,
|
|
163
182
|
public_training_code="https://github.com/facebookresearch/dinov2",
|
|
164
183
|
public_training_data=None,
|
|
165
|
-
framework=["PyTorch"],
|
|
184
|
+
framework=["PyTorch", "Transformers", "safetensors"],
|
|
166
185
|
reference="https://huggingface.co/facebook/dinov2-large",
|
|
167
186
|
similarity_fn_name=ScoringFunction.COSINE,
|
|
168
187
|
use_instructions=False,
|
|
169
188
|
training_datasets=dinov2_training_datasets,
|
|
189
|
+
citation="""@misc{oquab2023dinov2,
|
|
190
|
+
title={DINOv2: Learning Robust Visual Features without Supervision},
|
|
191
|
+
author={Maxime Oquab and Timothée Darcet and Théo Moutakanni and Huy Vo and Marc Szafraniec and Vasil Khalidov and Pierre Fernandez and Daniel Haziza and Francisco Massa and Alaaeldin El-Nouby and Mahmoud Assran and Nicolas Ballas and Wojciech Galuba and Russell Howes and Po-Yao Huang and Shang-Wen Li and Ishan Misra and Michael Rabbat and Vasu Sharma and Gabriel Synnaeve and Hu Xu and Hervé Jegou and Julien Mairal and Patrick Labatut and Armand Joulin and Piotr Bojanowski},
|
|
192
|
+
year={2023},
|
|
193
|
+
eprint={2304.07193},
|
|
194
|
+
archivePrefix={arXiv},
|
|
195
|
+
primaryClass={cs.CV}
|
|
196
|
+
}""",
|
|
170
197
|
)
|
|
171
198
|
|
|
172
199
|
dinov2_giant = ModelMeta(
|
|
173
|
-
loader=DINOModel,
|
|
200
|
+
loader=DINOModel,
|
|
174
201
|
name="facebook/dinov2-giant",
|
|
202
|
+
model_type=["dense"],
|
|
175
203
|
languages=["eng-Latn"],
|
|
176
204
|
revision="611a9d42f2335e0f921f1e313ad3c1b7178d206d",
|
|
177
205
|
release_date="2023-07-18",
|
|
@@ -184,11 +212,19 @@ dinov2_giant = ModelMeta(
|
|
|
184
212
|
open_weights=True,
|
|
185
213
|
public_training_code="https://github.com/facebookresearch/dinov2",
|
|
186
214
|
public_training_data=None,
|
|
187
|
-
framework=["PyTorch"],
|
|
215
|
+
framework=["PyTorch", "Transformers", "safetensors"],
|
|
188
216
|
reference="https://huggingface.co/facebook/dinov2-giant",
|
|
189
217
|
similarity_fn_name=ScoringFunction.COSINE,
|
|
190
218
|
use_instructions=False,
|
|
191
219
|
training_datasets=dinov2_training_datasets,
|
|
220
|
+
citation="""@misc{oquab2023dinov2,
|
|
221
|
+
title={DINOv2: Learning Robust Visual Features without Supervision},
|
|
222
|
+
author={Maxime Oquab and Timothée Darcet and Théo Moutakanni and Huy Vo and Marc Szafraniec and Vasil Khalidov and Pierre Fernandez and Daniel Haziza and Francisco Massa and Alaaeldin El-Nouby and Mahmoud Assran and Nicolas Ballas and Wojciech Galuba and Russell Howes and Po-Yao Huang and Shang-Wen Li and Ishan Misra and Michael Rabbat and Vasu Sharma and Gabriel Synnaeve and Hu Xu and Hervé Jegou and Julien Mairal and Patrick Labatut and Armand Joulin and Piotr Bojanowski},
|
|
223
|
+
year={2023},
|
|
224
|
+
eprint={2304.07193},
|
|
225
|
+
archivePrefix={arXiv},
|
|
226
|
+
primaryClass={cs.CV}
|
|
227
|
+
}""",
|
|
192
228
|
)
|
|
193
229
|
|
|
194
230
|
webssl_dino_training_datasets = set(
|
|
@@ -198,6 +234,7 @@ webssl_dino_training_datasets = set(
|
|
|
198
234
|
webssl_dino300m_full2b = ModelMeta(
|
|
199
235
|
loader=DINOModel,
|
|
200
236
|
name="facebook/webssl-dino300m-full2b-224",
|
|
237
|
+
model_type=["dense"],
|
|
201
238
|
languages=["eng-Latn"],
|
|
202
239
|
revision="8529cdb3fb75014932af3b896455fc21c386168e",
|
|
203
240
|
release_date="2025-04-24",
|
|
@@ -210,16 +247,25 @@ webssl_dino300m_full2b = ModelMeta(
|
|
|
210
247
|
open_weights=True,
|
|
211
248
|
public_training_code="",
|
|
212
249
|
public_training_data=None,
|
|
213
|
-
framework=["PyTorch"],
|
|
250
|
+
framework=["PyTorch", "Transformers", "safetensors"],
|
|
214
251
|
reference="https://huggingface.co/facebook/webssl-dino300m-full2b-224",
|
|
215
252
|
similarity_fn_name=None,
|
|
216
253
|
use_instructions=False,
|
|
217
254
|
training_datasets=webssl_dino_training_datasets,
|
|
255
|
+
citation="""@article{fan2025scaling,
|
|
256
|
+
title={Scaling Language-Free Visual Representation Learning},
|
|
257
|
+
author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
|
|
258
|
+
year={2025},
|
|
259
|
+
eprint={2504.01017},
|
|
260
|
+
archivePrefix={arXiv},
|
|
261
|
+
primaryClass={cs.CV}
|
|
262
|
+
}""",
|
|
218
263
|
)
|
|
219
264
|
|
|
220
265
|
webssl_dino1b_full2b = ModelMeta(
|
|
221
266
|
loader=DINOModel,
|
|
222
267
|
name="facebook/webssl-dino1b-full2b-224",
|
|
268
|
+
model_type=["dense"],
|
|
223
269
|
languages=["eng-Latn"],
|
|
224
270
|
revision="d3bf033d9c8cc62ea9e73c40956642cad2ec568a",
|
|
225
271
|
release_date="2025-04-24",
|
|
@@ -232,16 +278,25 @@ webssl_dino1b_full2b = ModelMeta(
|
|
|
232
278
|
open_weights=True,
|
|
233
279
|
public_training_code="",
|
|
234
280
|
public_training_data=None,
|
|
235
|
-
framework=["PyTorch"],
|
|
281
|
+
framework=["PyTorch", "Transformers", "safetensors"],
|
|
236
282
|
reference="https://huggingface.co/facebook/webssl-dino1b-full2b-224",
|
|
237
283
|
similarity_fn_name=None,
|
|
238
284
|
use_instructions=False,
|
|
239
285
|
training_datasets=webssl_dino_training_datasets,
|
|
286
|
+
citation="""@article{fan2025scaling,
|
|
287
|
+
title={Scaling Language-Free Visual Representation Learning},
|
|
288
|
+
author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
|
|
289
|
+
year={2025},
|
|
290
|
+
eprint={2504.01017},
|
|
291
|
+
archivePrefix={arXiv},
|
|
292
|
+
primaryClass={cs.CV}
|
|
293
|
+
}""",
|
|
240
294
|
)
|
|
241
295
|
|
|
242
296
|
webssl_dino2b_full2b = ModelMeta(
|
|
243
297
|
loader=DINOModel,
|
|
244
298
|
name="facebook/webssl-dino2b-full2b-224",
|
|
299
|
+
model_type=["dense"],
|
|
245
300
|
languages=["eng-Latn"],
|
|
246
301
|
revision="cd5893e3fd2e988eb716792049b3dd53b3f1b68b",
|
|
247
302
|
release_date="2025-04-24",
|
|
@@ -254,16 +309,25 @@ webssl_dino2b_full2b = ModelMeta(
|
|
|
254
309
|
open_weights=True,
|
|
255
310
|
public_training_code="",
|
|
256
311
|
public_training_data=None,
|
|
257
|
-
framework=["PyTorch"],
|
|
312
|
+
framework=["PyTorch", "Transformers", "safetensors"],
|
|
258
313
|
reference="https://huggingface.co/facebook/webssl-dino2b-full2b-224",
|
|
259
314
|
similarity_fn_name=None,
|
|
260
315
|
use_instructions=False,
|
|
261
316
|
training_datasets=webssl_dino_training_datasets,
|
|
317
|
+
citation="""@article{fan2025scaling,
|
|
318
|
+
title={Scaling Language-Free Visual Representation Learning},
|
|
319
|
+
author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
|
|
320
|
+
year={2025},
|
|
321
|
+
eprint={2504.01017},
|
|
322
|
+
archivePrefix={arXiv},
|
|
323
|
+
primaryClass={cs.CV}
|
|
324
|
+
}""",
|
|
262
325
|
)
|
|
263
326
|
|
|
264
327
|
webssl_dino3b_full2b = ModelMeta(
|
|
265
328
|
loader=DINOModel,
|
|
266
329
|
name="facebook/webssl-dino3b-full2b-224",
|
|
330
|
+
model_type=["dense"],
|
|
267
331
|
languages=["eng-Latn"],
|
|
268
332
|
revision="2d015c340b16bc47bc6557fcb4e6c83a9d4aa1d3",
|
|
269
333
|
release_date="2025-04-24",
|
|
@@ -276,16 +340,25 @@ webssl_dino3b_full2b = ModelMeta(
|
|
|
276
340
|
open_weights=True,
|
|
277
341
|
public_training_code="",
|
|
278
342
|
public_training_data=None,
|
|
279
|
-
framework=["PyTorch"],
|
|
343
|
+
framework=["PyTorch", "Transformers", "safetensors"],
|
|
280
344
|
reference="https://huggingface.co/facebook/webssl-dino3b-full2b-224",
|
|
281
345
|
similarity_fn_name=None,
|
|
282
346
|
use_instructions=False,
|
|
283
347
|
training_datasets=webssl_dino_training_datasets,
|
|
348
|
+
citation="""@article{fan2025scaling,
|
|
349
|
+
title={Scaling Language-Free Visual Representation Learning},
|
|
350
|
+
author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
|
|
351
|
+
year={2025},
|
|
352
|
+
eprint={2504.01017},
|
|
353
|
+
archivePrefix={arXiv},
|
|
354
|
+
primaryClass={cs.CV}
|
|
355
|
+
}""",
|
|
284
356
|
)
|
|
285
357
|
|
|
286
358
|
webssl_dino5b_full2b = ModelMeta(
|
|
287
359
|
loader=DINOModel,
|
|
288
360
|
name="facebook/webssl-dino5b-full2b-224",
|
|
361
|
+
model_type=["dense"],
|
|
289
362
|
languages=["eng-Latn"],
|
|
290
363
|
revision="88006b18b9af369f6c611db7a64d908bde3714e0",
|
|
291
364
|
release_date="2025-04-24",
|
|
@@ -298,16 +371,25 @@ webssl_dino5b_full2b = ModelMeta(
|
|
|
298
371
|
open_weights=True,
|
|
299
372
|
public_training_code="",
|
|
300
373
|
public_training_data=None,
|
|
301
|
-
framework=["PyTorch"],
|
|
374
|
+
framework=["PyTorch", "Transformers", "safetensors"],
|
|
302
375
|
reference="https://huggingface.co/facebook/webssl-dino5b-full2b-224",
|
|
303
376
|
similarity_fn_name=None,
|
|
304
377
|
use_instructions=False,
|
|
305
378
|
training_datasets=webssl_dino_training_datasets,
|
|
379
|
+
citation="""@article{fan2025scaling,
|
|
380
|
+
title={Scaling Language-Free Visual Representation Learning},
|
|
381
|
+
author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
|
|
382
|
+
year={2025},
|
|
383
|
+
eprint={2504.01017},
|
|
384
|
+
archivePrefix={arXiv},
|
|
385
|
+
primaryClass={cs.CV}
|
|
386
|
+
}""",
|
|
306
387
|
)
|
|
307
388
|
|
|
308
389
|
webssl_dino7b_full8b_224 = ModelMeta(
|
|
309
390
|
loader=DINOModel,
|
|
310
391
|
name="facebook/webssl-dino7b-full8b-224",
|
|
392
|
+
model_type=["dense"],
|
|
311
393
|
languages=["eng-Latn"],
|
|
312
394
|
revision="c6085463ea680043042a80c6d41db2c65e85f466",
|
|
313
395
|
release_date="2025-04-24",
|
|
@@ -320,16 +402,25 @@ webssl_dino7b_full8b_224 = ModelMeta(
|
|
|
320
402
|
open_weights=True,
|
|
321
403
|
public_training_code="",
|
|
322
404
|
public_training_data=None,
|
|
323
|
-
framework=["PyTorch"],
|
|
405
|
+
framework=["PyTorch", "Transformers", "safetensors"],
|
|
324
406
|
reference="https://huggingface.co/facebook/webssl-dino7b-full8b-224",
|
|
325
407
|
similarity_fn_name=None,
|
|
326
408
|
use_instructions=False,
|
|
327
409
|
training_datasets=webssl_dino_training_datasets,
|
|
410
|
+
citation="""@article{fan2025scaling,
|
|
411
|
+
title={Scaling Language-Free Visual Representation Learning},
|
|
412
|
+
author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
|
|
413
|
+
year={2025},
|
|
414
|
+
eprint={2504.01017},
|
|
415
|
+
archivePrefix={arXiv},
|
|
416
|
+
primaryClass={cs.CV}
|
|
417
|
+
}""",
|
|
328
418
|
)
|
|
329
419
|
|
|
330
420
|
webssl_dino7b_full8b_378 = ModelMeta(
|
|
331
421
|
loader=DINOModel,
|
|
332
422
|
name="facebook/webssl-dino7b-full8b-378",
|
|
423
|
+
model_type=["dense"],
|
|
333
424
|
languages=["eng-Latn"],
|
|
334
425
|
revision="53c8c5b43070bd2ddb3f66161140408ce832301f",
|
|
335
426
|
release_date="2025-04-24",
|
|
@@ -342,16 +433,25 @@ webssl_dino7b_full8b_378 = ModelMeta(
|
|
|
342
433
|
open_weights=True,
|
|
343
434
|
public_training_code="",
|
|
344
435
|
public_training_data=None,
|
|
345
|
-
framework=["PyTorch"],
|
|
436
|
+
framework=["PyTorch", "Transformers", "safetensors"],
|
|
346
437
|
reference="https://huggingface.co/facebook/webssl-dino7b-full8b-378",
|
|
347
438
|
similarity_fn_name=None,
|
|
348
439
|
use_instructions=False,
|
|
349
440
|
training_datasets=webssl_dino_training_datasets,
|
|
441
|
+
citation="""@article{fan2025scaling,
|
|
442
|
+
title={Scaling Language-Free Visual Representation Learning},
|
|
443
|
+
author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
|
|
444
|
+
year={2025},
|
|
445
|
+
eprint={2504.01017},
|
|
446
|
+
archivePrefix={arXiv},
|
|
447
|
+
primaryClass={cs.CV}
|
|
448
|
+
}""",
|
|
350
449
|
)
|
|
351
450
|
|
|
352
451
|
webssl_dino7b_full8b_518 = ModelMeta(
|
|
353
452
|
loader=DINOModel,
|
|
354
453
|
name="facebook/webssl-dino7b-full8b-518",
|
|
454
|
+
model_type=["dense"],
|
|
355
455
|
languages=["eng-Latn"],
|
|
356
456
|
revision="aee350d2c5e3e5fdb7ee6985291d808ea5eef431",
|
|
357
457
|
release_date="2025-04-24",
|
|
@@ -364,17 +464,26 @@ webssl_dino7b_full8b_518 = ModelMeta(
|
|
|
364
464
|
open_weights=True,
|
|
365
465
|
public_training_code="",
|
|
366
466
|
public_training_data=None,
|
|
367
|
-
framework=["PyTorch"],
|
|
467
|
+
framework=["PyTorch", "Transformers", "safetensors"],
|
|
368
468
|
reference="https://huggingface.co/facebook/webssl-dino7b-full8b-518",
|
|
369
469
|
similarity_fn_name=None,
|
|
370
470
|
use_instructions=False,
|
|
371
471
|
training_datasets=webssl_dino_training_datasets,
|
|
472
|
+
citation="""@article{fan2025scaling,
|
|
473
|
+
title={Scaling Language-Free Visual Representation Learning},
|
|
474
|
+
author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
|
|
475
|
+
year={2025},
|
|
476
|
+
eprint={2504.01017},
|
|
477
|
+
archivePrefix={arXiv},
|
|
478
|
+
primaryClass={cs.CV}
|
|
479
|
+
}""",
|
|
372
480
|
)
|
|
373
481
|
|
|
374
482
|
|
|
375
483
|
webssl_dino2b_light2b = ModelMeta(
|
|
376
484
|
loader=DINOModel,
|
|
377
485
|
name="facebook/webssl-dino2b-light2b-224",
|
|
486
|
+
model_type=["dense"],
|
|
378
487
|
languages=["eng-Latn"],
|
|
379
488
|
revision="633a663f304e63cc3cbec3f7f9ca2fbc94736128",
|
|
380
489
|
release_date="2025-04-24",
|
|
@@ -387,16 +496,25 @@ webssl_dino2b_light2b = ModelMeta(
|
|
|
387
496
|
open_weights=True,
|
|
388
497
|
public_training_code="",
|
|
389
498
|
public_training_data=None,
|
|
390
|
-
framework=["PyTorch"],
|
|
499
|
+
framework=["PyTorch", "Transformers", "safetensors"],
|
|
391
500
|
reference="https://huggingface.co/facebook/webssl-dino2b-light2b-224",
|
|
392
501
|
similarity_fn_name=None,
|
|
393
502
|
use_instructions=False,
|
|
394
503
|
training_datasets=webssl_dino_training_datasets,
|
|
504
|
+
citation="""@article{fan2025scaling,
|
|
505
|
+
title={Scaling Language-Free Visual Representation Learning},
|
|
506
|
+
author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
|
|
507
|
+
year={2025},
|
|
508
|
+
eprint={2504.01017},
|
|
509
|
+
archivePrefix={arXiv},
|
|
510
|
+
primaryClass={cs.CV}
|
|
511
|
+
}""",
|
|
395
512
|
)
|
|
396
513
|
|
|
397
514
|
webssl_dino2b_heavy2b = ModelMeta(
|
|
398
515
|
loader=DINOModel,
|
|
399
516
|
name="facebook/webssl-dino2b-heavy2b-224",
|
|
517
|
+
model_type=["dense"],
|
|
400
518
|
languages=["eng-Latn"],
|
|
401
519
|
revision="9f46eb0c0129656a1ef195fde072e3765abdb7c6",
|
|
402
520
|
release_date="2025-04-24",
|
|
@@ -409,16 +527,25 @@ webssl_dino2b_heavy2b = ModelMeta(
|
|
|
409
527
|
open_weights=True,
|
|
410
528
|
public_training_code="",
|
|
411
529
|
public_training_data=None,
|
|
412
|
-
framework=["PyTorch"],
|
|
530
|
+
framework=["PyTorch", "Transformers", "safetensors"],
|
|
413
531
|
reference="https://huggingface.co/facebook/webssl-dino2b-heavy2b-224",
|
|
414
532
|
similarity_fn_name=None,
|
|
415
533
|
use_instructions=False,
|
|
416
534
|
training_datasets=webssl_dino_training_datasets,
|
|
535
|
+
citation="""@article{fan2025scaling,
|
|
536
|
+
title={Scaling Language-Free Visual Representation Learning},
|
|
537
|
+
author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
|
|
538
|
+
year={2025},
|
|
539
|
+
eprint={2504.01017},
|
|
540
|
+
archivePrefix={arXiv},
|
|
541
|
+
primaryClass={cs.CV}
|
|
542
|
+
}""",
|
|
417
543
|
)
|
|
418
544
|
|
|
419
545
|
webssl_dino3b_light2b = ModelMeta(
|
|
420
546
|
loader=DINOModel,
|
|
421
547
|
name="facebook/webssl-dino3b-light2b-224",
|
|
548
|
+
model_type=["dense"],
|
|
422
549
|
languages=["eng-Latn"],
|
|
423
550
|
revision="4d0160f60673805431f4ad14983e712ed88be5b8",
|
|
424
551
|
release_date="2025-04-24",
|
|
@@ -431,16 +558,25 @@ webssl_dino3b_light2b = ModelMeta(
|
|
|
431
558
|
open_weights=True,
|
|
432
559
|
public_training_code="",
|
|
433
560
|
public_training_data=None,
|
|
434
|
-
framework=["PyTorch"],
|
|
561
|
+
framework=["PyTorch", "Transformers", "safetensors"],
|
|
435
562
|
reference="https://huggingface.co/facebook/webssl-dino3b-light2b-224",
|
|
436
563
|
similarity_fn_name=None,
|
|
437
564
|
use_instructions=False,
|
|
438
565
|
training_datasets=webssl_dino_training_datasets,
|
|
566
|
+
citation="""@article{fan2025scaling,
|
|
567
|
+
title={Scaling Language-Free Visual Representation Learning},
|
|
568
|
+
author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
|
|
569
|
+
year={2025},
|
|
570
|
+
eprint={2504.01017},
|
|
571
|
+
archivePrefix={arXiv},
|
|
572
|
+
primaryClass={cs.CV}
|
|
573
|
+
}""",
|
|
439
574
|
)
|
|
440
575
|
|
|
441
576
|
webssl_dino3b_heavy2b = ModelMeta(
|
|
442
577
|
loader=DINOModel,
|
|
443
578
|
name="facebook/webssl-dino3b-heavy2b-224",
|
|
579
|
+
model_type=["dense"],
|
|
444
580
|
languages=["eng-Latn"],
|
|
445
581
|
revision="dd39c2910747561b332285d96c4dce0bdb240775",
|
|
446
582
|
release_date="2025-04-24",
|
|
@@ -453,16 +589,25 @@ webssl_dino3b_heavy2b = ModelMeta(
|
|
|
453
589
|
open_weights=True,
|
|
454
590
|
public_training_code="",
|
|
455
591
|
public_training_data=None,
|
|
456
|
-
framework=["PyTorch"],
|
|
592
|
+
framework=["PyTorch", "Transformers", "safetensors"],
|
|
457
593
|
reference="https://huggingface.co/facebook/webssl-dino3b-heavy2b-224",
|
|
458
594
|
similarity_fn_name=None,
|
|
459
595
|
use_instructions=False,
|
|
460
596
|
training_datasets=webssl_dino_training_datasets,
|
|
597
|
+
citation="""@article{fan2025scaling,
|
|
598
|
+
title={Scaling Language-Free Visual Representation Learning},
|
|
599
|
+
author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
|
|
600
|
+
year={2025},
|
|
601
|
+
eprint={2504.01017},
|
|
602
|
+
archivePrefix={arXiv},
|
|
603
|
+
primaryClass={cs.CV}
|
|
604
|
+
}""",
|
|
461
605
|
)
|
|
462
606
|
|
|
463
607
|
webssl_mae300m_full2b = ModelMeta(
|
|
464
608
|
loader=DINOModel,
|
|
465
609
|
name="facebook/webssl-mae300m-full2b-224",
|
|
610
|
+
model_type=["dense"],
|
|
466
611
|
languages=["eng-Latn"],
|
|
467
612
|
revision="4655a0ac1726c206ba14d5ccb26758c62a4d03b0",
|
|
468
613
|
release_date="2025-04-24",
|
|
@@ -475,16 +620,25 @@ webssl_mae300m_full2b = ModelMeta(
|
|
|
475
620
|
open_weights=True,
|
|
476
621
|
public_training_code="",
|
|
477
622
|
public_training_data=None,
|
|
478
|
-
framework=["PyTorch"],
|
|
623
|
+
framework=["PyTorch", "Transformers", "safetensors"],
|
|
479
624
|
reference="https://huggingface.co/facebook/webssl-mae300m-full2b-224",
|
|
480
625
|
similarity_fn_name=None,
|
|
481
626
|
use_instructions=False,
|
|
482
627
|
training_datasets=webssl_dino_training_datasets,
|
|
628
|
+
citation="""@article{fan2025scaling,
|
|
629
|
+
title={Scaling Language-Free Visual Representation Learning},
|
|
630
|
+
author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
|
|
631
|
+
year={2025},
|
|
632
|
+
eprint={2504.01017},
|
|
633
|
+
archivePrefix={arXiv},
|
|
634
|
+
primaryClass={cs.CV}
|
|
635
|
+
}""",
|
|
483
636
|
)
|
|
484
637
|
|
|
485
638
|
webssl_mae700m_full2b = ModelMeta(
|
|
486
639
|
loader=DINOModel,
|
|
487
640
|
name="facebook/webssl-mae700m-full2b-224",
|
|
641
|
+
model_type=["dense"],
|
|
488
642
|
languages=["eng-Latn"],
|
|
489
643
|
revision="c32be382e757d73a178de1ead62c27391d4b4280",
|
|
490
644
|
release_date="2025-04-24",
|
|
@@ -497,16 +651,25 @@ webssl_mae700m_full2b = ModelMeta(
|
|
|
497
651
|
open_weights=True,
|
|
498
652
|
public_training_code="",
|
|
499
653
|
public_training_data=None,
|
|
500
|
-
framework=["PyTorch"],
|
|
654
|
+
framework=["PyTorch", "Transformers", "safetensors"],
|
|
501
655
|
reference="https://huggingface.co/facebook/webssl-mae700m-full2b-224",
|
|
502
656
|
similarity_fn_name=None,
|
|
503
657
|
use_instructions=False,
|
|
504
658
|
training_datasets=webssl_dino_training_datasets,
|
|
659
|
+
citation="""@article{fan2025scaling,
|
|
660
|
+
title={Scaling Language-Free Visual Representation Learning},
|
|
661
|
+
author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
|
|
662
|
+
year={2025},
|
|
663
|
+
eprint={2504.01017},
|
|
664
|
+
archivePrefix={arXiv},
|
|
665
|
+
primaryClass={cs.CV}
|
|
666
|
+
}""",
|
|
505
667
|
)
|
|
506
668
|
|
|
507
669
|
webssl_mae1b_full2b = ModelMeta(
|
|
508
670
|
loader=DINOModel,
|
|
509
671
|
name="facebook/webssl-mae1b-full2b-224",
|
|
672
|
+
model_type=["dense"],
|
|
510
673
|
languages=["eng-Latn"],
|
|
511
674
|
revision="5880aefedbad8db0f44d27358f6f08e8576f70fc",
|
|
512
675
|
release_date="2025-04-24",
|
|
@@ -519,9 +682,17 @@ webssl_mae1b_full2b = ModelMeta(
|
|
|
519
682
|
open_weights=True,
|
|
520
683
|
public_training_code="",
|
|
521
684
|
public_training_data=None,
|
|
522
|
-
framework=["PyTorch"],
|
|
685
|
+
framework=["PyTorch", "Transformers", "safetensors"],
|
|
523
686
|
reference="https://huggingface.co/facebook/webssl-mae1b-full2b-224",
|
|
524
687
|
similarity_fn_name=None,
|
|
525
688
|
use_instructions=False,
|
|
526
689
|
training_datasets=webssl_dino_training_datasets,
|
|
690
|
+
citation="""@article{fan2025scaling,
|
|
691
|
+
title={Scaling Language-Free Visual Representation Learning},
|
|
692
|
+
author={David Fan and Shengbang Tong and Jiachen Zhu and Koustuv Sinha and Zhuang Liu and Xinlei Chen and Michael Rabbat and Nicolas Ballas and Yann LeCun and Amir Bar and Saining Xie},
|
|
693
|
+
year={2025},
|
|
694
|
+
eprint={2504.01017},
|
|
695
|
+
archivePrefix={arXiv},
|
|
696
|
+
primaryClass={cs.CV}
|
|
697
|
+
}""",
|
|
527
698
|
)
|
|
@@ -40,11 +40,19 @@ e5_instruct = ModelMeta(
|
|
|
40
40
|
normalized=True,
|
|
41
41
|
),
|
|
42
42
|
name="intfloat/multilingual-e5-large-instruct",
|
|
43
|
+
model_type=["dense"],
|
|
43
44
|
languages=XLMR_LANGUAGES,
|
|
44
45
|
open_weights=True,
|
|
45
46
|
revision="baa7be480a7de1539afce709c8f13f833a510e0a",
|
|
46
47
|
release_date=E5_PAPER_RELEASE_DATE,
|
|
47
|
-
framework=[
|
|
48
|
+
framework=[
|
|
49
|
+
"GritLM",
|
|
50
|
+
"PyTorch",
|
|
51
|
+
"Sentence Transformers",
|
|
52
|
+
"ONNX",
|
|
53
|
+
"safetensors",
|
|
54
|
+
"Transformers",
|
|
55
|
+
],
|
|
48
56
|
similarity_fn_name=ScoringFunction.COSINE,
|
|
49
57
|
use_instructions=True,
|
|
50
58
|
reference="https://huggingface.co/intfloat/multilingual-e5-large-instruct",
|
|
@@ -78,11 +86,18 @@ e5_mistral = ModelMeta(
|
|
|
78
86
|
normalized=True,
|
|
79
87
|
),
|
|
80
88
|
name="intfloat/e5-mistral-7b-instruct",
|
|
89
|
+
model_type=["dense"],
|
|
81
90
|
languages=MISTRAL_LANGUAGES,
|
|
82
91
|
open_weights=True,
|
|
83
92
|
revision="07163b72af1488142a360786df853f237b1a3ca1",
|
|
84
93
|
release_date=E5_PAPER_RELEASE_DATE,
|
|
85
|
-
framework=[
|
|
94
|
+
framework=[
|
|
95
|
+
"GritLM",
|
|
96
|
+
"PyTorch",
|
|
97
|
+
"Sentence Transformers",
|
|
98
|
+
"safetensors",
|
|
99
|
+
"Transformers",
|
|
100
|
+
],
|
|
86
101
|
similarity_fn_name=ScoringFunction.COSINE,
|
|
87
102
|
use_instructions=True,
|
|
88
103
|
reference="https://huggingface.co/intfloat/e5-mistral-7b-instruct",
|
|
@@ -125,6 +140,7 @@ zeta_alpha_ai__zeta_alpha_e5_mistral = ModelMeta(
|
|
|
125
140
|
normalized=True,
|
|
126
141
|
),
|
|
127
142
|
name="zeta-alpha-ai/Zeta-Alpha-E5-Mistral",
|
|
143
|
+
model_type=["dense"],
|
|
128
144
|
revision="c791d37474fa6a5c72eb3a2522be346bc21fbfc3",
|
|
129
145
|
release_date="2024-08-30",
|
|
130
146
|
languages=["eng-Latn"],
|
|
@@ -136,7 +152,13 @@ zeta_alpha_ai__zeta_alpha_e5_mistral = ModelMeta(
|
|
|
136
152
|
open_weights=True,
|
|
137
153
|
public_training_data=None,
|
|
138
154
|
public_training_code=None,
|
|
139
|
-
framework=[
|
|
155
|
+
framework=[
|
|
156
|
+
"PyTorch",
|
|
157
|
+
"Sentence Transformers",
|
|
158
|
+
"GritLM",
|
|
159
|
+
"safetensors",
|
|
160
|
+
"Transformers",
|
|
161
|
+
],
|
|
140
162
|
reference="https://huggingface.co/zeta-alpha-ai/Zeta-Alpha-E5-Mistral",
|
|
141
163
|
similarity_fn_name=ScoringFunction.COSINE,
|
|
142
164
|
use_instructions=True,
|
|
@@ -201,6 +223,7 @@ BeastyZ__e5_R_mistral_7b = ModelMeta(
|
|
|
201
223
|
tokenizer_kwargs={"pad_token": "</s>"},
|
|
202
224
|
),
|
|
203
225
|
name="BeastyZ/e5-R-mistral-7b",
|
|
226
|
+
model_type=["dense"],
|
|
204
227
|
revision="3f810a6a7fd220369ad248e3705cf13d71803602",
|
|
205
228
|
release_date="2024-06-28",
|
|
206
229
|
languages=["eng-Latn"],
|
|
@@ -212,7 +235,7 @@ BeastyZ__e5_R_mistral_7b = ModelMeta(
|
|
|
212
235
|
open_weights=True,
|
|
213
236
|
public_training_code="https://github.com/LeeSureman/E5-Retrieval-Reproduction",
|
|
214
237
|
public_training_data="https://huggingface.co/datasets/BeastyZ/E5-R",
|
|
215
|
-
framework=["PyTorch"],
|
|
238
|
+
framework=["PyTorch", "Transformers", "safetensors"],
|
|
216
239
|
reference="https://huggingface.co/BeastyZ/e5-R-mistral-7b",
|
|
217
240
|
similarity_fn_name="cosine",
|
|
218
241
|
use_instructions=True,
|