EuroEval 15.10.0__tar.gz → 15.10.1__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of EuroEval might be problematic. Click here for more details.
- {euroeval-15.10.0 → euroeval-15.10.1}/.pre-commit-config.yaml +1 -1
- {euroeval-15.10.0 → euroeval-15.10.1}/CHANGELOG.md +6 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/PKG-INFO +1 -1
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/README.md +1 -1
- euroeval-15.10.1/docs/leaderboards/Monolingual/finnish.md +15 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/pyproject.toml +1 -1
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/finetuning.py +1 -1
- {euroeval-15.10.0 → euroeval-15.10.1}/uv.lock +1 -1
- {euroeval-15.10.0 → euroeval-15.10.1}/.github/ISSUE_TEMPLATE/benchmark_dataset_request.yaml +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/.github/ISSUE_TEMPLATE/bug.yaml +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/.github/ISSUE_TEMPLATE/feature_request.yaml +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/.github/ISSUE_TEMPLATE/model_evaluation_request.yaml +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/.github/workflows/ci.yaml +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/.gitignore +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/CITATION.cff +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/CODE_OF_CONDUCT.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/CONTRIBUTING.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/Dockerfile.cuda +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/LICENSE +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/NEW_DATASET_GUIDE.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/README.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/CNAME +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/datasets/README.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/datasets/danish.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/datasets/dutch.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/datasets/english.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/datasets/faroese.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/datasets/finnish.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/datasets/french.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/datasets/german.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/datasets/icelandic.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/datasets/italian.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/datasets/norwegian.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/datasets/spanish.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/datasets/swedish.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/extras/radial_plotter.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/faq.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/gfx/favicon.png +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/leaderboards/Monolingual/danish.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/leaderboards/Monolingual/dutch.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/leaderboards/Monolingual/english.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/leaderboards/Monolingual/faroese.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/leaderboards/Monolingual/french.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/leaderboards/Monolingual/german.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/leaderboards/Monolingual/icelandic.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/leaderboards/Monolingual/italian.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/leaderboards/Monolingual/norwegian.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/leaderboards/Monolingual/spanish.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/leaderboards/Monolingual/swedish.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/leaderboards/Multilingual/european.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/leaderboards/Multilingual/germanic.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/leaderboards/Multilingual/mainland-scandinavian.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/leaderboards/Multilingual/romance.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/leaderboards/README.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/methodology.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/python-package.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/tasks/README.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/tasks/common-sense-reasoning.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/tasks/knowledge.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/tasks/linguistic-acceptability.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/tasks/named-entity-recognition.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/tasks/reading-comprehension.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/tasks/sentiment-classification.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/tasks/speed.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/docs/tasks/summarization.md +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/gfx/euroeval.png +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/gfx/euroeval.xcf +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/gfx/scandeval.png +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/makefile +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/mkdocs.yaml +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/__init__.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/benchmark_config_factory.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/benchmark_modules/__init__.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/benchmark_modules/base.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/benchmark_modules/fresh.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/benchmark_modules/hf.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/benchmark_modules/litellm.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/benchmark_modules/vllm.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/benchmarker.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/callbacks.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/cli.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/constants.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/data_loading.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/data_models.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/dataset_configs/__init__.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/dataset_configs/danish.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/dataset_configs/dutch.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/dataset_configs/english.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/dataset_configs/faroese.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/dataset_configs/finnish.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/dataset_configs/french.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/dataset_configs/german.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/dataset_configs/icelandic.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/dataset_configs/italian.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/dataset_configs/norwegian.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/dataset_configs/spanish.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/dataset_configs/swedish.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/enums.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/exceptions.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/generation.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/generation_utils.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/human_evaluation.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/languages.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/model_cache.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/model_config.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/model_loading.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/prompt_templates/__init__.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/prompt_templates/linguistic_acceptability.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/prompt_templates/multiple_choice.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/prompt_templates/named_entity_recognition.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/prompt_templates/reading_comprehension.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/prompt_templates/sentiment_classification.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/prompt_templates/summarization.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/scores.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/speed_benchmark.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/task_group_utils/__init__.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/task_group_utils/multiple_choice_classification.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/task_group_utils/question_answering.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/task_group_utils/sequence_classification.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/task_group_utils/text_to_text.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/task_group_utils/token_classification.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/tasks.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/tokenization_utils.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/types.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/utils.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/constants.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_allocine.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_angry_tweets.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_arc.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_arc_is.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_belebele.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_cnn_dailymail.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_conll_en.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_conll_es.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_conll_nl.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_dane.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_danish_citizen_tests.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_dansk.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_danske_talemaader.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_danske_talemaader_old.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_dbrd.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_dutch_cola.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_eltec.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_fone.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_foqa.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_fosent.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_fquad.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_germanquad.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_germeval.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_hellaswag.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_hellaswag_fi.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_hotter_and_colder_sentiment.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_ice_linguistic.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_icelandic_error_corpus.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_icelandic_knowledge.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_icelandic_qa.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_icesum.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_ilpost_sum.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_jentoft.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_mim_gold_ner.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_mlqa_es.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_mlsum_de.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_mlsum_es.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_mmlu.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_multinerd-it.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_no_cola.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_no_sammendrag.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_nor_common_sense_qa.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_nordjylland_news.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_norec.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_norglm_multiqa.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_norglm_multisum.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_norne.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_norquad.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_nqii.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_nrk_quiz_qa.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_orange_sum.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_personal_sum.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_rrn.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_sb10k.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_scala.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_scandiqa.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_scandisent_fi.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_schibsted.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_sentiment_headlines_es.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_sentipolc16.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_squad.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_squad_it.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_squad_nl.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_squad_nl_old.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_sst5.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_suc3.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_swedn.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_swerec.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_turku_ner_fi.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_tydiqa_fi.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_wiki_lingua_nl.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_wikiann_fo.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_wikineural-it.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_winogrande_is.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_xlsum_fi.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/create_xquad_es.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/fix_dot_env_file.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/load_ud_pos.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/src/scripts/versioning.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/__init__.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/conftest.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_benchmark_config_factory.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_benchmark_modules/__init__.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_benchmark_modules/test_base.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_benchmark_modules/test_fresh.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_benchmark_modules/test_hf.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_benchmark_modules/test_litellm.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_benchmark_modules/test_vllm.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_benchmarker.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_callbacks.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_cli.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_constants.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_data_loading.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_data_models.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_dataset_configs.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_enums.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_exceptions.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_finetuning.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_generation.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_human_evaluation.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_languages.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_model_cache.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_model_config.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_model_loading.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_scores.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_speed_benchmark.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_task_utils/__init__.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_task_utils/test_question_answering.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_task_utils/test_sequence_classification.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_task_utils/test_text_to_text.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_task_utils/test_token_classification.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_tasks.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_tokenization_utils.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_types.py +0 -0
- {euroeval-15.10.0 → euroeval-15.10.1}/tests/test_utils.py +0 -0
|
@@ -10,6 +10,12 @@ and this project adheres to [Semantic Versioning](http://semver.org/spec/v2.0.0.
|
|
|
10
10
|
|
|
11
11
|
|
|
12
12
|
|
|
13
|
+
## [v15.10.1] - 2025-06-20
|
|
14
|
+
### Fixed
|
|
15
|
+
- Fixed an issue when benchmarking encoder models on reading comprehension tasks, where
|
|
16
|
+
we would sometimes truncate the model outputs when they should not have been truncated.
|
|
17
|
+
|
|
18
|
+
|
|
13
19
|
## [v15.10.0] - 2025-06-17
|
|
14
20
|
### Changed
|
|
15
21
|
- Updated `vllm` to `>=0.9.1`.
|
|
@@ -29,7 +29,7 @@ or [LM Studio](https://lmstudio.ai/).
|
|
|
29
29
|
The idea of EuroEval grew out of the development of the Danish language model RøBÆRTa in
|
|
30
30
|
2021, when we realised that there was no standard way to evaluate Danish language
|
|
31
31
|
models. It started as a hobby project including Danish, Swedish and Norwegian, but has
|
|
32
|
-
since grown to include
|
|
32
|
+
since grown to include 12+ European languages.
|
|
33
33
|
|
|
34
34
|
EuroEval is maintained by [Dan Saattrup Nielsen](https://www.saattrupdan.com/) from the
|
|
35
35
|
[Alexandra Institute](https://alexandra.dk), and is funded by the EU project
|
|
@@ -0,0 +1,15 @@
|
|
|
1
|
+
---
|
|
2
|
+
hide:
|
|
3
|
+
- toc
|
|
4
|
+
---
|
|
5
|
+
# 🇫🇮 Finnish
|
|
6
|
+
|
|
7
|
+
See the [leaderboard page](/leaderboards) for more information about all the columns.
|
|
8
|
+
|
|
9
|
+
/// tab | Generative Leaderboard
|
|
10
|
+
<iframe title="" aria-label="Table" id="datawrapper-chart-ubHSy" src="https://datawrapper.dwcdn.net/ubHSy" scrolling="no" frameborder="0" style="width: 0; min-width: 100% !important; border: none;" height="847" data-external="1"></iframe><script type="text/javascript">!function(){"use strict";window.addEventListener("message",(function(a){if(void 0!==a.data["datawrapper-height"]){var e=document.querySelectorAll("iframe");for(var t in a.data["datawrapper-height"])for(var r,i=0;r=e[i];i++)if(r.contentWindow===a.source){var d=a.data["datawrapper-height"][t]+"px";r.style.height=d}}}))}();</script>
|
|
11
|
+
///
|
|
12
|
+
|
|
13
|
+
/// tab | NLU Leaderboard
|
|
14
|
+
<iframe title="" aria-label="Table" id="datawrapper-chart-qVbA3" src="https://datawrapper.dwcdn.net/qVbA3/1/" scrolling="no" frameborder="0" style="width: 0; min-width: 100% !important; border: none;" height="818" data-external="1"></iframe><script type="text/javascript">!function(){"use strict";window.addEventListener("message",(function(a){if(void 0!==a.data["datawrapper-height"]){var e=document.querySelectorAll("iframe");for(var t in a.data["datawrapper-height"])for(var r,i=0;r=e[i];i++)if(r.contentWindow===a.source){var d=a.data["datawrapper-height"][t]+"px";r.style.height=d}}}))}();</script>
|
|
15
|
+
///
|
|
@@ -333,7 +333,7 @@ def remove_extra_tensors_from_logits(
|
|
|
333
333
|
Returns:
|
|
334
334
|
The processed logits.
|
|
335
335
|
"""
|
|
336
|
-
if isinstance(logits, tuple):
|
|
336
|
+
if isinstance(logits, tuple) and isinstance(logits[-1], tuple):
|
|
337
337
|
logits = logits[:-1]
|
|
338
338
|
if len(logits) == 1:
|
|
339
339
|
logits = logits[0]
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{euroeval-15.10.0 → euroeval-15.10.1}/docs/leaderboards/Multilingual/mainland-scandinavian.md
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/prompt_templates/linguistic_acceptability.py
RENAMED
|
File without changes
|
|
File without changes
|
{euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/prompt_templates/named_entity_recognition.py
RENAMED
|
File without changes
|
{euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/prompt_templates/reading_comprehension.py
RENAMED
|
File without changes
|
{euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/prompt_templates/sentiment_classification.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{euroeval-15.10.0 → euroeval-15.10.1}/src/euroeval/task_group_utils/sequence_classification.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|