wisent 0.7.379__py3-none-any.whl → 0.7.901__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- wisent/__init__.py +1 -1
- wisent/core/activations/__init__.py +22 -6
- wisent/core/activations/activation_cache.py +393 -0
- wisent/core/activations/activations.py +22 -40
- wisent/core/activations/activations_collector.py +145 -373
- wisent/core/activations/classifier_inference_strategy.py +195 -0
- wisent/core/activations/core/atoms.py +8 -92
- wisent/core/activations/extraction_strategy.py +480 -0
- wisent/core/agent/diagnose/response_diagnostics.py +3 -3
- wisent/core/agent/diagnose.py +3 -3
- wisent/core/autonomous_agent.py +2 -2
- wisent/core/classifiers/classifiers/core/atoms.py +3 -2
- wisent/core/cli/__init__.py +2 -1
- wisent/core/cli/agent/apply_steering.py +25 -31
- wisent/core/cli/agent/evaluate_response.py +18 -20
- wisent/core/cli/agent/train_classifier.py +36 -26
- wisent/core/cli/check_linearity.py +35 -3
- wisent/core/cli/cluster_benchmarks.py +470 -0
- wisent/core/cli/create_steering_vector.py +19 -9
- wisent/core/cli/diagnose_vectors.py +7 -4
- wisent/core/cli/estimate_unified_goodness_time.py +6 -4
- wisent/core/cli/generate_pairs_from_task.py +9 -56
- wisent/core/cli/generate_vector_from_task.py +4 -0
- wisent/core/cli/geometry_search.py +137 -0
- wisent/core/cli/get_activations.py +13 -37
- wisent/core/cli/method_optimizer.py +860 -0
- wisent/core/cli/modify_weights.py +3 -2
- wisent/core/cli/optimize.py +44 -5
- wisent/core/cli/optimize_classification.py +5 -6
- wisent/core/cli/optimize_sample_size.py +9 -23
- wisent/core/cli/optimize_steering.py +433 -159
- wisent/core/cli/optimize_weights.py +67 -7
- wisent/core/cli/preview_pairs.py +203 -0
- wisent/core/cli/steering_method_trainer.py +8 -7
- wisent/core/cli/steering_search_space.py +20 -15
- wisent/core/cli/tasks.py +31 -117
- wisent/core/cli/train_unified_goodness.py +18 -19
- wisent/core/contrastive_pairs/diagnostics/control_vectors.py +1582 -177
- wisent/core/contrastive_pairs/diagnostics/linearity.py +70 -80
- wisent/core/contrastive_pairs/diagnostics/vector_quality.py +6 -5
- wisent/core/contrastive_pairs/huggingface_pairs/hf_extractor_manifest.py +5 -19
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/__init__.py +11 -5
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/agentic_search.py +37 -347
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/aider_polyglot.py +113 -136
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/apps.py +146 -32
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/codeforces.py +2 -12
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/codexglue.py +2 -2
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/coding_benchmarks.py +124 -504
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/faithbench.py +40 -63
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/flames.py +46 -89
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/flores.py +15 -4
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/frames.py +36 -20
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/hallucinations_leaderboard.py +3 -45
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/humaneval.py +98 -57
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/livemathbench.py +42 -4
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/longform_writing.py +2 -112
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/math500.py +39 -4
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/medium_priority_benchmarks.py +475 -525
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/mercury.py +65 -42
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/olympiadbench.py +2 -12
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/planbench.py +78 -219
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/polymath.py +37 -4
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/recode.py +84 -69
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/refusalbench.py +168 -160
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/simpleqa.py +44 -25
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/tau_bench.py +3 -103
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/toolbench.py +3 -97
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/toolemu.py +48 -182
- wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/code_x_glue.py +8 -8
- wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/freebase.py +1 -1
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_extractor_manifest.py +11 -5
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_extractor_registry.py +19 -1
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/aclue.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/acp_bench.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/acp_bench_hard.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/advanced.py +2 -4
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/aexams.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/afrimmlu.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/afrixnli.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/agieval_aqua_rat.py +129 -0
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arabculture.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arabic.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arabic_exams.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arabic_leaderboard_complete.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arabic_leaderboard_light.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arabicmmlu.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/aradice.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arc.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arc_challenge.py +1 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arc_easy.py +1 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arithmetic.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/asdiv.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/babi.py +36 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/basque_bench.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/bbq.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/belebele.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/benchmarks.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/bertaqa.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/bhs.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/bhtc.py +3 -5
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/blimp.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/blimp_nl.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/boolq.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/c4.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/cabbq.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/careqa.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/catalan_bench.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/catalanqa.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/catcola.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/cb.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/ceval.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/ceval_valid.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/chain.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/chartqa.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/claim.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/click.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/cmmlu.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/cnn.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/cocoteros.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/code_x_glue.py +11 -6
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/coedit.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/commonsense.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/commonsense_qa.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/copa.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/copal_id.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/coqa.py +3 -4
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/csatqa.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/cycle.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/darija_bench.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/darijahellaswag.py +2 -6
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/darijammlu.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/dbpedia.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/discrim_eval.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/doc.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/drop.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/epec.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eq.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eq_bench.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eq_bench_ca.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eq_bench_es.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/esbbq.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/ethics.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eus.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eus_exams.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eus_proficiency.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eus_reading.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eus_trivia.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/evalita_llm.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/financial.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/flan.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/french_bench.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/galician_bench.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/gaokao.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/glianorex.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/global_mmlu.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/global_piqa.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/gpt3.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/groundcocoa.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/gsm8k.py +1 -1
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/haerae.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/headqa.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/hellaswag.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/hendrycks_ethics.py +5 -9
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/hendrycks_math.py +63 -16
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/histoires_morales.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/hrm8k.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/humaneval_infilling.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/icelandic_winogrande.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/inverse.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/inverse_scaling.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/ja.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/japanese_leaderboard.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/japanese_leaderboard_mc.py +1 -1
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/kmmlu.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/kobest.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/kormedmcqa.py +5 -17
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/lambada_cloze.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/lambada_multilingual.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/law.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/leaderboard.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/lingoly.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/llama3.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/lm_syneval.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/logiqa.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/logiqa2.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/longbench.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/longbenchv2.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mastermind.py +2 -4
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mbpp.py +47 -6
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mc-taco.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/med_concepts_qa.py +2 -4
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/meddialog.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/medical.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/medmcqa.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/medqa.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mela.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/metabench.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/minerva_math.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mmlu.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mmlusr.py +3 -4
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mrpc.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/multiblimp.py +2 -5
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/multirc.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mutual.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/non.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/noreval.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/noreval_exact.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/noreval_gen_exact.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/noreval_mc.py +4 -8
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/noreval_mc_log_likelihoods.py +4 -8
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/nq_open.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/okapi_arc_multilingual.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/okapi_hellaswag_multilingual.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/okapi_mmlu_multilingual.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/okapi_truthfulqa_multilingual.py +2 -5
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/olaph.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/openbookqa.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/option.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/parafraseja.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/parafrases.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/paws.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/paws_x.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/pawsx.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/persona.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/phrases.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/pile.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/piqa.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/portuguese_bench.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/prompt.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/prost.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/pubmedqa.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/qa4mre.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/qasper.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/qasper_bool.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/qnli.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/qnlieu.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/qqp.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/race.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/random.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/record.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/reversed.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/rte.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/ruler.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/sciq.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/score.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/scrolls.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/scrolls_mc.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/self.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/sglue.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/sglue_rte.py +2 -1
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/siqa.py +4 -7
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/social_iqa.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/spanish_bench.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/storycloze.py +2 -6
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/summarization.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/super.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/super_glue.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/swag.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/swde.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/sycophancy.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/t0.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/teca.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tinyarc.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tinybenchmarks.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tinygsm8k.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tinyhellaswag.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tinymmlu.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tinytruthfulqa.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tinywinogrande.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tmmluplus.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/triviaqa.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/truthfulqa.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/truthfulqa_mc1.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/truthfulqa_mc2.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/turblimp_core.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/turkishmmlu.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/turkishmmlu_mc.py +0 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/unscramble.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/vaxx.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/webqs.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/wic.py +3 -4
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/winogrande.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/wmdp.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/wnli.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/wsc.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/wsc273.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/xcopa.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/xlsum.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/xnli.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/xquad.py +2 -4
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/xstorycloze.py +2 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/xwinograd.py +2 -2
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/zhoblimp.py +1 -3
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_pairs_generation.py +173 -6
- wisent/core/data_loaders/loaders/lm_loader.py +12 -1
- wisent/core/evaluators/benchmark_specific/apps_evaluator.py +133 -0
- wisent/core/evaluators/benchmark_specific/coding/metrics/evaluator.py +6 -1
- wisent/core/evaluators/benchmark_specific/conala_evaluator.py +31 -168
- wisent/core/evaluators/custom/examples/humanization_coherent.py +89 -35
- wisent/core/evaluators/oracles/truthfulqa_gen_evaluator.py +2 -20
- wisent/core/evaluators/personalization/coherence.py +46 -0
- wisent/core/geometry_runner.py +995 -0
- wisent/core/geometry_search_space.py +237 -0
- wisent/core/hyperparameter_optimizer.py +14 -14
- wisent/core/lm_eval_harness_ground_truth.py +7 -11
- wisent/core/main.py +6 -0
- wisent/core/models/core/atoms.py +5 -3
- wisent/core/models/wisent_model.py +9 -8
- wisent/core/opti/methods/opti_weights.py +29 -2
- wisent/core/optuna/classifier/activation_generator.py +14 -12
- wisent/core/optuna/classifier/optuna_classifier_optimizer.py +2 -2
- wisent/core/optuna/steering/steering_optimization.py +14 -9
- wisent/core/parser_arguments/check_linearity_parser.py +12 -2
- wisent/core/parser_arguments/cluster_benchmarks_parser.py +31 -0
- wisent/core/parser_arguments/generate_vector_from_synthetic_parser.py +2 -2
- wisent/core/parser_arguments/generate_vector_from_task_parser.py +22 -2
- wisent/core/parser_arguments/geometry_search_parser.py +61 -0
- wisent/core/parser_arguments/main_parser.py +16 -0
- wisent/core/parser_arguments/optimize_steering_parser.py +117 -10
- wisent/core/parser_arguments/optimize_weights_parser.py +6 -0
- wisent/core/parser_arguments/tasks_parser.py +7 -19
- wisent/core/parser_arguments/train_unified_goodness_parser.py +2 -2
- wisent/core/steering.py +5 -3
- wisent/core/steering_methods/core/atoms.py +1 -2
- wisent/core/steering_methods/methods/caa.py +1 -1
- wisent/core/steering_methods/methods/hyperplane.py +75 -0
- wisent/core/steering_methods/methods/prism.py +1 -2
- wisent/core/steering_methods/methods/pulse.py +39 -8
- wisent/core/steering_methods/methods/titan.py +59 -14
- wisent/core/steering_methods/registry.py +52 -12
- wisent/core/steering_optimizer.py +15 -15
- wisent/core/synthetic/generators/nonsense_generator.py +30 -18
- wisent/core/trainers/steering_trainer.py +11 -20
- wisent/core/utils/device.py +27 -27
- wisent/core/utils/layer_combinations.py +70 -0
- wisent/examples/__init__.py +1 -0
- wisent/examples/scripts/__init__.py +1 -0
- wisent/examples/scripts/count_all_benchmarks.py +121 -0
- wisent/examples/scripts/discover_directions.py +469 -0
- wisent/examples/scripts/extract_benchmark_info.py +71 -0
- wisent/examples/scripts/generate_paper_data.py +384 -0
- wisent/examples/scripts/intervention_validation.py +626 -0
- wisent/examples/scripts/results/test_AraDiCE_ArabicMMLU_lev_evaluation.json +324 -0
- wisent/examples/scripts/results/test_AraDiCE_ArabicMMLU_lev_pairs.json +92 -0
- wisent/examples/scripts/results/test_aexams_IslamicStudies_evaluation.json +324 -0
- wisent/examples/scripts/results/test_aexams_IslamicStudies_pairs.json +92 -0
- wisent/examples/scripts/results/test_afrimgsm_pairs.json +92 -0
- wisent/examples/scripts/results/test_afrimmlu_evaluation.json +324 -0
- wisent/examples/scripts/results/test_afrimmlu_pairs.json +92 -0
- wisent/examples/scripts/search_all_short_names.py +31 -0
- wisent/examples/scripts/test_all_benchmarks.py +138 -0
- wisent/examples/scripts/test_all_benchmarks_new.py +28 -0
- wisent/examples/scripts/test_contrastive_pairs_all_supported.py +230 -0
- wisent/examples/scripts/test_nonsense_baseline.py +261 -0
- wisent/examples/scripts/test_one_benchmark.py +324 -0
- wisent/examples/scripts/test_one_coding_benchmark.py +293 -0
- wisent/examples/scripts/threshold_analysis.py +434 -0
- wisent/examples/scripts/visualization_gallery.py +582 -0
- wisent/parameters/lm_eval/broken_in_lm_eval.json +179 -2
- wisent/parameters/lm_eval/category_directions.json +137 -0
- wisent/parameters/lm_eval/repair_plan.json +282 -0
- wisent/parameters/lm_eval/track_progress_not_lm_eval_tasks.json +19 -70
- wisent/parameters/lm_eval/weak_contrastive_pairs.json +38 -0
- wisent/parameters/lm_eval/working_benchmarks.json +206 -0
- wisent/parameters/lm_eval/working_benchmarks_categorized.json +236 -0
- wisent/scripts/run_quality_metrics_sweep.sh +22 -27
- wisent/tests/test_aggregation_geometry.py +236 -0
- wisent/tests/test_detector_accuracy.py +163 -0
- wisent/tests/test_geometry_exhaustive.py +1202 -0
- wisent/tests/visualize_geometry.py +255 -61
- {wisent-0.7.379.dist-info → wisent-0.7.901.dist-info}/METADATA +1 -1
- {wisent-0.7.379.dist-info → wisent-0.7.901.dist-info}/RECORD +376 -974
- wisent/core/activations/prompt_construction_strategy.py +0 -47
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/browsecomp.py +0 -245
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/codexglue_code_to_text.py +0 -15
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/codexglue_code_to_text_go.py +0 -64
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/codexglue_code_to_text_java.py +0 -65
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/codexglue_code_to_text_javascript.py +0 -65
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/codexglue_code_to_text_php.py +0 -65
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/codexglue_code_to_text_python.py +0 -65
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/codexglue_code_to_text_ruby.py +0 -65
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/freebase.py +0 -99
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/instruct_humaneval.py +0 -180
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/instructhumaneval.py +0 -129
- wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/mbpp.py +0 -142
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/agieval.py +0 -155
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/code2text.py +0 -161
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/codexglue.py +0 -107
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/livemathbench.py +0 -155
- wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/polymath.py +0 -155
- wisent/examples/scripts/results/benchmark_descriptions.json +0 -1244
- wisent/examples/scripts/results/benchmark_evaluation_methods.json +0 -66
- wisent/examples/scripts/results/benchmark_evaluator_mapping.json +0 -2781
- wisent/examples/scripts/results/benchmark_evaluator_mapping_updated.json +0 -30536
- wisent/examples/scripts/results/benchmark_evaluators_clean.json +0 -469
- wisent/examples/scripts/results/benchmark_methods_summary.json +0 -260
- wisent/examples/scripts/results/benchmark_pair_creation_methods.json +0 -66
- wisent/examples/scripts/results/benchmark_pair_totals.json +0 -269
- wisent/examples/scripts/results/benchmark_tags.json +0 -917
- wisent/examples/scripts/results/benchmark_test_summary_nov4.json +0 -71
- wisent/examples/scripts/results/coding_benchmarks_test_code_status.json +0 -150
- wisent/examples/scripts/results/failing_benchmarks.json +0 -946
- wisent/examples/scripts/results/failing_benchmarks_list.json +0 -41
- wisent/examples/scripts/results/failing_benchmarks_test_results.json +0 -945
- wisent/examples/scripts/results/missing_benchmark_tags.json +0 -341
- wisent/examples/scripts/results/test_20_newsgroups_evaluation.json +0 -30
- wisent/examples/scripts/results/test_20_newsgroups_pairs.json +0 -8
- wisent/examples/scripts/results/test_AraDICE_evaluation.json +0 -51
- wisent/examples/scripts/results/test_AraDICE_pairs.json +0 -14
- wisent/examples/scripts/results/test_AraDiCE_boolq_egy/test_AraDiCE_boolq_egy_evaluation.json +0 -30
- wisent/examples/scripts/results/test_AraDiCE_boolq_egy/test_AraDiCE_boolq_egy_pairs.json +0 -8
- wisent/examples/scripts/results/test_ArabCulture_evaluation.json +0 -51
- wisent/examples/scripts/results/test_ArabCulture_pairs.json +0 -14
- wisent/examples/scripts/results/test_Tag_evaluation.json +0 -30
- wisent/examples/scripts/results/test_Tag_pairs.json +0 -8
- wisent/examples/scripts/results/test_aclue_evaluation.json +0 -51
- wisent/examples/scripts/results/test_aclue_pairs.json +0 -14
- wisent/examples/scripts/results/test_acp_bench_evaluation.json +0 -51
- wisent/examples/scripts/results/test_acp_bench_hard_evaluation.json +0 -51
- wisent/examples/scripts/results/test_acp_bench_hard_pairs.json +0 -14
- wisent/examples/scripts/results/test_acp_bench_pairs.json +0 -14
- wisent/examples/scripts/results/test_advanced_ai_risk_evaluation.json +0 -51
- wisent/examples/scripts/results/test_advanced_ai_risk_pairs.json +0 -14
- wisent/examples/scripts/results/test_aexams_evaluation.json +0 -51
- wisent/examples/scripts/results/test_aexams_pairs.json +0 -14
- wisent/examples/scripts/results/test_afrimgsm_direct_amh_evaluation.json +0 -30
- wisent/examples/scripts/results/test_afrimgsm_direct_amh_pairs.json +0 -8
- wisent/examples/scripts/results/test_afrimmlu_direct_amh_evaluation.json +0 -30
- wisent/examples/scripts/results/test_afrimmlu_direct_amh_pairs.json +0 -8
- wisent/examples/scripts/results/test_afrixnli_en_direct_amh_evaluation.json +0 -30
- wisent/examples/scripts/results/test_afrixnli_en_direct_amh_pairs.json +0 -8
- wisent/examples/scripts/results/test_ag_news_evaluation.json +0 -30
- wisent/examples/scripts/results/test_ag_news_pairs.json +0 -8
- wisent/examples/scripts/results/test_agieval_evaluation.json +0 -51
- wisent/examples/scripts/results/test_agieval_pairs.json +0 -14
- wisent/examples/scripts/results/test_aime2024_evaluation.json +0 -30
- wisent/examples/scripts/results/test_aime2024_pairs.json +0 -8
- wisent/examples/scripts/results/test_aime2025_evaluation.json +0 -30
- wisent/examples/scripts/results/test_aime2025_pairs.json +0 -8
- wisent/examples/scripts/results/test_aime_evaluation.json +0 -30
- wisent/examples/scripts/results/test_aime_pairs.json +0 -8
- wisent/examples/scripts/results/test_anagrams1_evaluation.json +0 -30
- wisent/examples/scripts/results/test_anagrams1_pairs.json +0 -8
- wisent/examples/scripts/results/test_anagrams2_evaluation.json +0 -30
- wisent/examples/scripts/results/test_anagrams2_pairs.json +0 -8
- wisent/examples/scripts/results/test_anli_evaluation.json +0 -30
- wisent/examples/scripts/results/test_anli_pairs.json +0 -8
- wisent/examples/scripts/results/test_apps_evaluation.json +0 -30
- wisent/examples/scripts/results/test_apps_pairs.json +0 -8
- wisent/examples/scripts/results/test_arabic_exams_evaluation.json +0 -30
- wisent/examples/scripts/results/test_arabic_exams_pairs.json +0 -8
- wisent/examples/scripts/results/test_arabic_leaderboard_complete_evaluation.json +0 -51
- wisent/examples/scripts/results/test_arabic_leaderboard_complete_pairs.json +0 -14
- wisent/examples/scripts/results/test_arabic_leaderboard_light_evaluation.json +0 -51
- wisent/examples/scripts/results/test_arabic_leaderboard_light_pairs.json +0 -14
- wisent/examples/scripts/results/test_arabicmmlu_evaluation.json +0 -51
- wisent/examples/scripts/results/test_arabicmmlu_pairs.json +0 -14
- wisent/examples/scripts/results/test_aradice/test_aradice_evaluation.json +0 -51
- wisent/examples/scripts/results/test_aradice/test_aradice_pairs.json +0 -14
- wisent/examples/scripts/results/test_aradice3/test_aradice_evaluation.json +0 -51
- wisent/examples/scripts/results/test_aradice3/test_aradice_pairs.json +0 -14
- wisent/examples/scripts/results/test_arc_ar_evaluation.json +0 -30
- wisent/examples/scripts/results/test_arc_ar_pairs.json +0 -8
- wisent/examples/scripts/results/test_arc_challenge_evaluation.json +0 -30
- wisent/examples/scripts/results/test_arc_challenge_pairs.json +0 -8
- wisent/examples/scripts/results/test_arc_easy_evaluation.json +0 -30
- wisent/examples/scripts/results/test_arc_easy_pairs.json +0 -8
- wisent/examples/scripts/results/test_argument_topic_evaluation.json +0 -30
- wisent/examples/scripts/results/test_argument_topic_pairs.json +0 -8
- wisent/examples/scripts/results/test_arithmetic_evaluation.json +0 -51
- wisent/examples/scripts/results/test_arithmetic_pairs.json +0 -14
- wisent/examples/scripts/results/test_asdiv_evaluation.json +0 -30
- wisent/examples/scripts/results/test_asdiv_pairs.json +0 -8
- wisent/examples/scripts/results/test_assin_entailment_evaluation.json +0 -30
- wisent/examples/scripts/results/test_assin_entailment_pairs.json +0 -8
- wisent/examples/scripts/results/test_atis_evaluation.json +0 -30
- wisent/examples/scripts/results/test_atis_pairs.json +0 -8
- wisent/examples/scripts/results/test_babi_evaluation.json +0 -30
- wisent/examples/scripts/results/test_babi_pairs.json +0 -8
- wisent/examples/scripts/results/test_babilong_evaluation.json +0 -30
- wisent/examples/scripts/results/test_babilong_pairs.json +0 -8
- wisent/examples/scripts/results/test_bangla_mmlu_evaluation.json +0 -30
- wisent/examples/scripts/results/test_bangla_mmlu_pairs.json +0 -8
- wisent/examples/scripts/results/test_banking77_evaluation.json +0 -30
- wisent/examples/scripts/results/test_banking77_pairs.json +0 -8
- wisent/examples/scripts/results/test_basque/test_basque-glue_pairs.json +0 -14
- wisent/examples/scripts/results/test_basque-glue_evaluation.json +0 -51
- wisent/examples/scripts/results/test_basque-glue_pairs.json +0 -14
- wisent/examples/scripts/results/test_basque2/test_basque-glue_evaluation.json +0 -51
- wisent/examples/scripts/results/test_basque2/test_basque-glue_pairs.json +0 -14
- wisent/examples/scripts/results/test_basque_bench_evaluation.json +0 -51
- wisent/examples/scripts/results/test_basque_bench_pairs.json +0 -14
- wisent/examples/scripts/results/test_basque_glue/test_basque-glue_evaluation.json +0 -51
- wisent/examples/scripts/results/test_basque_glue/test_basque-glue_pairs.json +0 -14
- wisent/examples/scripts/results/test_basqueglue_evaluation.json +0 -51
- wisent/examples/scripts/results/test_basqueglue_pairs.json +0 -14
- wisent/examples/scripts/results/test_bbh_evaluation.json +0 -51
- wisent/examples/scripts/results/test_bbh_pairs.json +0 -14
- wisent/examples/scripts/results/test_bbq_evaluation.json +0 -30
- wisent/examples/scripts/results/test_bbq_pairs.json +0 -8
- wisent/examples/scripts/results/test_bec2016eu_evaluation.json +0 -51
- wisent/examples/scripts/results/test_bec2016eu_pairs.json +0 -14
- wisent/examples/scripts/results/test_belebele_evaluation.json +0 -51
- wisent/examples/scripts/results/test_belebele_pairs.json +0 -14
- wisent/examples/scripts/results/test_benchmarks_evaluation.json +0 -51
- wisent/examples/scripts/results/test_benchmarks_pairs.json +0 -14
- wisent/examples/scripts/results/test_bertaqa_evaluation.json +0 -51
- wisent/examples/scripts/results/test_bertaqa_pairs.json +0 -14
- wisent/examples/scripts/results/test_bhtc_v2_evaluation.json +0 -30
- wisent/examples/scripts/results/test_bhtc_v2_pairs.json +0 -8
- wisent/examples/scripts/results/test_bigbench_evaluation.json +0 -51
- wisent/examples/scripts/results/test_bigbench_pairs.json +0 -14
- wisent/examples/scripts/results/test_blimp_evaluation.json +0 -51
- wisent/examples/scripts/results/test_blimp_pairs.json +0 -14
- wisent/examples/scripts/results/test_boolq/test_boolq_evaluation.json +0 -30
- wisent/examples/scripts/results/test_boolq/test_boolq_pairs.json +0 -8
- wisent/examples/scripts/results/test_boolq-seq2seq_evaluation.json +0 -30
- wisent/examples/scripts/results/test_boolq-seq2seq_pairs.json +0 -8
- wisent/examples/scripts/results/test_boolq_evaluation.json +0 -30
- wisent/examples/scripts/results/test_boolq_pairs.json +0 -8
- wisent/examples/scripts/results/test_c4_evaluation.json +0 -30
- wisent/examples/scripts/results/test_c4_pairs.json +0 -8
- wisent/examples/scripts/results/test_cabreu_evaluation.json +0 -30
- wisent/examples/scripts/results/test_cabreu_pairs.json +0 -8
- wisent/examples/scripts/results/test_careqa_evaluation.json +0 -30
- wisent/examples/scripts/results/test_careqa_pairs.json +0 -8
- wisent/examples/scripts/results/test_catalan_bench_evaluation.json +0 -51
- wisent/examples/scripts/results/test_catalan_bench_pairs.json +0 -14
- wisent/examples/scripts/results/test_catalanqa_evaluation.json +0 -30
- wisent/examples/scripts/results/test_catalanqa_pairs.json +0 -8
- wisent/examples/scripts/results/test_catcola_evaluation.json +0 -30
- wisent/examples/scripts/results/test_catcola_pairs.json +0 -8
- wisent/examples/scripts/results/test_cb_evaluation.json +0 -30
- wisent/examples/scripts/results/test_cb_pairs.json +0 -8
- wisent/examples/scripts/results/test_ceval/test_ceval_evaluation.json +0 -51
- wisent/examples/scripts/results/test_ceval/test_ceval_pairs.json +0 -14
- wisent/examples/scripts/results/test_ceval_accountant/test_ceval-valid_accountant_evaluation.json +0 -30
- wisent/examples/scripts/results/test_ceval_accountant/test_ceval-valid_accountant_pairs.json +0 -8
- wisent/examples/scripts/results/test_ceval_evaluation.json +0 -51
- wisent/examples/scripts/results/test_ceval_pairs.json +0 -14
- wisent/examples/scripts/results/test_ceval_valid/test_ceval_valid_evaluation.json +0 -51
- wisent/examples/scripts/results/test_ceval_valid/test_ceval_valid_pairs.json +0 -14
- wisent/examples/scripts/results/test_chain_of_thought_evaluation.json +0 -51
- wisent/examples/scripts/results/test_chain_of_thought_pairs.json +0 -14
- wisent/examples/scripts/results/test_chartqa_evaluation.json +0 -30
- wisent/examples/scripts/results/test_chartqa_pairs.json +0 -8
- wisent/examples/scripts/results/test_claim_stance_topic_evaluation.json +0 -30
- wisent/examples/scripts/results/test_claim_stance_topic_pairs.json +0 -8
- wisent/examples/scripts/results/test_cmmlu_evaluation.json +0 -51
- wisent/examples/scripts/results/test_cmmlu_pairs.json +0 -14
- wisent/examples/scripts/results/test_cnn_dailymail_evaluation.json +0 -30
- wisent/examples/scripts/results/test_cnn_dailymail_pairs.json +0 -8
- wisent/examples/scripts/results/test_cocoteros_es_evaluation.json +0 -30
- wisent/examples/scripts/results/test_cocoteros_es_pairs.json +0 -8
- wisent/examples/scripts/results/test_codexglue_code_to_text_go_evaluation.json +0 -30
- wisent/examples/scripts/results/test_codexglue_code_to_text_go_pairs.json +0 -8
- wisent/examples/scripts/results/test_codexglue_code_to_text_java_evaluation.json +0 -30
- wisent/examples/scripts/results/test_codexglue_code_to_text_java_pairs.json +0 -8
- wisent/examples/scripts/results/test_codexglue_code_to_text_javascript_evaluation.json +0 -30
- wisent/examples/scripts/results/test_codexglue_code_to_text_javascript_pairs.json +0 -8
- wisent/examples/scripts/results/test_codexglue_code_to_text_php_evaluation.json +0 -30
- wisent/examples/scripts/results/test_codexglue_code_to_text_php_pairs.json +0 -8
- wisent/examples/scripts/results/test_codexglue_code_to_text_python_evaluation.json +0 -30
- wisent/examples/scripts/results/test_codexglue_code_to_text_python_pairs.json +0 -8
- wisent/examples/scripts/results/test_codexglue_code_to_text_ruby_evaluation.json +0 -30
- wisent/examples/scripts/results/test_codexglue_code_to_text_ruby_pairs.json +0 -8
- wisent/examples/scripts/results/test_coedit_gec_evaluation.json +0 -30
- wisent/examples/scripts/results/test_coedit_gec_pairs.json +0 -8
- wisent/examples/scripts/results/test_cola_evaluation.json +0 -30
- wisent/examples/scripts/results/test_cola_pairs.json +0 -8
- wisent/examples/scripts/results/test_commonsense_qa_evaluation.json +0 -30
- wisent/examples/scripts/results/test_commonsense_qa_pairs.json +0 -8
- wisent/examples/scripts/results/test_conala_evaluation.json +0 -30
- wisent/examples/scripts/results/test_conala_pairs.json +0 -8
- wisent/examples/scripts/results/test_concode_evaluation.json +0 -30
- wisent/examples/scripts/results/test_concode_pairs.json +0 -8
- wisent/examples/scripts/results/test_copa_evaluation.json +0 -30
- wisent/examples/scripts/results/test_copa_pairs.json +0 -8
- wisent/examples/scripts/results/test_copal_id_evaluation.json +0 -30
- wisent/examples/scripts/results/test_copal_id_pairs.json +0 -8
- wisent/examples/scripts/results/test_coqa_evaluation.json +0 -30
- wisent/examples/scripts/results/test_coqa_pairs.json +0 -8
- wisent/examples/scripts/results/test_coqcat_evaluation.json +0 -30
- wisent/examples/scripts/results/test_coqcat_pairs.json +0 -8
- wisent/examples/scripts/results/test_crows_pairs_evaluation.json +0 -51
- wisent/examples/scripts/results/test_crows_pairs_pairs.json +0 -14
- wisent/examples/scripts/results/test_csatqa_evaluation.json +0 -51
- wisent/examples/scripts/results/test_csatqa_pairs.json +0 -14
- wisent/examples/scripts/results/test_cycle_letters_evaluation.json +0 -30
- wisent/examples/scripts/results/test_cycle_letters_pairs.json +0 -8
- wisent/examples/scripts/results/test_darija_bench/test_darija_bench_evaluation.json +0 -51
- wisent/examples/scripts/results/test_darija_bench/test_darija_bench_pairs.json +0 -14
- wisent/examples/scripts/results/test_darija_bench_evaluation.json +0 -51
- wisent/examples/scripts/results/test_darija_bench_pairs.json +0 -14
- wisent/examples/scripts/results/test_darijahellaswag_evaluation.json +0 -30
- wisent/examples/scripts/results/test_darijahellaswag_pairs.json +0 -8
- wisent/examples/scripts/results/test_darijammlu_evaluation.json +0 -51
- wisent/examples/scripts/results/test_darijammlu_pairs.json +0 -14
- wisent/examples/scripts/results/test_dbpedia_14_evaluation.json +0 -30
- wisent/examples/scripts/results/test_dbpedia_14_pairs.json +0 -8
- wisent/examples/scripts/results/test_drop_evaluation.json +0 -30
- wisent/examples/scripts/results/test_drop_pairs.json +0 -8
- wisent/examples/scripts/results/test_ds1000_evaluation.json +0 -30
- wisent/examples/scripts/results/test_ds1000_pairs.json +0 -8
- wisent/examples/scripts/results/test_egyhellaswag_evaluation.json +0 -30
- wisent/examples/scripts/results/test_egyhellaswag_pairs.json +0 -8
- wisent/examples/scripts/results/test_egymmlu_evaluation.json +0 -51
- wisent/examples/scripts/results/test_egymmlu_pairs.json +0 -14
- wisent/examples/scripts/results/test_epec_koref_bin_evaluation.json +0 -30
- wisent/examples/scripts/results/test_epec_koref_bin_pairs.json +0 -8
- wisent/examples/scripts/results/test_eq_bench_evaluation.json +0 -30
- wisent/examples/scripts/results/test_eq_bench_pairs.json +0 -8
- wisent/examples/scripts/results/test_escola_evaluation.json +0 -30
- wisent/examples/scripts/results/test_escola_pairs.json +0 -8
- wisent/examples/scripts/results/test_ethics_cm_evaluation.json +0 -30
- wisent/examples/scripts/results/test_ethics_cm_pairs.json +0 -8
- wisent/examples/scripts/results/test_ethos_binary_evaluation.json +0 -30
- wisent/examples/scripts/results/test_ethos_binary_pairs.json +0 -8
- wisent/examples/scripts/results/test_eus_exams/test_eus_exams_evaluation.json +0 -51
- wisent/examples/scripts/results/test_eus_exams/test_eus_exams_pairs.json +0 -14
- wisent/examples/scripts/results/test_eus_exams_es_evaluation.json +0 -51
- wisent/examples/scripts/results/test_eus_exams_es_pairs.json +0 -14
- wisent/examples/scripts/results/test_eus_exams_evaluation.json +0 -51
- wisent/examples/scripts/results/test_eus_exams_pairs.json +0 -14
- wisent/examples/scripts/results/test_eus_proficiency_evaluation.json +0 -30
- wisent/examples/scripts/results/test_eus_proficiency_pairs.json +0 -8
- wisent/examples/scripts/results/test_eus_reading_evaluation.json +0 -30
- wisent/examples/scripts/results/test_eus_reading_pairs.json +0 -8
- wisent/examples/scripts/results/test_eus_trivia_evaluation.json +0 -30
- wisent/examples/scripts/results/test_eus_trivia_pairs.json +0 -8
- wisent/examples/scripts/results/test_evalita-mp_evaluation.json +0 -51
- wisent/examples/scripts/results/test_evalita-mp_pairs.json +0 -14
- wisent/examples/scripts/results/test_evalita-sp_sum_task_fp-small_p1_evaluation.json +0 -30
- wisent/examples/scripts/results/test_evalita-sp_sum_task_fp-small_p1_pairs.json +0 -8
- wisent/examples/scripts/results/test_evalita_LLM_evaluation.json +0 -51
- wisent/examples/scripts/results/test_evalita_LLM_pairs.json +0 -14
- wisent/examples/scripts/results/test_evalita_llm/test_evalita_llm_evaluation.json +0 -51
- wisent/examples/scripts/results/test_evalita_llm/test_evalita_llm_pairs.json +0 -14
- wisent/examples/scripts/results/test_evalita_mp/test_evalita-mp_te_prompt-1_evaluation.json +0 -30
- wisent/examples/scripts/results/test_evalita_mp/test_evalita-mp_te_prompt-1_pairs.json +0 -8
- wisent/examples/scripts/results/test_evalita_mp2/test_evalita_mp_evaluation.json +0 -51
- wisent/examples/scripts/results/test_evalita_mp2/test_evalita_mp_pairs.json +0 -14
- wisent/examples/scripts/results/test_evalita_sp2/test_evalita-sp_sum_task_fp-small_p1_evaluation.json +0 -30
- wisent/examples/scripts/results/test_evalita_sp2/test_evalita-sp_sum_task_fp-small_p1_pairs.json +0 -8
- wisent/examples/scripts/results/test_fda_evaluation.json +0 -30
- wisent/examples/scripts/results/test_fda_pairs.json +0 -8
- wisent/examples/scripts/results/test_financial_tweets_evaluation.json +0 -30
- wisent/examples/scripts/results/test_financial_tweets_pairs.json +0 -8
- wisent/examples/scripts/results/test_fld/test_fld_evaluation.json +0 -30
- wisent/examples/scripts/results/test_fld/test_fld_pairs.json +0 -8
- wisent/examples/scripts/results/test_fld_evaluation.json +0 -30
- wisent/examples/scripts/results/test_fld_fixed/test_fld_evaluation.json +0 -30
- wisent/examples/scripts/results/test_fld_fixed/test_fld_pairs.json +0 -8
- wisent/examples/scripts/results/test_fld_pairs.json +0 -8
- wisent/examples/scripts/results/test_flores_evaluation.json +0 -51
- wisent/examples/scripts/results/test_flores_pairs.json +0 -14
- wisent/examples/scripts/results/test_freebase_evaluation.json +0 -30
- wisent/examples/scripts/results/test_freebase_pairs.json +0 -8
- wisent/examples/scripts/results/test_french_bench_evaluation.json +0 -51
- wisent/examples/scripts/results/test_french_bench_pairs.json +0 -14
- wisent/examples/scripts/results/test_galcola_evaluation.json +0 -30
- wisent/examples/scripts/results/test_galcola_pairs.json +0 -8
- wisent/examples/scripts/results/test_galician_bench_evaluation.json +0 -51
- wisent/examples/scripts/results/test_galician_bench_pairs.json +0 -14
- wisent/examples/scripts/results/test_glianorex_evaluation.json +0 -30
- wisent/examples/scripts/results/test_glianorex_pairs.json +0 -8
- wisent/examples/scripts/results/test_global_mmlu_evaluation.json +0 -51
- wisent/examples/scripts/results/test_global_mmlu_pairs.json +0 -14
- wisent/examples/scripts/results/test_glue_evaluation.json +0 -51
- wisent/examples/scripts/results/test_glue_pairs.json +0 -14
- wisent/examples/scripts/results/test_gpqa_evaluation.json +0 -51
- wisent/examples/scripts/results/test_gpqa_pairs.json +0 -14
- wisent/examples/scripts/results/test_gpt3_translation_benchmarks_evaluation.json +0 -51
- wisent/examples/scripts/results/test_gpt3_translation_benchmarks_pairs.json +0 -14
- wisent/examples/scripts/results/test_groundcocoa_evaluation.json +0 -30
- wisent/examples/scripts/results/test_groundcocoa_pairs.json +0 -8
- wisent/examples/scripts/results/test_gsm8k_evaluation.json +0 -30
- wisent/examples/scripts/results/test_gsm8k_pairs.json +0 -8
- wisent/examples/scripts/results/test_haerae_evaluation.json +0 -51
- wisent/examples/scripts/results/test_haerae_pairs.json +0 -14
- wisent/examples/scripts/results/test_headqa_evaluation.json +0 -30
- wisent/examples/scripts/results/test_headqa_pairs.json +0 -8
- wisent/examples/scripts/results/test_hellaswag_evaluation.json +0 -30
- wisent/examples/scripts/results/test_hellaswag_pairs.json +0 -8
- wisent/examples/scripts/results/test_hendrycks_ethics_evaluation.json +0 -51
- wisent/examples/scripts/results/test_hendrycks_ethics_pairs.json +0 -14
- wisent/examples/scripts/results/test_hendrycks_math_evaluation.json +0 -51
- wisent/examples/scripts/results/test_hendrycks_math_pairs.json +0 -14
- wisent/examples/scripts/results/test_histoires_morales_evaluation.json +0 -30
- wisent/examples/scripts/results/test_histoires_morales_pairs.json +0 -8
- wisent/examples/scripts/results/test_hmmt_evaluation.json +0 -30
- wisent/examples/scripts/results/test_hmmt_feb_2025_evaluation.json +0 -30
- wisent/examples/scripts/results/test_hmmt_feb_2025_pairs.json +0 -8
- wisent/examples/scripts/results/test_hmmt_pairs.json +0 -8
- wisent/examples/scripts/results/test_hrm8k_evaluation.json +0 -51
- wisent/examples/scripts/results/test_hrm8k_pairs.json +0 -14
- wisent/examples/scripts/results/test_humaneval_evaluation.json +0 -30
- wisent/examples/scripts/results/test_humaneval_pairs.json +0 -8
- wisent/examples/scripts/results/test_humaneval_plus_evaluation.json +0 -30
- wisent/examples/scripts/results/test_humaneval_plus_pairs.json +0 -8
- wisent/examples/scripts/results/test_ifeval_evaluation.json +0 -30
- wisent/examples/scripts/results/test_ifeval_pairs.json +0 -8
- wisent/examples/scripts/results/test_instruct_humaneval/test_instruct_humaneval_evaluation.json +0 -30
- wisent/examples/scripts/results/test_instruct_humaneval/test_instruct_humaneval_pairs.json +0 -8
- wisent/examples/scripts/results/test_instruct_humaneval_evaluation.json +0 -30
- wisent/examples/scripts/results/test_instruct_humaneval_pairs.json +0 -8
- wisent/examples/scripts/results/test_inverse_scaling_evaluation.json +0 -51
- wisent/examples/scripts/results/test_inverse_scaling_hindsight_neglect_10shot_evaluation.json +0 -30
- wisent/examples/scripts/results/test_inverse_scaling_hindsight_neglect_10shot_pairs.json +0 -8
- wisent/examples/scripts/results/test_inverse_scaling_mc/test_inverse_scaling_mc_evaluation.json +0 -51
- wisent/examples/scripts/results/test_inverse_scaling_mc/test_inverse_scaling_mc_pairs.json +0 -14
- wisent/examples/scripts/results/test_inverse_scaling_pairs.json +0 -14
- wisent/examples/scripts/results/test_iwslt2017-ar-en_evaluation.json +0 -30
- wisent/examples/scripts/results/test_iwslt2017-ar-en_pairs.json +0 -8
- wisent/examples/scripts/results/test_iwslt2017-en-ar_evaluation.json +0 -30
- wisent/examples/scripts/results/test_iwslt2017-en-ar_pairs.json +0 -8
- wisent/examples/scripts/results/test_iwslt2017_ar_en/test_iwslt2017-ar-en_evaluation.json +0 -30
- wisent/examples/scripts/results/test_iwslt2017_ar_en/test_iwslt2017-ar-en_pairs.json +0 -8
- wisent/examples/scripts/results/test_iwslt2017_en_ar/test_iwslt2017-en-ar_evaluation.json +0 -30
- wisent/examples/scripts/results/test_iwslt2017_en_ar/test_iwslt2017-en-ar_pairs.json +0 -8
- wisent/examples/scripts/results/test_iwslt2017_group/test_iwslt2017_evaluation.json +0 -30
- wisent/examples/scripts/results/test_iwslt2017_group/test_iwslt2017_pairs.json +0 -8
- wisent/examples/scripts/results/test_japanese_leaderboard_evaluation.json +0 -51
- wisent/examples/scripts/results/test_japanese_leaderboard_pairs.json +0 -14
- wisent/examples/scripts/results/test_jsonschema_bench/test_jsonschema_bench_evaluation.json +0 -30
- wisent/examples/scripts/results/test_jsonschema_bench/test_jsonschema_bench_pairs.json +0 -8
- wisent/examples/scripts/results/test_jsonschema_bench_evaluation.json +0 -30
- wisent/examples/scripts/results/test_jsonschema_bench_final/test_jsonschema_bench_evaluation.json +0 -30
- wisent/examples/scripts/results/test_jsonschema_bench_final/test_jsonschema_bench_pairs.json +0 -8
- wisent/examples/scripts/results/test_jsonschema_bench_pairs.json +0 -8
- wisent/examples/scripts/results/test_kbl_evaluation.json +0 -51
- wisent/examples/scripts/results/test_kbl_fixed/test_kbl_evaluation.json +0 -51
- wisent/examples/scripts/results/test_kbl_fixed/test_kbl_pairs.json +0 -14
- wisent/examples/scripts/results/test_kbl_pairs.json +0 -14
- wisent/examples/scripts/results/test_kmmlu_evaluation.json +0 -51
- wisent/examples/scripts/results/test_kmmlu_pairs.json +0 -14
- wisent/examples/scripts/results/test_kobest_evaluation.json +0 -51
- wisent/examples/scripts/results/test_kobest_pairs.json +0 -14
- wisent/examples/scripts/results/test_kormedmcqa/test_kormedmcqa_evaluation.json +0 -30
- wisent/examples/scripts/results/test_kormedmcqa/test_kormedmcqa_pairs.json +0 -8
- wisent/examples/scripts/results/test_kormedmcqa_dentist/test_kormedmcqa_dentist_evaluation.json +0 -30
- wisent/examples/scripts/results/test_kormedmcqa_dentist/test_kormedmcqa_dentist_pairs.json +0 -8
- wisent/examples/scripts/results/test_kormedmcqa_evaluation.json +0 -30
- wisent/examples/scripts/results/test_kormedmcqa_pairs.json +0 -8
- wisent/examples/scripts/results/test_lambada_cloze_evaluation.json +0 -30
- wisent/examples/scripts/results/test_lambada_cloze_pairs.json +0 -8
- wisent/examples/scripts/results/test_lambada_evaluation.json +0 -30
- wisent/examples/scripts/results/test_lambada_final/test_lambada_openai_mt_stablelm_en_evaluation.json +0 -30
- wisent/examples/scripts/results/test_lambada_final/test_lambada_openai_mt_stablelm_en_pairs.json +0 -8
- wisent/examples/scripts/results/test_lambada_multilingual/test_lambada_multilingual_evaluation.json +0 -51
- wisent/examples/scripts/results/test_lambada_multilingual/test_lambada_multilingual_pairs.json +0 -14
- wisent/examples/scripts/results/test_lambada_multilingual_evaluation.json +0 -51
- wisent/examples/scripts/results/test_lambada_multilingual_pairs.json +0 -14
- wisent/examples/scripts/results/test_lambada_multilingual_stablelm_evaluation.json +0 -51
- wisent/examples/scripts/results/test_lambada_multilingual_stablelm_pairs.json +0 -14
- wisent/examples/scripts/results/test_lambada_openai_evaluation.json +0 -30
- wisent/examples/scripts/results/test_lambada_openai_pairs.json +0 -8
- wisent/examples/scripts/results/test_lambada_pairs.json +0 -8
- wisent/examples/scripts/results/test_lambada_stablelm_en_fixed/test_lambada_openai_mt_stablelm_en_evaluation.json +0 -30
- wisent/examples/scripts/results/test_lambada_stablelm_en_fixed/test_lambada_openai_mt_stablelm_en_pairs.json +0 -8
- wisent/examples/scripts/results/test_lambada_stablelm_fixed/test_lambada_openai_mt_stablelm_en_evaluation.json +0 -30
- wisent/examples/scripts/results/test_lambada_stablelm_fixed/test_lambada_openai_mt_stablelm_en_pairs.json +0 -8
- wisent/examples/scripts/results/test_lambada_standard_evaluation.json +0 -30
- wisent/examples/scripts/results/test_lambada_standard_pairs.json +0 -8
- wisent/examples/scripts/results/test_leaderboard_evaluation.json +0 -51
- wisent/examples/scripts/results/test_leaderboard_pairs.json +0 -14
- wisent/examples/scripts/results/test_libra/test_libra_evaluation.json +0 -51
- wisent/examples/scripts/results/test_libra/test_libra_pairs.json +0 -14
- wisent/examples/scripts/results/test_libra_evaluation.json +0 -51
- wisent/examples/scripts/results/test_libra_pairs.json +0 -14
- wisent/examples/scripts/results/test_lingoly_evaluation.json +0 -30
- wisent/examples/scripts/results/test_lingoly_pairs.json +0 -8
- wisent/examples/scripts/results/test_livecodebench_evaluation.json +0 -30
- wisent/examples/scripts/results/test_livecodebench_pairs.json +0 -8
- wisent/examples/scripts/results/test_livemathbench_cnmo_en_evaluation.json +0 -30
- wisent/examples/scripts/results/test_livemathbench_cnmo_en_pairs.json +0 -8
- wisent/examples/scripts/results/test_livemathbench_cnmo_zh_evaluation.json +0 -30
- wisent/examples/scripts/results/test_livemathbench_cnmo_zh_pairs.json +0 -8
- wisent/examples/scripts/results/test_llama_evaluation.json +0 -30
- wisent/examples/scripts/results/test_llama_pairs.json +0 -8
- wisent/examples/scripts/results/test_logiqa2_evaluation.json +0 -30
- wisent/examples/scripts/results/test_logiqa2_pairs.json +0 -8
- wisent/examples/scripts/results/test_logiqa_evaluation.json +0 -30
- wisent/examples/scripts/results/test_logiqa_pairs.json +0 -8
- wisent/examples/scripts/results/test_m_mmlu_evaluation.json +0 -51
- wisent/examples/scripts/results/test_m_mmlu_pairs.json +0 -14
- wisent/examples/scripts/results/test_mastermind/test_mastermind_evaluation.json +0 -51
- wisent/examples/scripts/results/test_mastermind/test_mastermind_pairs.json +0 -14
- wisent/examples/scripts/results/test_mastermind_24_easy/test_mastermind_24_easy_evaluation.json +0 -30
- wisent/examples/scripts/results/test_mastermind_24_easy/test_mastermind_24_easy_pairs.json +0 -8
- wisent/examples/scripts/results/test_mastermind_evaluation.json +0 -51
- wisent/examples/scripts/results/test_mastermind_pairs.json +0 -14
- wisent/examples/scripts/results/test_math500_evaluation.json +0 -30
- wisent/examples/scripts/results/test_math500_pairs.json +0 -8
- wisent/examples/scripts/results/test_math_evaluation.json +0 -30
- wisent/examples/scripts/results/test_math_pairs.json +0 -8
- wisent/examples/scripts/results/test_mathqa_evaluation.json +0 -30
- wisent/examples/scripts/results/test_mathqa_pairs.json +0 -8
- wisent/examples/scripts/results/test_mbpp_evaluation.json +0 -30
- wisent/examples/scripts/results/test_mbpp_pairs.json +0 -8
- wisent/examples/scripts/results/test_mbpp_plus_evaluation.json +0 -30
- wisent/examples/scripts/results/test_mbpp_plus_pairs.json +0 -8
- wisent/examples/scripts/results/test_mc_taco_evaluation.json +0 -30
- wisent/examples/scripts/results/test_mc_taco_pairs.json +0 -8
- wisent/examples/scripts/results/test_med_concepts_qa/test_med_concepts_qa_evaluation.json +0 -51
- wisent/examples/scripts/results/test_med_concepts_qa/test_med_concepts_qa_pairs.json +0 -14
- wisent/examples/scripts/results/test_med_concepts_qa_atc_easy/test_med_concepts_qa_atc_easy_evaluation.json +0 -30
- wisent/examples/scripts/results/test_med_concepts_qa_atc_easy/test_med_concepts_qa_atc_easy_pairs.json +0 -8
- wisent/examples/scripts/results/test_med_concepts_qa_evaluation.json +0 -51
- wisent/examples/scripts/results/test_med_concepts_qa_pairs.json +0 -14
- wisent/examples/scripts/results/test_meddialog_evaluation.json +0 -30
- wisent/examples/scripts/results/test_meddialog_pairs.json +0 -8
- wisent/examples/scripts/results/test_meddialog_raw_perplexity/test_meddialog_raw_perplexity_evaluation.json +0 -30
- wisent/examples/scripts/results/test_meddialog_raw_perplexity/test_meddialog_raw_perplexity_pairs.json +0 -8
- wisent/examples/scripts/results/test_mediqa_qa2019_evaluation.json +0 -30
- wisent/examples/scripts/results/test_mediqa_qa2019_pairs.json +0 -8
- wisent/examples/scripts/results/test_medmcqa_evaluation.json +0 -30
- wisent/examples/scripts/results/test_medmcqa_pairs.json +0 -8
- wisent/examples/scripts/results/test_medqa_evaluation.json +0 -30
- wisent/examples/scripts/results/test_medqa_pairs.json +0 -8
- wisent/examples/scripts/results/test_medtext_evaluation.json +0 -30
- wisent/examples/scripts/results/test_medtext_pairs.json +0 -8
- wisent/examples/scripts/results/test_mela_evaluation.json +0 -51
- wisent/examples/scripts/results/test_mela_pairs.json +0 -14
- wisent/examples/scripts/results/test_meqsum_evaluation.json +0 -30
- wisent/examples/scripts/results/test_meqsum_pairs.json +0 -8
- wisent/examples/scripts/results/test_mercury_evaluation.json +0 -30
- wisent/examples/scripts/results/test_mercury_pairs.json +0 -8
- wisent/examples/scripts/results/test_metabench_evaluation.json +0 -51
- wisent/examples/scripts/results/test_metabench_pairs.json +0 -14
- wisent/examples/scripts/results/test_mgsm_evaluation.json +0 -51
- wisent/examples/scripts/results/test_mgsm_pairs.json +0 -14
- wisent/examples/scripts/results/test_mimic_repsum_evaluation.json +0 -30
- wisent/examples/scripts/results/test_mimic_repsum_pairs.json +0 -8
- wisent/examples/scripts/results/test_minerva_math_evaluation.json +0 -51
- wisent/examples/scripts/results/test_minerva_math_pairs.json +0 -14
- wisent/examples/scripts/results/test_mlqa_evaluation.json +0 -51
- wisent/examples/scripts/results/test_mlqa_pairs.json +0 -14
- wisent/examples/scripts/results/test_mmlu-pro-plus_evaluation.json +0 -51
- wisent/examples/scripts/results/test_mmlu-pro-plus_pairs.json +0 -14
- wisent/examples/scripts/results/test_mmlu_evaluation.json +0 -51
- wisent/examples/scripts/results/test_mmlu_pairs.json +0 -14
- wisent/examples/scripts/results/test_mmlu_pro_evaluation.json +0 -51
- wisent/examples/scripts/results/test_mmlu_pro_pairs.json +0 -14
- wisent/examples/scripts/results/test_mmlu_prox_evaluation.json +0 -51
- wisent/examples/scripts/results/test_mmlu_prox_pairs.json +0 -14
- wisent/examples/scripts/results/test_mmlusr_evaluation.json +0 -30
- wisent/examples/scripts/results/test_mmlusr_pairs.json +0 -8
- wisent/examples/scripts/results/test_mmmu_evaluation.json +0 -51
- wisent/examples/scripts/results/test_mmmu_pairs.json +0 -14
- wisent/examples/scripts/results/test_mnli_evaluation.json +0 -30
- wisent/examples/scripts/results/test_mnli_pairs.json +0 -8
- wisent/examples/scripts/results/test_model_written_evals_evaluation.json +0 -51
- wisent/examples/scripts/results/test_model_written_evals_pairs.json +0 -14
- wisent/examples/scripts/results/test_moral_stories_evaluation.json +0 -30
- wisent/examples/scripts/results/test_moral_stories_pairs.json +0 -8
- wisent/examples/scripts/results/test_mts_dialog_evaluation.json +0 -30
- wisent/examples/scripts/results/test_mts_dialog_pairs.json +0 -8
- wisent/examples/scripts/results/test_multiblimp_evaluation.json +0 -51
- wisent/examples/scripts/results/test_multiblimp_pairs.json +0 -14
- wisent/examples/scripts/results/test_multimedqa_evaluation.json +0 -51
- wisent/examples/scripts/results/test_multimedqa_pairs.json +0 -14
- wisent/examples/scripts/results/test_multipl_e_evaluation.json +0 -30
- wisent/examples/scripts/results/test_multipl_e_pairs.json +0 -8
- wisent/examples/scripts/results/test_mutual_evaluation.json +0 -30
- wisent/examples/scripts/results/test_mutual_pairs.json +0 -8
- wisent/examples/scripts/results/test_non_greedy_robustness_agieval_aqua_rat_evaluation.json +0 -30
- wisent/examples/scripts/results/test_non_greedy_robustness_agieval_aqua_rat_pairs.json +0 -8
- wisent/examples/scripts/results/test_noreval_evaluation.json +0 -51
- wisent/examples/scripts/results/test_noreval_pairs.json +0 -14
- wisent/examples/scripts/results/test_noticia_evaluation.json +0 -30
- wisent/examples/scripts/results/test_noticia_pairs.json +0 -8
- wisent/examples/scripts/results/test_nq_open_evaluation.json +0 -30
- wisent/examples/scripts/results/test_nq_open_pairs.json +0 -8
- wisent/examples/scripts/results/test_olaph_evaluation.json +0 -30
- wisent/examples/scripts/results/test_olaph_pairs.json +0 -8
- wisent/examples/scripts/results/test_openbookqa_evaluation.json +0 -30
- wisent/examples/scripts/results/test_openbookqa_pairs.json +0 -8
- wisent/examples/scripts/results/test_openllm_evaluation.json +0 -51
- wisent/examples/scripts/results/test_openllm_pairs.json +0 -14
- wisent/examples/scripts/results/test_option_order_robustness_agieval_aqua_rat_evaluation.json +0 -30
- wisent/examples/scripts/results/test_option_order_robustness_agieval_aqua_rat_pairs.json +0 -8
- wisent/examples/scripts/results/test_paloma_evaluation.json +0 -51
- wisent/examples/scripts/results/test_paloma_pairs.json +0 -14
- wisent/examples/scripts/results/test_passkey/test_passkey_evaluation.json +0 -30
- wisent/examples/scripts/results/test_passkey/test_passkey_pairs.json +0 -8
- wisent/examples/scripts/results/test_paws-x_evaluation.json +0 -51
- wisent/examples/scripts/results/test_paws-x_pairs.json +0 -14
- wisent/examples/scripts/results/test_paws_en/test_paws_en_evaluation.json +0 -30
- wisent/examples/scripts/results/test_paws_en/test_paws_en_pairs.json +0 -8
- wisent/examples/scripts/results/test_penn_treebank_evaluation.json +0 -30
- wisent/examples/scripts/results/test_penn_treebank_pairs.json +0 -8
- wisent/examples/scripts/results/test_pile_10k/test_pile_10k_evaluation.json +0 -30
- wisent/examples/scripts/results/test_pile_10k/test_pile_10k_pairs.json +0 -8
- wisent/examples/scripts/results/test_piqa_evaluation.json +0 -30
- wisent/examples/scripts/results/test_piqa_pairs.json +0 -8
- wisent/examples/scripts/results/test_polemo2_evaluation.json +0 -30
- wisent/examples/scripts/results/test_polemo2_pairs.json +0 -8
- wisent/examples/scripts/results/test_polymath_en_high_evaluation.json +0 -30
- wisent/examples/scripts/results/test_polymath_en_high_pairs.json +0 -8
- wisent/examples/scripts/results/test_polymath_en_medium_evaluation.json +0 -30
- wisent/examples/scripts/results/test_polymath_en_medium_pairs.json +0 -8
- wisent/examples/scripts/results/test_polymath_zh_high_evaluation.json +0 -30
- wisent/examples/scripts/results/test_polymath_zh_high_pairs.json +0 -8
- wisent/examples/scripts/results/test_polymath_zh_medium_evaluation.json +0 -30
- wisent/examples/scripts/results/test_polymath_zh_medium_pairs.json +0 -8
- wisent/examples/scripts/results/test_portuguese_bench_evaluation.json +0 -51
- wisent/examples/scripts/results/test_portuguese_bench_pairs.json +0 -14
- wisent/examples/scripts/results/test_prompt_robustness_agieval_aqua_rat/test_prompt_robustness_agieval_aqua_rat_evaluation.json +0 -30
- wisent/examples/scripts/results/test_prompt_robustness_agieval_aqua_rat/test_prompt_robustness_agieval_aqua_rat_pairs.json +0 -8
- wisent/examples/scripts/results/test_prompt_robustness_agieval_aqua_rat_evaluation.json +0 -30
- wisent/examples/scripts/results/test_prompt_robustness_agieval_aqua_rat_pairs.json +0 -8
- wisent/examples/scripts/results/test_prost_evaluation.json +0 -30
- wisent/examples/scripts/results/test_prost_pairs.json +0 -8
- wisent/examples/scripts/results/test_ptb_evaluation.json +0 -30
- wisent/examples/scripts/results/test_ptb_pairs.json +0 -8
- wisent/examples/scripts/results/test_pubmedqa_evaluation.json +0 -30
- wisent/examples/scripts/results/test_pubmedqa_pairs.json +0 -8
- wisent/examples/scripts/results/test_pythia_evaluation.json +0 -51
- wisent/examples/scripts/results/test_pythia_pairs.json +0 -14
- wisent/examples/scripts/results/test_qa4mre_evaluation.json +0 -30
- wisent/examples/scripts/results/test_qa4mre_pairs.json +0 -8
- wisent/examples/scripts/results/test_qasper_evaluation.json +0 -30
- wisent/examples/scripts/results/test_qasper_pairs.json +0 -8
- wisent/examples/scripts/results/test_race_evaluation.json +0 -30
- wisent/examples/scripts/results/test_race_pairs.json +0 -8
- wisent/examples/scripts/results/test_realtoxicityprompts_evaluation.json +0 -30
- wisent/examples/scripts/results/test_realtoxicityprompts_pairs.json +0 -8
- wisent/examples/scripts/results/test_recode_evaluation.json +0 -30
- wisent/examples/scripts/results/test_recode_pairs.json +0 -8
- wisent/examples/scripts/results/test_record_evaluation.json +0 -30
- wisent/examples/scripts/results/test_record_pairs.json +0 -8
- wisent/examples/scripts/results/test_ruler_evaluation.json +0 -51
- wisent/examples/scripts/results/test_ruler_pairs.json +0 -14
- wisent/examples/scripts/results/test_sciq_evaluation.json +0 -30
- wisent/examples/scripts/results/test_sciq_pairs.json +0 -8
- wisent/examples/scripts/results/test_score_evaluation.json +0 -51
- wisent/examples/scripts/results/test_score_pairs.json +0 -14
- wisent/examples/scripts/results/test_self_consistency_evaluation.json +0 -30
- wisent/examples/scripts/results/test_self_consistency_pairs.json +0 -8
- wisent/examples/scripts/results/test_siqa/test_siqa_evaluation.json +0 -30
- wisent/examples/scripts/results/test_siqa/test_siqa_pairs.json +0 -8
- wisent/examples/scripts/results/test_siqa_evaluation.json +0 -30
- wisent/examples/scripts/results/test_siqa_pairs.json +0 -8
- wisent/examples/scripts/results/test_spanish_bench_evaluation.json +0 -51
- wisent/examples/scripts/results/test_spanish_bench_pairs.json +0 -14
- wisent/examples/scripts/results/test_squad2_evaluation.json +0 -30
- wisent/examples/scripts/results/test_squad2_pairs.json +0 -8
- wisent/examples/scripts/results/test_squadv2_evaluation.json +0 -30
- wisent/examples/scripts/results/test_squadv2_pairs.json +0 -8
- wisent/examples/scripts/results/test_super-glue-lm-eval-v1-seq2seq_evaluation.json +0 -30
- wisent/examples/scripts/results/test_super-glue-lm-eval-v1-seq2seq_pairs.json +0 -8
- wisent/examples/scripts/results/test_super-glue-lm-eval-v1_evaluation.json +0 -51
- wisent/examples/scripts/results/test_super-glue-lm-eval-v1_pairs.json +0 -14
- wisent/examples/scripts/results/test_swag_evaluation.json +0 -30
- wisent/examples/scripts/results/test_swag_pairs.json +0 -8
- wisent/examples/scripts/results/test_tinyBenchmarks_evaluation.json +0 -51
- wisent/examples/scripts/results/test_tinyBenchmarks_pairs.json +0 -14
- wisent/examples/scripts/results/test_tmmluplus_evaluation.json +0 -51
- wisent/examples/scripts/results/test_tmmluplus_pairs.json +0 -14
- wisent/examples/scripts/results/test_translation_evaluation.json +0 -51
- wisent/examples/scripts/results/test_translation_pairs.json +0 -14
- wisent/examples/scripts/results/test_triviaqa_evaluation.json +0 -30
- wisent/examples/scripts/results/test_triviaqa_pairs.json +0 -8
- wisent/examples/scripts/results/test_truthfulqa-multi_evaluation.json +0 -51
- wisent/examples/scripts/results/test_truthfulqa-multi_pairs.json +0 -14
- wisent/examples/scripts/results/test_truthfulqa_evaluation.json +0 -30
- wisent/examples/scripts/results/test_truthfulqa_mc1_evaluation.json +0 -30
- wisent/examples/scripts/results/test_truthfulqa_mc1_pairs.json +0 -8
- wisent/examples/scripts/results/test_truthfulqa_mc2_evaluation.json +0 -30
- wisent/examples/scripts/results/test_truthfulqa_mc2_pairs.json +0 -8
- wisent/examples/scripts/results/test_truthfulqa_pairs.json +0 -8
- wisent/examples/scripts/results/test_turkishmmlu_evaluation.json +0 -51
- wisent/examples/scripts/results/test_turkishmmlu_pairs.json +0 -14
- wisent/examples/scripts/results/test_unfair_tos_evaluation.json +0 -30
- wisent/examples/scripts/results/test_unfair_tos_pairs.json +0 -8
- wisent/examples/scripts/results/test_unscramble_evaluation.json +0 -51
- wisent/examples/scripts/results/test_unscramble_pairs.json +0 -14
- wisent/examples/scripts/results/test_webqs_evaluation.json +0 -30
- wisent/examples/scripts/results/test_webqs_pairs.json +0 -8
- wisent/examples/scripts/results/test_wikitext103_evaluation.json +0 -30
- wisent/examples/scripts/results/test_wikitext103_pairs.json +0 -8
- wisent/examples/scripts/results/test_wikitext_evaluation.json +0 -30
- wisent/examples/scripts/results/test_wikitext_pairs.json +0 -8
- wisent/examples/scripts/results/test_winogender_evaluation.json +0 -51
- wisent/examples/scripts/results/test_winogender_pairs.json +0 -14
- wisent/examples/scripts/results/test_winogrande_evaluation.json +0 -30
- wisent/examples/scripts/results/test_winogrande_pairs.json +0 -8
- wisent/examples/scripts/results/test_wmdp_evaluation.json +0 -30
- wisent/examples/scripts/results/test_wmdp_pairs.json +0 -8
- wisent/examples/scripts/results/test_wmt-ro-en-t5-prompt_evaluation.json +0 -30
- wisent/examples/scripts/results/test_wmt-ro-en-t5-prompt_pairs.json +0 -8
- wisent/examples/scripts/results/test_wmt14_en_fr_evaluation.json +0 -30
- wisent/examples/scripts/results/test_wmt14_en_fr_pairs.json +0 -8
- wisent/examples/scripts/results/test_wmt16_en_de_evaluation.json +0 -30
- wisent/examples/scripts/results/test_wmt16_en_de_pairs.json +0 -8
- wisent/examples/scripts/results/test_wmt16_ro_en_evaluation.json +0 -30
- wisent/examples/scripts/results/test_wmt16_ro_en_pairs.json +0 -8
- wisent/examples/scripts/results/test_wsc273_evaluation.json +0 -30
- wisent/examples/scripts/results/test_wsc273_pairs.json +0 -8
- wisent/examples/scripts/results/test_xcopa_evaluation.json +0 -51
- wisent/examples/scripts/results/test_xcopa_pairs.json +0 -14
- wisent/examples/scripts/results/test_xnli_eu_evaluation.json +0 -30
- wisent/examples/scripts/results/test_xnli_eu_pairs.json +0 -8
- wisent/examples/scripts/results/test_xnli_evaluation.json +0 -51
- wisent/examples/scripts/results/test_xnli_pairs.json +0 -14
- wisent/examples/scripts/results/test_xquad_evaluation.json +0 -51
- wisent/examples/scripts/results/test_xquad_pairs.json +0 -14
- wisent/examples/scripts/results/test_xstorycloze_evaluation.json +0 -51
- wisent/examples/scripts/results/test_xstorycloze_pairs.json +0 -14
- wisent/examples/scripts/results/test_xsum_evaluation.json +0 -30
- wisent/examples/scripts/results/test_xsum_pairs.json +0 -8
- wisent/examples/scripts/results/test_xwinograd_evaluation.json +0 -51
- wisent/examples/scripts/results/test_xwinograd_pairs.json +0 -14
- wisent/examples/scripts/results/test_yahoo_answers_topics_evaluation.json +0 -30
- wisent/examples/scripts/results/test_yahoo_answers_topics_pairs.json +0 -8
- {wisent-0.7.379.dist-info → wisent-0.7.901.dist-info}/WHEEL +0 -0
- {wisent-0.7.379.dist-info → wisent-0.7.901.dist-info}/entry_points.txt +0 -0
- {wisent-0.7.379.dist-info → wisent-0.7.901.dist-info}/licenses/LICENSE +0 -0
- {wisent-0.7.379.dist-info → wisent-0.7.901.dist-info}/top_level.txt +0 -0
|
@@ -1,7 +1,7 @@
|
|
|
1
|
-
wisent/__init__.py,sha256=
|
|
1
|
+
wisent/__init__.py,sha256=_tapv1VtSsFzxXjtnrr2XXezxkMMdt4Me1YSKo_fSKc,1229
|
|
2
2
|
wisent/cli.py,sha256=XKzGIGstr38EowHYpr821c6YuV9Eaw3I1I3NvLztTO0,3960
|
|
3
3
|
wisent/core/__init__.py,sha256=x1MX4vKpKP3c2FuIHcFly-UkoZwGVnRPbzcFaxr_Jdo,1340
|
|
4
|
-
wisent/core/autonomous_agent.py,sha256=
|
|
4
|
+
wisent/core/autonomous_agent.py,sha256=rtJ5XlWqPys7c1PBFkUBHGg9Ox6_LDjeoiNPEph6NA4,48667
|
|
5
5
|
wisent/core/benchmark_extractors.py,sha256=BtGoL23n9EzSGoywymSh8uIhlr8T_LU8y-hp7et1vIk,13616
|
|
6
6
|
wisent/core/benchmark_registry.py,sha256=KQWMDEKNLBRvzd91HyH8SlhwIKXwpJtTWoSPcIuTn5Y,4627
|
|
7
7
|
wisent/core/bigcode_extractors.py,sha256=xKrJLdglcpykCv9TR72PVwu4cq3Fp5W6XuMYrdDHsVc,696
|
|
@@ -12,10 +12,12 @@ wisent/core/config_manager.py,sha256=RfB9PT3K1Ns5EsQiSGQ1DSxdlG-cVMdaaUuqQMdCNOY
|
|
|
12
12
|
wisent/core/detection_handling.py,sha256=L14US_y4UWaSabeAEzWn6tPM79qQFgwpO-BXvBBO7fA,11183
|
|
13
13
|
wisent/core/diversity_processors.py,sha256=wm4rFK8qrvYLcDpaJVHe-r6QtDYDRGty-Eyd0nXzcdM,6883
|
|
14
14
|
wisent/core/download_full_benchmarks.py,sha256=6JVmof4xKC--Lkj8r6v70KGRxPVTqu7YC3nVsb5m42g,60722
|
|
15
|
-
wisent/core/
|
|
15
|
+
wisent/core/geometry_runner.py,sha256=KvDfSSob-scJSBB_Wya81rlWpiQohxLPjQxoyQw24rA,35719
|
|
16
|
+
wisent/core/geometry_search_space.py,sha256=JSF-zrwFkJxn33Gie_irTxhZW8M6h7eUpRu0Y_9Ci6k,8401
|
|
17
|
+
wisent/core/hyperparameter_optimizer.py,sha256=_L767LaidpRJN23nV9raWQ0wapclIEPJDX3h72mBQo0,22741
|
|
16
18
|
wisent/core/layer.py,sha256=on_jCGb0CUhn8dpbY9ZbH3yXk1QoNqR6uUPsI6eX1hU,391
|
|
17
|
-
wisent/core/lm_eval_harness_ground_truth.py,sha256=
|
|
18
|
-
wisent/core/main.py,sha256=
|
|
19
|
+
wisent/core/lm_eval_harness_ground_truth.py,sha256=46WGnsJLoQ3ALXnXJ0PkTo-N1U2wGDGKyU1kwg-1Ap0,66514
|
|
20
|
+
wisent/core/main.py,sha256=oL5ODpKkbM2HR9HLlBUbf2z9JSUkMzeI_8zHeMuJcrE,4503
|
|
19
21
|
wisent/core/managed_cached_benchmarks.py,sha256=_q26-13t_GLFvkMA3M8tge0Sv6fFJmH_AJqCVl-Dt3w,23499
|
|
20
22
|
wisent/core/mixed_benchmark_sampler.py,sha256=J1R7Q7LOXE28P2Bydx_NrgblJv35rqdkCPkvZiAxp_c,13715
|
|
21
23
|
wisent/core/model_persistence.py,sha256=Pr1A3E0MxqwICKsFXmjKVq9KgG8Ip5UbtG-gujGFShc,9870
|
|
@@ -23,9 +25,9 @@ wisent/core/multi_steering.py,sha256=7RKYLBBFxEsrSc83KPakAU3WzvVx5XO88tShM2cLKZE
|
|
|
23
25
|
wisent/core/parser.py,sha256=v99xCTbiyy2f4JzaVjz7bUtvn-uZEAj4S-u2OPikE24,68987
|
|
24
26
|
wisent/core/representation.py,sha256=hBl_N9qbr5Gsa7GCQ0nMWRm82RqYEfhd9cyf0PPH5LY,195
|
|
25
27
|
wisent/core/save_results.py,sha256=NJ7elQzbh3Q_ZefdTV8L-9QyutteWSBWfgTw78OBm1k,13725
|
|
26
|
-
wisent/core/steering.py,sha256=
|
|
28
|
+
wisent/core/steering.py,sha256=LFSEla3sCdGBDprjZ5si-ouFcYdxnflW8pfAgyPEJkY,22993
|
|
27
29
|
wisent/core/steering_method.py,sha256=Y09jIImhZnRuHkbpeAfJT1hDovXi0bacqt3X3TVSo68,411
|
|
28
|
-
wisent/core/steering_optimizer.py,sha256=
|
|
30
|
+
wisent/core/steering_optimizer.py,sha256=SVMI6xHtMb6xAZYkXggziqjEZ9SSkWCL0PiBj4WMlsc,65353
|
|
29
31
|
wisent/core/task_interface.py,sha256=4xm6nrduFdXSZpJccahfZWtpI4rZvCQcsS7GCJWpbMU,4906
|
|
30
32
|
wisent/core/task_selector.py,sha256=JLMQ8E1HAvs4H4UqJRIvvWaktJsSAo3uz8oY135qO9g,7774
|
|
31
33
|
wisent/core/time_estimator.py,sha256=Frwwbg8DRaeFlxBNewhLPhveysfOZQDR7oMhcJO6kt0,5963
|
|
@@ -33,12 +35,14 @@ wisent/core/timing_calibration.py,sha256=zIu1lgIEX_lBAmVfHakOHSEOvUAtFI5y4i3sk5e
|
|
|
33
35
|
wisent/core/universal_subspace.py,sha256=D35PgZE42IwzjdyrTjmPcYou9YKJkbVZPfwCHh2jF1g,30728
|
|
34
36
|
wisent/core/user_model_config.py,sha256=FGzHYo1kD7qDPhpffvDkigV-z7aiLxHAtqiMEPf_sIM,6729
|
|
35
37
|
wisent/core/wisent.py,sha256=yglyOL-10ptlTVTshgjuXle3PXo-fdWJiZPx8oLyabM,21076
|
|
36
|
-
wisent/core/activations/__init__.py,sha256=
|
|
37
|
-
wisent/core/activations/
|
|
38
|
-
wisent/core/activations/
|
|
39
|
-
wisent/core/activations/
|
|
38
|
+
wisent/core/activations/__init__.py,sha256=KjKMOPbPMmi1iMQMH6ALkcwa8pZLK8dpbz0cHGVjl_M,1352
|
|
39
|
+
wisent/core/activations/activation_cache.py,sha256=Tc-qH26Ht_E9wtQYJHnEMtea3dvB8x9XWaZOAQ2oPtA,13784
|
|
40
|
+
wisent/core/activations/activations.py,sha256=ljDkyCPiFyIt-SA43m-vJh3U2pcYIMenYxm46Vy4B1I,3200
|
|
41
|
+
wisent/core/activations/activations_collector.py,sha256=3aY6VxWVErnWOLdTLY6bapjR9e5kzHOoSV2OaOsDlYE,10536
|
|
42
|
+
wisent/core/activations/classifier_inference_strategy.py,sha256=Nw7xz08vgxJoMAUbCOT-vY118815STjh8iOZGbiBBU8,7054
|
|
43
|
+
wisent/core/activations/extraction_strategy.py,sha256=AkbVZ5TyF3bST4ZOw33HVNVlrbGAb8XrhAxoeDtRPNY,19820
|
|
40
44
|
wisent/core/activations/core/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
41
|
-
wisent/core/activations/core/atoms.py,sha256=
|
|
45
|
+
wisent/core/activations/core/atoms.py,sha256=wfPhgSt7NP_4xkyYZA6T62KTM2DUkq1Jj-FJeRd9Kko,5383
|
|
42
46
|
wisent/core/adapters/__init__.py,sha256=UZkssKYL4-Jl_F29x29MQr6L4899lpK-eFvFa_qGa8Y,712
|
|
43
47
|
wisent/core/adapters/audio.py,sha256=hqEXJ5NSfGstnQLmYkaBw_4TZ9Ft2qJaBMOKtObkb4Q,21712
|
|
44
48
|
wisent/core/adapters/base.py,sha256=ir75AwPA39sjpzGIs3aPFL2poZ34CVqVmygO-KZHbpA,12824
|
|
@@ -49,14 +53,14 @@ wisent/core/adapters/video.py,sha256=M1p2rHFTNkN2LjteYXp3NL3L6v1E238XMR8Agv7O5wI
|
|
|
49
53
|
wisent/core/agent/__init__.py,sha256=cAzpae7HWdNrpxCqANWUA2TKkqpm_hoSj8JAdbfmLwM,81
|
|
50
54
|
wisent/core/agent/budget.py,sha256=zBhMTvdVGLqM6vIhHzm5BO2dAp_ANuJvFPmZ8_9YQdM,24301
|
|
51
55
|
wisent/core/agent/device_benchmarks.py,sha256=2G_SuiM87gAS0TPZaMzS03yTOTHlbwJzpWNxYH60IJY,26206
|
|
52
|
-
wisent/core/agent/diagnose.py,sha256=
|
|
56
|
+
wisent/core/agent/diagnose.py,sha256=HpPnPDt0UE9yXLJeuWZdL5W38FoXRKHI0S2st05l4C4,9298
|
|
53
57
|
wisent/core/agent/steer.py,sha256=4v3kkWTo4qerEJSa-D2CBUQE0ESQRN90Rd3ovL48uQo,9928
|
|
54
58
|
wisent/core/agent/timeout.py,sha256=WvYC9n9huf0b5daXX1vt2G4b3OEsU7irPd15nj_Twbc,4328
|
|
55
59
|
wisent/core/agent/diagnose/__init__.py,sha256=cAzpae7HWdNrpxCqANWUA2TKkqpm_hoSj8JAdbfmLwM,81
|
|
56
60
|
wisent/core/agent/diagnose/agent_classifier_decision.py,sha256=WrrIW-ig4V_OoVQUHhieENOhEMjy0t72Z-ElgxWQS5s,28978
|
|
57
61
|
wisent/core/agent/diagnose/classifier_marketplace.py,sha256=m02pwQkC4ROui6BhNhGJArdgBREI2xYuaRinm09VxM0,22113
|
|
58
62
|
wisent/core/agent/diagnose/create_classifier.py,sha256=IeyqObop2Z6jdEgFz-RIW37bqcOl2mUC2l_cFNdn8ww,44269
|
|
59
|
-
wisent/core/agent/diagnose/response_diagnostics.py,sha256=
|
|
63
|
+
wisent/core/agent/diagnose/response_diagnostics.py,sha256=pEqxZVXtRJoadrJeFanWRzne_hIfeRHk4cEuPo_j0t0,10629
|
|
60
64
|
wisent/core/agent/diagnose/select_classifiers.py,sha256=XmmG3eAYkMNoPGE55-0gQTIGtDeqc_5sg93Mx03r__k,18353
|
|
61
65
|
wisent/core/agent/diagnose/synthetic_classifier_option.py,sha256=ZWsyZM7iUoFPlDtyWDjxi1qOeoVo9bUqFtl6eZ5pqzM,32703
|
|
62
66
|
wisent/core/agent/diagnose/tasks/__init__.py,sha256=IGnEhyeCWNagVjRpIDoX4Msb1rxfeWLrsPa3EvhiYeI,698
|
|
@@ -69,48 +73,52 @@ wisent/core/classifiers/__init__.py,sha256=AZyqSkAxKUtmNFBHfFfK8DzU2UwelX6Xhl4VN
|
|
|
69
73
|
wisent/core/classifiers/classifiers/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
70
74
|
wisent/core/classifiers/classifiers/rotator.py,sha256=nc3N-PuZwaBzbtk4n7cetZux1GB0BWPHTV7cACXP23I,5148
|
|
71
75
|
wisent/core/classifiers/classifiers/core/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
72
|
-
wisent/core/classifiers/classifiers/core/atoms.py,sha256=
|
|
76
|
+
wisent/core/classifiers/classifiers/core/atoms.py,sha256=UrNwIIeJgd7JpibliEas9dinTtIrCuAC1lc1_f_qdiE,26194
|
|
73
77
|
wisent/core/classifiers/classifiers/models/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
74
78
|
wisent/core/classifiers/classifiers/models/logistic.py,sha256=6FNnybW4zZ0HSeFjyEiOQrtNFN4LV-M39mmiiW4buDk,876
|
|
75
79
|
wisent/core/classifiers/classifiers/models/mlp.py,sha256=f_8Lgh5UZPLLCIKF1b6qeg5MwyFj9tuLrNMUcs-QDOo,1536
|
|
76
80
|
wisent/core/classifiers/core/__init__.py,sha256=DJVQfGN-oXkaUur5HwH9xPP9-VCBVxjkIt4U_SqriA4,28
|
|
77
81
|
wisent/core/classifiers/models/__init__.py,sha256=DJVQfGN-oXkaUur5HwH9xPP9-VCBVxjkIt4U_SqriA4,28
|
|
78
82
|
wisent/core/classifiers/pipeline_steps/__init__.py,sha256=DJVQfGN-oXkaUur5HwH9xPP9-VCBVxjkIt4U_SqriA4,28
|
|
79
|
-
wisent/core/cli/__init__.py,sha256=
|
|
80
|
-
wisent/core/cli/check_linearity.py,sha256=
|
|
81
|
-
wisent/core/cli/
|
|
83
|
+
wisent/core/cli/__init__.py,sha256=YBvZ1ko75IFtmmvETRC8wa77wij8HvBO_FSHMYandBU,2009
|
|
84
|
+
wisent/core/cli/check_linearity.py,sha256=weRPt1arFa1a8sSUY8JjyApjLssokMX_kJeiLHDqv1I,5916
|
|
85
|
+
wisent/core/cli/cluster_benchmarks.py,sha256=hPkR0pujWJixb7C4QuqNTZ6H2ElExdTb_FnsDkbE0L8,20056
|
|
86
|
+
wisent/core/cli/create_steering_vector.py,sha256=4iCXFKF-HkxwyUnooOLzH37L2FP6cWOEX8_saD8e914,16695
|
|
82
87
|
wisent/core/cli/diagnose_pairs.py,sha256=dopxJUgxien33yx6zAhwRVfb_4uvIem7Zpj2lawC1dQ,6775
|
|
83
|
-
wisent/core/cli/diagnose_vectors.py,sha256=
|
|
84
|
-
wisent/core/cli/estimate_unified_goodness_time.py,sha256=
|
|
88
|
+
wisent/core/cli/diagnose_vectors.py,sha256=cwn9P0Ui-OWBKD5Wl-RmxqR3Ruel_EPUYPg0qiJB-T4,17177
|
|
89
|
+
wisent/core/cli/estimate_unified_goodness_time.py,sha256=dsJLh7a_4iaYoJlsQ_t46CTl_8RzMun2LPJD02jiMts,16789
|
|
85
90
|
wisent/core/cli/evaluate_refusal.py,sha256=V9MjNEs4XqChnr1o9CrkgFwVVbcrhmNtl-p-0nkZ_jY,8758
|
|
86
91
|
wisent/core/cli/evaluate_responses.py,sha256=jDsb6qnnqJWivL80DERtvWN5nD7je68FNxVp3TNBBIA,38415
|
|
87
92
|
wisent/core/cli/generate_humanization_pairs.py,sha256=hspH8kd9u9BnI0Zdh7s2nMvCi45sMIvd9bLSIa9eLio,4200
|
|
88
93
|
wisent/core/cli/generate_pairs.py,sha256=KT88DaRMv5UcQwkLY9hf8uF3vuq9i3pWSnAL6Nejrzc,7545
|
|
89
|
-
wisent/core/cli/generate_pairs_from_task.py,sha256=
|
|
94
|
+
wisent/core/cli/generate_pairs_from_task.py,sha256=OfxO-JpiYncUvRZL6AEbGzHNJm7QhGGZ3d9YxShXq2Q,2130
|
|
90
95
|
wisent/core/cli/generate_responses.py,sha256=nPEwQ8_EVjRbr0lhsCl8sacQzvt5XgDUOONSwRyI--U,5238
|
|
91
96
|
wisent/core/cli/generate_vector_from_synthetic.py,sha256=Fc9vcd7-1VTqHy8-gjTuPiCC7FIP1rxTajZf8TFSIi8,8868
|
|
92
|
-
wisent/core/cli/generate_vector_from_task.py,sha256=
|
|
93
|
-
wisent/core/cli/
|
|
97
|
+
wisent/core/cli/generate_vector_from_task.py,sha256=O619eALpDrTWMq4Milih_IC3eDViXz46EP6D1A6uduE,10121
|
|
98
|
+
wisent/core/cli/geometry_search.py,sha256=DOXjzEspdcnLNhjZKf_Mapi33mMVi2LMXpQNLQkE5zI,5503
|
|
99
|
+
wisent/core/cli/get_activations.py,sha256=dAvlhRIWg9p5Z_9_G7UQmgUB3HjsmBbEADSGwPYGEDA,6592
|
|
94
100
|
wisent/core/cli/inference_config.py,sha256=iIZa0_ciBbM0Fqat0DJNd-mlWd0ANuYoeZ1v1V4jduc,3148
|
|
95
101
|
wisent/core/cli/inference_config_cli.py,sha256=CKvD3TpFYDSNtm9HdRFv0uMGInaR6iSHP8aLWYPhrfs,1786
|
|
96
|
-
wisent/core/cli/
|
|
102
|
+
wisent/core/cli/method_optimizer.py,sha256=oDfS80biqK8DsuB387KgzehoILebZ2m1_7_aL8eqgpQ,32903
|
|
103
|
+
wisent/core/cli/modify_weights.py,sha256=YHWvuDbrDghIzHCrfCdX5ndpg54ESFgLm6uY7iekhFM,28660
|
|
97
104
|
wisent/core/cli/multi_steer.py,sha256=GRs0557YabcEwch7P75uWJadHf4Ssa8YE5nTMt8WTvs,4564
|
|
98
105
|
wisent/core/cli/optimization_cache.py,sha256=nvnmFSy9km3tcquL36bhumCvc6wxl-_Ch3Ju9-MzNOE,9943
|
|
99
|
-
wisent/core/cli/optimize.py,sha256=
|
|
100
|
-
wisent/core/cli/optimize_classification.py,sha256=
|
|
101
|
-
wisent/core/cli/optimize_sample_size.py,sha256=
|
|
102
|
-
wisent/core/cli/optimize_steering.py,sha256
|
|
103
|
-
wisent/core/cli/optimize_weights.py,sha256=
|
|
104
|
-
wisent/core/cli/
|
|
105
|
-
wisent/core/cli/
|
|
106
|
-
wisent/core/cli/
|
|
107
|
-
wisent/core/cli/
|
|
106
|
+
wisent/core/cli/optimize.py,sha256=4ZpLawTrvU57SUEEhxYiR-Xy5c3mZrE9gSRIxgSRWSg,28090
|
|
107
|
+
wisent/core/cli/optimize_classification.py,sha256=deg3psSPvERDptRIfv4x88adKL0RM3gCBJGfb0QdWnI,23099
|
|
108
|
+
wisent/core/cli/optimize_sample_size.py,sha256=kn8d8fqu4K1cq8CEW_ufz1iu4-nJh_Y3dl15fCmWCq4,16184
|
|
109
|
+
wisent/core/cli/optimize_steering.py,sha256=-8K_RrojHhInLHUtCgvOVqsozUMuEWZcFuBDDhLoVrw,172781
|
|
110
|
+
wisent/core/cli/optimize_weights.py,sha256=uuiepRuq3xM88rnIxtmlmD7a3ylHS8I6WMsa4psCMoc,54364
|
|
111
|
+
wisent/core/cli/preview_pairs.py,sha256=MJjdYJhXCAxA3BvcRQxQfaVZzoKuj4sQl112maHP5Qk,8056
|
|
112
|
+
wisent/core/cli/steering_method_trainer.py,sha256=AENxXgpP6YlFbelpdq3LsWq8WQKfXY1Ub0L6dic__iw,22827
|
|
113
|
+
wisent/core/cli/steering_search_space.py,sha256=4iGf7vTHPEE4JW1mQdq_P1vLYWyGlUekoyjMMJgx0Hw,23113
|
|
114
|
+
wisent/core/cli/tasks.py,sha256=ckQ3NW8DDrHSpmxm3HZ27e6j9ex_lqKKIMTXQ97Np8k,39717
|
|
115
|
+
wisent/core/cli/train_unified_goodness.py,sha256=fOcw-9yD2tcCwUTdxqxFsfuSsCuEPZ8x7nth1gN9lnE,29079
|
|
108
116
|
wisent/core/cli/agent/__init__.py,sha256=tWH634YZVFfHmaEEQPgOn1LILIXwdpyJg5nj9tsdFz8,591
|
|
109
|
-
wisent/core/cli/agent/apply_steering.py,sha256=
|
|
110
|
-
wisent/core/cli/agent/evaluate_response.py,sha256=
|
|
117
|
+
wisent/core/cli/agent/apply_steering.py,sha256=hLjsA7B9Y7t1AHvrs1QhDZm3v_Tqo4NYMCCtW2Yo66c,6635
|
|
118
|
+
wisent/core/cli/agent/evaluate_response.py,sha256=Xk-nKSeGxTqMX7IF6tjYdTUkc_EITVIUg8XEYqZBSnk,4522
|
|
111
119
|
wisent/core/cli/agent/generate_synthetic_pairs.py,sha256=QnMuJvunEB3Icmx9TrFeMklh1fjpTMLeu8mkV_dx46w,4723
|
|
112
120
|
wisent/core/cli/agent/main.py,sha256=aZ7SIuzTmYkFTaygjTf76Fgho9CiRMIOooes5Vd7ueI,5457
|
|
113
|
-
wisent/core/cli/agent/train_classifier.py,sha256=
|
|
121
|
+
wisent/core/cli/agent/train_classifier.py,sha256=qhJlHy0AKdmWJsVg_ZZwLjNL-G8rd6_oSfWtNyx85R0,6961
|
|
114
122
|
wisent/core/contrastive_pairs/__init__.py,sha256=AbaAf-t_nyVVy_vLjp8WAlMDmNun3KNp_GMWAK25r9g,429
|
|
115
123
|
wisent/core/contrastive_pairs/core/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
116
124
|
wisent/core/contrastive_pairs/core/atoms.py,sha256=_zghw6c8iisW_SqBIUCoAnzhc5q7t5EgZ4zzTPxeLwQ,1129
|
|
@@ -122,26 +130,26 @@ wisent/core/contrastive_pairs/core/set.py,sha256=sVJ2zvlVaFpMPgr4dYe-FMhT6sPS0KO
|
|
|
122
130
|
wisent/core/contrastive_pairs/diagnostics/__init__.py,sha256=X17XJthKEO4gUxUqBR01ysPwf7jx4LZoPKu3QZPK8Xk,2366
|
|
123
131
|
wisent/core/contrastive_pairs/diagnostics/activations.py,sha256=TUNxU-HV3oeQxFbZhKo-OISM4mzR-Bib0naHmbqWzk8,1736
|
|
124
132
|
wisent/core/contrastive_pairs/diagnostics/base.py,sha256=uBi8PdTd6BRyy0lmGjAZLTZdgiiWwPNtsmKkBFCmlD0,2658
|
|
125
|
-
wisent/core/contrastive_pairs/diagnostics/control_vectors.py,sha256=
|
|
133
|
+
wisent/core/contrastive_pairs/diagnostics/control_vectors.py,sha256=BAUOtbq1mAIEdXPWtiPUtfq_NggekteByvfAy5F7ilY,120153
|
|
126
134
|
wisent/core/contrastive_pairs/diagnostics/coverage.py,sha256=MpT6_IdLqtMpav6mOCiNuemBVFvxWzkUbj7j3ZNx-48,2761
|
|
127
135
|
wisent/core/contrastive_pairs/diagnostics/divergence.py,sha256=Io3AcGluJogz4qENWu0ivQyFR_5bLN49BzCTI7DIVa4,3430
|
|
128
136
|
wisent/core/contrastive_pairs/diagnostics/duplicates.py,sha256=s5JPUdWcndX_kWAwP5UmXxEYNkW9DAYqtKwntIRoAiI,4755
|
|
129
|
-
wisent/core/contrastive_pairs/diagnostics/linearity.py,sha256=
|
|
130
|
-
wisent/core/contrastive_pairs/diagnostics/vector_quality.py,sha256=
|
|
137
|
+
wisent/core/contrastive_pairs/diagnostics/linearity.py,sha256=j4-YvzQbysV2dC_mX7mBhwHqj9pmJ6IWUf1cul3pPmY,11169
|
|
138
|
+
wisent/core/contrastive_pairs/diagnostics/vector_quality.py,sha256=EmgH05y5j9EbdiNxCc3FuhIvCM1DoUsGCgQVMkYSjYk,22311
|
|
131
139
|
wisent/core/contrastive_pairs/huggingface_pairs/__init__.py,sha256=PYur_GOluHmwaYUS6rxsoas5-AmrG7OhVGoPteuJB-c,76
|
|
132
140
|
wisent/core/contrastive_pairs/huggingface_pairs/atoms.py,sha256=iIGJRHpDKLskBE_nNOVk9R5329OooktQ9r92_DZNq9A,8826
|
|
133
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_extractor_manifest.py,sha256=
|
|
141
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_extractor_manifest.py,sha256=GwgoH0zXKQ9J29aT_taZzPrLYTJBpTc82fqjHKEOsbc,26345
|
|
134
142
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_extractor_registry.py,sha256=OVD-qzWEzWX0vDz9j8oBiz2gK8rxnpOBZEC4_DOIfak,4680
|
|
135
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/__init__.py,sha256=
|
|
143
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/__init__.py,sha256=HtFG8o1n69SkHgbkjqPXXqsPMPlRUzFu6UWqQ76c268,2522
|
|
136
144
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/agentbench.py,sha256=tdJznfmBU0PxtHwzgXVIJy5qRCGPQ898i_-Mu2FFoF8,7936
|
|
137
145
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/agentharm.py,sha256=hWEPf8mKIgZDZuisG0YMtAr04c33lfXjkRT8-wr2zfo,10504
|
|
138
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/agentic_search.py,sha256=
|
|
139
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/aider_polyglot.py,sha256=
|
|
146
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/agentic_search.py,sha256=OSKPksEL5gs_SLykD7_PIrBV6iLCPEkyCkWxlJsxdPw,4249
|
|
147
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/aider_polyglot.py,sha256=U7_a3slnr6xyPTmHIC-DS9kv6sJaEigCwEpp8o0wRZY,7229
|
|
140
148
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/aime.py,sha256=v0xmp650bG5NYHynaookiXrxstdZOU6zwYOhTtguPMI,3584
|
|
141
149
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/aime2024.py,sha256=iWtVKnwr1dS4k-zDU9nS4qsN3hnoFNjKb4JOIHsRuqM,2234
|
|
142
150
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/aime2025.py,sha256=l2NC4sA7yCpsEx-NtyQmj7x19KfXHcprsYhxVA8a6OQ,2132
|
|
143
151
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/alpaca_eval.py,sha256=NQWzHEcZr_kKDNcb4mXbpy2Rf45wOWEIxYR9o6YEs9s,5560
|
|
144
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/apps.py,sha256=
|
|
152
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/apps.py,sha256=SEMU4cKx5BQUMrKTn7MISece_c2NJDv-PehSW0cmI6k,10281
|
|
145
153
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/arena_hard.py,sha256=T9qLzUpFLHZz1OBwGJ4_-7c6_3ZWswDebbvYle3sINw,6824
|
|
146
154
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/atis.py,sha256=UJfzAett3soThQGvnkFctninkNPMK5YFj16SVm0dsdw,3102
|
|
147
155
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/babilong.py,sha256=sqXHWyyRE1LMZB5IZtSdldxP7PP6OR890bZ68Vn4wt8,3050
|
|
@@ -150,21 +158,13 @@ wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/basqueglue.py
|
|
|
150
158
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/bec2016eu.py,sha256=jRg17Bd08mKGsbtC7xt6-5EfLEr93AUfk4578wHebS0,3806
|
|
151
159
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/bfcl.py,sha256=LZmvmoJFGU9LUc5xxHbugjWiD__rADJkNrmIHJTC-nE,10536
|
|
152
160
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/bhtc_v2.py,sha256=aVRRHAkLIHxpbSqYFXPwIYKdQLTo6X05_Rg3Dof4q_k,3080
|
|
153
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/browsecomp.py,sha256=g0Up4jGNzVf0g8SQtBdnCoZvNLTjLe52OV4hwOa7uto,9919
|
|
154
161
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/chain_of_thought.py,sha256=QsaJFZiFauHzlenUon7P0FnB9cDdMEVGDpJK2nm_w3g,3160
|
|
155
162
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/chinese_simpleqa.py,sha256=2q7r_PplOvbYUcNzHsk3JywEb5j6QjD9mR-Fyf7xw10,7107
|
|
156
163
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/cluewsc.py,sha256=yhi43rtNT_zjfZ2yg2BuxHI0kSDSETKc-tPk9eeFqgc,6300
|
|
157
164
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/cnn_dailymail.py,sha256=NSWDMh2ScUsvC_WVAgIWfGkkY64F_lPbbj9U4FokD7s,3200
|
|
158
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/codeforces.py,sha256=
|
|
159
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/codexglue.py,sha256
|
|
160
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/
|
|
161
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/codexglue_code_to_text_go.py,sha256=rAWrOb9-edJReFKFEp0orVdZzsBkUc1Jk0l652sMLPw,2142
|
|
162
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/codexglue_code_to_text_java.py,sha256=2r1mQ-GVQpHrNJkTtr5jd1-s-c2DyrEifzNCPkIDSDA,2161
|
|
163
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/codexglue_code_to_text_javascript.py,sha256=1qF8qRlIiQzinSPsV6DV6yHVb4mah1z4j_09_5CpxtM,2215
|
|
164
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/codexglue_code_to_text_php.py,sha256=0ezAul2CAfxgOjS2zlc2lnsnO2ryB1YnBEyvLofJero,2152
|
|
165
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/codexglue_code_to_text_python.py,sha256=vJ8V9WJofxXAdwict1IEjxYvVj0PsS7oK3khwpb9OXM,2179
|
|
166
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/codexglue_code_to_text_ruby.py,sha256=nhprmMfG-82hi6DYlnvJrSYprgez4uBIUCS1Ta6WNhs,2161
|
|
167
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/coding_benchmarks.py,sha256=QXJBlUj_rJIwXqn1uNouyT76hBgwOHMYJabaLIfE9ng,25867
|
|
165
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/codeforces.py,sha256=stimcsMEhPgJJfhi9PSXftaAhY5jiSEQGKpFP2yZPv8,11300
|
|
166
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/codexglue.py,sha256=voaKHYSQV91mkY9pqHehNFqO-nnAKxuq5T0r4JRVsm4,3352
|
|
167
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/coding_benchmarks.py,sha256=VjvwwWGsBfCIMPm1uRQGwEjRaeCjp80wrUUP8-cwo-U,15417
|
|
168
168
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/coedit_gec.py,sha256=a-0kJQFcAmoLNFE-dV-G07th9qXPQE0IuAXPcZaVEm8,2605
|
|
169
169
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/conala.py,sha256=auULgkRhG77vy2rAHJlpRhAsdTLrIZuq_XKK9PZF9tU,4075
|
|
170
170
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/concode.py,sha256=qhrgzJsJUnCG_hg4ouw_rMK5VFsecTwa4q7h_kXqMK8,3400
|
|
@@ -178,26 +178,23 @@ wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/ethos_binary.
|
|
|
178
178
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/evalita_mp.py,sha256=Ioy59ZiNVnkwHV7IR0A6wJI3vFASr8o6xcXdrHjOT3I,7719
|
|
179
179
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/evalita_sp_sum_task_fp_small_p1.py,sha256=N-LunVyfI4jClY5svXq088V7N0QZR3aJqEPCBwmPjOg,3078
|
|
180
180
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/facts_grounding.py,sha256=Oyf65Wn2DzE4tSwvMkR6A4XAQLmmKqBNLvLuTgRApv0,6506
|
|
181
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/faithbench.py,sha256=
|
|
181
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/faithbench.py,sha256=MxqTqaFio6oXWr3YwA2EYitii3KF8zdtbK-s9uYrgIQ,10220
|
|
182
182
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/financial_tweets.py,sha256=vUE79yRr5oE1vjFZ_wL4s6XFw7UuakWwrGf5UF24iAw,3635
|
|
183
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/flames.py,sha256=
|
|
183
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/flames.py,sha256=UiKaVxgjpv_QhdMf1FTnPIr_Ebe59YHL_goN5hnSSrc,9034
|
|
184
184
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/flan_held_in.py,sha256=Xzx2V6j8ihoYwC4SYG226SXXEH5j9G2vJFOMT0Y7pR8,3650
|
|
185
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/flores.py,sha256=
|
|
186
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/frames.py,sha256=
|
|
187
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/freebase.py,sha256=UqwnPzljWCSHOyaz7l4C2Zd6lJlVTXxvwy9gxVNeG5k,3801
|
|
185
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/flores.py,sha256=03d8WzoOknwOj4pssiNDCrUdWXKayp-2Wj1McfzkUbA,23418
|
|
186
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/frames.py,sha256=9JZ2LCbIm6yASe-w_sWo3XpgWpnjn7GXgQzY99F9NPc,5601
|
|
188
187
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/get_negative_example_livecodebench.py,sha256=lrhwIQtQupD-xM9ypOamMcPuohkYHIb5uoDvmvgF8JA,5129
|
|
189
188
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/get_positive_example_livecodebench.py,sha256=k_PSaWtokvvBfysz3goFh-ZneXGSAKDaLQ22kkMl5oQ,4622
|
|
190
189
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/gpt3_translation_benchmarks.py,sha256=aOsJ-l67Noc1qnq_orp7-iw8wSNLX-VCa9C_gXX7MAc,3773
|
|
191
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/hallucinations_leaderboard.py,sha256=
|
|
190
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/hallucinations_leaderboard.py,sha256=IaXs9oFXkx7o8PRnjrMvYHLmh-npyIDAfoLZ8eKWGSk,12412
|
|
192
191
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/halueval.py,sha256=N-nwmLP_Zsni0IvjgB2efPSGwJ0m95oW20eyx9Um0-I,8833
|
|
193
192
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/harmbench.py,sha256=HyHZYRFUSZFgJ7atINICsCCK3t01SofCaqbzUjdqrE0,9575
|
|
194
193
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/healthbench.py,sha256=_APNLxYsMgu3rJigXJwWdB83qL-X3pBMRJF0fzAPWNo,6831
|
|
195
194
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/hle.py,sha256=awu6NcomLtATCwps67BQZJ0bZNDTx9EtYgoi9dshVlU,3176
|
|
196
195
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/hmmt.py,sha256=oJ4UQvVHmdo1klTJlqJY3ckfbtD6wk3JYV-P8QAjfNY,3584
|
|
197
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/humaneval.py,sha256=
|
|
196
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/humaneval.py,sha256=OWJnf6AsY4vcvZixlWZi2ui2pb_kqiPBzAIWxrHH0Dg,4797
|
|
198
197
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/humanevalpack.py,sha256=cVQOaOM7O_BpEYXnu8jqtpKpGBIG8BRe6MxyZ25qMHQ,3340
|
|
199
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/instruct_humaneval.py,sha256=Xgfr3rHmZ6K4E-0rY1u9af_nT5BTFzwHis7YKz7MUq4,6747
|
|
200
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/instructhumaneval.py,sha256=Xhr7sI4tqCmNyhzv3WrAM3fp17QJEe2oB2Nw6x9Od9Q,4712
|
|
201
198
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/iwslt2017_ar_en.py,sha256=OakHs-5Qli9tt9gXXsQ913u1aJqbNm4bP7hQ3kbAol0,3826
|
|
202
199
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/iwslt2017_en_ar.py,sha256=GszqSy52EgJ1L885KnhvA5zs_TEBbb6_NJP__aTXWgI,3826
|
|
203
200
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/jailbreakbench.py,sha256=DI9kig2nHMgLZ-Ow4EpwYTQlpNinTW1ul15ms_r4SJA,9642
|
|
@@ -206,17 +203,16 @@ wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/ledgar.py,sha
|
|
|
206
203
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/livecodebench.py,sha256=gQjkxgF7qByJLOHN2JQwOgwY4IkJUWw7kESNyQlkT1g,1964
|
|
207
204
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/livecodebench_contrastive_pair_generator.py,sha256=btT2P6utHmbejctjRelREYO_JCqV_Rhm4BWFJix11EQ,16808
|
|
208
205
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/livecodebench_v6.py,sha256=4S6wv2yt6-s1mJeme-iEmTgXFHfOjBmpL4e6Y3QiseA,9486
|
|
209
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/livemathbench.py,sha256=
|
|
206
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/livemathbench.py,sha256=G9G9ry5QVStYsZTFPxukH1xLanRXm5n68pMJVxRAFEk,9106
|
|
210
207
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/llama.py,sha256=0GP8duCOy1u-G--s4VgIWNIihH06-0xSiE9GCqK82UA,3722
|
|
211
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/longform_writing.py,sha256=
|
|
208
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/longform_writing.py,sha256=NskHJKjm9NBTisNQXiYh6doLVDFl4G92JJY_QEjLXhQ,5982
|
|
212
209
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/m_mmlu.py,sha256=RDZmJAZfJdpxXwrbhDPFBOClNDV2gMf9TaBWNhVF3Gw,3724
|
|
213
210
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/math.py,sha256=1HUMRBIN9b26aWOcyM70tEBbLfzIiZ9uw3OmKZFBpEA,5980
|
|
214
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/math500.py,sha256=
|
|
215
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/mbpp.py,sha256=iMiddPfOsMPhwH_y0RwRCAC0OVE4syCSmx9Q8jvHwPQ,4792
|
|
211
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/math500.py,sha256=h3oA5S9Kuq6FLTVYpGrhDemjh8zyGcZLnx2NMDC_9OM,6039
|
|
216
212
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/meddialog.py,sha256=n-Mh0iWhd-v6avJVAIKe3juHn_D5CrqsXCgERQNK8uA,2616
|
|
217
213
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/medical_abstracts.py,sha256=TP1jcbcVRaDuwwSI_CusIwlchI2QWfMhsCa3rHLH_RY,3576
|
|
218
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/medium_priority_benchmarks.py,sha256
|
|
219
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/mercury.py,sha256=
|
|
214
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/medium_priority_benchmarks.py,sha256=VMjoaUC6WSFo86BGJa8uYStfAC839uoE0M-3lAmKa_I,27316
|
|
215
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/mercury.py,sha256=zO81ogmkR-_6r_wZ9asLg3NUY3emeuzEfTF0YVT5iYY,4327
|
|
220
216
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/mmlu_redux.py,sha256=VX9mKGZZtsaVggyXxfFKOL2pIs-V6Ah1UXN9rktsBCA,7611
|
|
221
217
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/mmlusr.py,sha256=Ib5IPMeTp9m-Zc90YlxSXxJiZWo3tw8WasbuUL33yG0,3974
|
|
222
218
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/multimedqa.py,sha256=0ijOZPjd86pZlUqDGHKK-QRJcJSSWPvbUglNy0uSw7o,3811
|
|
@@ -230,20 +226,20 @@ wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/multiple_js.p
|
|
|
230
226
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/multiple_py.py,sha256=TjowpFLoraDyppMPa7375Ol3NwGs8H1_E1xa68LAhxo,406
|
|
231
227
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/multiple_rs.py,sha256=7GtAWK7iig8vaCW-lI77HXOQCSnuXiN8q16XuvrIyRo,4351
|
|
232
228
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/non_greedy_robustness_agieval_aqua_rat.py,sha256=zcyMAZv7LDOgNdsU-gxVX5PaL8W6IYXOFeaP_l4ZqFw,3461
|
|
233
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/olympiadbench.py,sha256=
|
|
229
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/olympiadbench.py,sha256=OrJQ55-YwI2n3m0wOmKfwj-h-IE79IZIZPLKdJzamKU,9185
|
|
234
230
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/openllm.py,sha256=OLl__FMCKuOIcAq7-nHif4uinknDFQjFKy1yUFaDvhU,3796
|
|
235
231
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/option_order_robustness_agieval_aqua_rat.py,sha256=GOGncOk_KiYVVjNXCgUaaVgxiowRF8avM8PWpaUng_o,3479
|
|
236
232
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/or_bench.py,sha256=R_tpmbnxXHAUEb47CA3s94F0LcjinO6mB_WMZrl2I6M,11101
|
|
237
233
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/penn_treebank.py,sha256=hp1ct35XCY4KQLtJOA36t7K5fl72o9CHDF374oJzBS8,2601
|
|
238
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/planbench.py,sha256=
|
|
239
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/polymath.py,sha256=
|
|
234
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/planbench.py,sha256=CWSq7e3F_NCeiINLkksQ7truDYmuC1YkVgOgUvVuqxU,6250
|
|
235
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/polymath.py,sha256=lI0Fepaf053ygAYCTnbwoMLCSAlWipctJc1uibMog3A,14194
|
|
240
236
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/prompt_robustness_agieval_aqua_rat.py,sha256=g-h6DrOIe4zdNfDUUAqoE90dgBUFbIiEZcxH2Aq-Z9k,3427
|
|
241
237
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/pythia.py,sha256=7cTgI1og4b6qSP3LCkG6m9FRnkmP1IzjT3O7ltis7II,3791
|
|
242
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/recode.py,sha256=
|
|
243
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/refusalbench.py,sha256=
|
|
238
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/recode.py,sha256=V9n8nwSW4Tz3L0bXcZWqQWpin7PJWuecvWqaYesrkVA,4867
|
|
239
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/refusalbench.py,sha256=CPORdQECm2GHTwzYfwYcdY0EfmMQXSL6RwPwQeN7ccU,11767
|
|
244
240
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/scicode.py,sha256=RQUEzLatM8Dys-CWsMahKWB_eAILKTS8exc99REG0Qg,9495
|
|
245
241
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/self_consistency.py,sha256=QclAgUIwl0YPTBKHtlOyI1gSzdHeATmL5-kxgB16tPA,3035
|
|
246
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/simpleqa.py,sha256=
|
|
242
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/simpleqa.py,sha256=20ptnbwjpli4wsYiQUZCdynImpcdcSw4gHxG64Lgeqw,5712
|
|
247
243
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/sorry_bench.py,sha256=orRjSL-mfjtXBWpwd18yNo-XVdUaKTK0RpWLAuiKLhw,8348
|
|
248
244
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/stsb.py,sha256=PB7T85YTTN1W6LvFa61ZK2OI02NZqdOsGi0AyFew2dY,2544
|
|
249
245
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/super_glue_lm_eval_v1.py,sha256=5sjnFalFsICF29k3DIyJ-PGM18yCA8IBQNsJAuZMWBc,3858
|
|
@@ -255,10 +251,10 @@ wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/swe_bench_ver
|
|
|
255
251
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/sycophancy_eval.py,sha256=qAkLC9LxYQIyKc-k-v1pFdHcDzfT7yLhDpX-9l6eIhU,7656
|
|
256
252
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/t0_eval.py,sha256=1eSUGHSbczaaAYWov4WhwgV0p2bHP-B9BOMUdhIXin0,2577
|
|
257
253
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/tag.py,sha256=IBphPJy8Dz0FgEF0WIDMPdcErMiMnX_UbwEBF-hmffg,3572
|
|
258
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/tau_bench.py,sha256=
|
|
254
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/tau_bench.py,sha256=2tkAQhh8-SiiN0U6Kb-MJTJsrUfvJEGZ4UWpXqcqMF0,7210
|
|
259
255
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/tmlu.py,sha256=E2_2XoupBm_LdSiX5Wi6BYabHgXabItq4r8lKh-c-Mk,4550
|
|
260
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/toolbench.py,sha256=
|
|
261
|
-
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/toolemu.py,sha256=
|
|
256
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/toolbench.py,sha256=pWEhmL6qGdir27hJk4xhyTpk3Ei_25txe0yfdW4CZVM,9480
|
|
257
|
+
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/toolemu.py,sha256=QD2BwdIL21l8Wd_AlKMcso-NT8rAmePJK2H2-qAqh0c,8635
|
|
262
258
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/travelplanner.py,sha256=x2_P06ZEQFT2tRNtii3NzWXCH9ItQVZG8t4GN_vRWYM,10133
|
|
263
259
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/truthfulqa_generation.py,sha256=TW1T3_VVfZ3RAQ73xKojUb2sI9eoYMbEEyBUKdqtFOg,4591
|
|
264
260
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/unfair_tos.py,sha256=UnZFX-O-nTbNn3Cic7kZ-x0msQCxC_CEMfI5Ft2OR_c,2805
|
|
@@ -276,9 +272,9 @@ wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/wmt_ro_en_t5_
|
|
|
276
272
|
wisent/core/contrastive_pairs/huggingface_pairs/hf_task_extractors/xsum.py,sha256=zzIp0MeqI7XccHlNEaqL0w3OR3Ukt6lqMYVZQmksAMs,2907
|
|
277
273
|
wisent/core/contrastive_pairs/lm_eval_pairs/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
278
274
|
wisent/core/contrastive_pairs/lm_eval_pairs/atoms.py,sha256=u8RTCYlpUX7X3DHLx9aPlid3xrYPQK6f7Kymj0ps7Ug,9056
|
|
279
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_extractor_manifest.py,sha256=
|
|
280
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_extractor_registry.py,sha256=
|
|
281
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_pairs_generation.py,sha256=
|
|
275
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_extractor_manifest.py,sha256=DcqdQeilSKjY5UYHA-qHFljwjdrfM-1PvaN0CRsdf18,30408
|
|
276
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_extractor_registry.py,sha256=N8VpOE8JG4y8GQM6sxjzqI8M0U06KdjzIjrxVwxYS7U,6005
|
|
277
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_pairs_generation.py,sha256=mCaFhxXoE6EiknkvS6BeznBqOLfeLbmWKULRPuyht7s,8425
|
|
282
278
|
wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/__init__.py,sha256=yxkFjHDEpD33FH1-shObI-jsperBSADjTqZxQrzC3QA,16627
|
|
283
279
|
wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/aclue.py,sha256=jreFoIxdiaOZM-qsv_L8dAkJxXm21ajQR0XUY8LJP-k,1321
|
|
284
280
|
wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/acp.py,sha256=2txurLRPPG4xBLMd0a8LJjF4XAyQHmQon_gp4PbTl4g,1902
|
|
@@ -329,7 +325,7 @@ wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/careqa.py,sha25
|
|
|
329
325
|
wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/catalan_bench.py,sha256=TPUzqtL1du59Dt9EoHaKriyoFromWMAoAswjy52lOeM,3167
|
|
330
326
|
wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/ceval_valid.py,sha256=UNjahQmaNAA4Tbk1VRrwjwskbh62xZjNTcCh75Agu_c,4229
|
|
331
327
|
wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/cmmlu.py,sha256=HAWYWsdvK2s47rmzwf3c1XaOs-NwkVM0ovWByD6klSQ,4795
|
|
332
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/code_x_glue.py,sha256=
|
|
328
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/code_x_glue.py,sha256=Fx-tjjXV01dOJUWp_J0ylLaBsDUYSkpQKz3InC0AKr8,706
|
|
333
329
|
wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/copal_id.py,sha256=he7n0aGC0XjMR4qa2gm0kuovyz0_x1JLEYJNPfXDmuA,372
|
|
334
330
|
wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/crows_pairs.py,sha256=7CTdKKc494cmFzBjofRyp2_dlNwiyqBPiuwlkDyXAjY,2136
|
|
335
331
|
wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/csatqa.py,sha256=Eo22i1KWxQX-PNZ3nGPm3UQSKmP8oxrY3V8zchNwOrc,571
|
|
@@ -340,7 +336,7 @@ wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/eus.py,sha256=i
|
|
|
340
336
|
wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/evalita_mp.py,sha256=_LdM__wODPNdavTHGgLqF3dA_vLHC-ewmydHm8Bs7q8,6644
|
|
341
337
|
wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/fld.py,sha256=FLzUNm80tvs-htbAfm4mNq-HSiu8oEYufTzstf9Nk4o,210
|
|
342
338
|
wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/flores.py,sha256=A75TUNok5NVIzpCO3VwI9m9Izh8pXtIeNdr1v38Kjec,35617
|
|
343
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/freebase.py,sha256=
|
|
339
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/freebase.py,sha256=RtCWXKQwDa70bd3lSnmPAcIWrIBu_QxR2uKHnR9bvMc,226
|
|
344
340
|
wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/french_bench.py,sha256=Rqlk55ooPSoKOp1vQCT-jPsDqinDAC6ot5YkCIy5XwA,1554
|
|
345
341
|
wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/galician_bench.py,sha256=csNGQJO-ML0ViEuvWGDaa-V22tdOylnx0cPsSbbTdXU,3073
|
|
346
342
|
wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/glianorex.py,sha256=diTVUzsCmpkEl-xfnMCmrUChExkEqRPtQpZ2qHmN-Q0,372
|
|
@@ -433,331 +429,327 @@ wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/xquad.py,sha256
|
|
|
433
429
|
wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/xstorycloze.py,sha256=VLiKWLfyDPJnk_L_aLchZVV82KCIU9T6IgSvzYS_ZBA,1186
|
|
434
430
|
wisent/core/contrastive_pairs/lm_eval_pairs/group_task_manifests/xwinograd.py,sha256=RAkchOuJtal6YXe7U1kiNtLJOzepczRuRNqzv3CNKm8,636
|
|
435
431
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/__init__.py,sha256=qjtVqnPSAZjOg-ME9QjeOEkgJR4rImyfGImxEwAEfmQ,7278
|
|
436
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/aclue.py,sha256=
|
|
437
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/acp_bench.py,sha256=
|
|
438
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/acp_bench_hard.py,sha256=
|
|
439
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/advanced.py,sha256=
|
|
440
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/aexams.py,sha256=
|
|
432
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/aclue.py,sha256=ugSEM2fAh1pYaABSjCKNIjTLxdbAGMpw9-ktZFEIGwg,6685
|
|
433
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/acp_bench.py,sha256=Qo7dHcSVzqcNLOkPCfwX8MLQ-XEn2qneQLV_ELdBVmA,8391
|
|
434
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/acp_bench_hard.py,sha256=qgrCO7FZEDzHMJB5OhT7-DVTTQIFk1ztlr18fKrl52Y,7484
|
|
435
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/advanced.py,sha256=XnAnsrWEfz8TyiTJqWN1wgTHtK8oYwX5EOR0SXkRNcI,5190
|
|
436
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/aexams.py,sha256=CwQ7aee2fWqOkDOD4Rj904cZcxE8eoe-4Zmgpv7aRlg,7177
|
|
441
437
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/afrimgsm.py,sha256=ozlEmQHqxsaiH5jb1D1WI9aToAk6psQkduDwq737F5c,3527
|
|
442
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/afrimmlu.py,sha256
|
|
443
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/afrixnli.py,sha256=
|
|
438
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/afrimmlu.py,sha256=1iyuSG1FMUYur7MO6G7PL7XwZZelGWFixTJ_tE2KC-g,4041
|
|
439
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/afrixnli.py,sha256=SSSrkGOqA7paEq6P7NAWVIzwpMZMs5iEPtL2Uc6tQZc,4449
|
|
444
440
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/afrobench_cot.py,sha256=XXg_BHyIHOt_NezgVJ5K8aplTR_rTiX1Eg154L3sTI0,3319
|
|
445
441
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/afrobench_mc.py,sha256=1aRM-_bxDOqWWc5WCfaes_WIbgfs-zurYQkP_PxR660,4114
|
|
446
442
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/ag.py,sha256=4lDiGXPZHhThl6fa6DKho14cGEWLnKDPP_5fdTO8gUg,5438
|
|
447
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/
|
|
443
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/agieval_aqua_rat.py,sha256=oUJD14n4sty8M2b8WXtH84XrC1GJD3r_lqMrZXHL0sQ,4637
|
|
448
444
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/ai2_arc.py,sha256=0Rrn2efrqGl949i30Y83R450uoc_y8o4H31qj46dr3g,3878
|
|
449
445
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/anagrams1.py,sha256=VMEhdDEjXyQscQGSXz98H42LZ75XTuS-QcrARzWx-QQ,3141
|
|
450
446
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/anagrams2.py,sha256=gnfUcTl26pUmoYPGDg5SUBasrmCK1ggB_kIQYsijNeU,3141
|
|
451
447
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/anli.py,sha256=YunlhuOmXsEO0ic8AzTgOz5I7LaYib1IRdTwFTllErg,4808
|
|
452
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arabculture.py,sha256=
|
|
453
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arabic.py,sha256=
|
|
454
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arabic_exams.py,sha256=
|
|
455
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arabic_leaderboard_complete.py,sha256=
|
|
456
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arabic_leaderboard_light.py,sha256=
|
|
457
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arabicmmlu.py,sha256=
|
|
458
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/aradice.py,sha256=
|
|
459
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arc.py,sha256=
|
|
460
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arc_challenge.py,sha256=
|
|
461
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arc_easy.py,sha256=
|
|
448
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arabculture.py,sha256=7tByFxwt6NmXlnOe2MtdAhktfDivwmH41l9R_0i4lnM,7239
|
|
449
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arabic.py,sha256=Z3OC8h65GDsx0AX02Oc-YWaV4pPr7KDe9NS7NXlIipU,3668
|
|
450
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arabic_exams.py,sha256=YYIenYtFxABAp8GMLoDYovFWG4Gal6XZXdk95yhznCY,3855
|
|
451
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arabic_leaderboard_complete.py,sha256=NIMsdln4vJI3MLeuheC8NigPePqFmkTW1hFzNzOxmaM,6795
|
|
452
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arabic_leaderboard_light.py,sha256=jj5HRRyOp3dVl0KNDiCUK2tfxTzJYmyWc1_04pbb2xc,6765
|
|
453
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arabicmmlu.py,sha256=S9O5FfgOUYtMf-WXnB1RnREE7-svYoyg-lz24ItWnYA,6656
|
|
454
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/aradice.py,sha256=0GuCPEHvO1jM0Wur3PQg-syczIvCWvBSjsWpsMvIlb0,11985
|
|
455
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arc.py,sha256=H7MJ0J-sjQC_odavk9yNNmaJpkjm-dZpt1jKW2dpHEU,5140
|
|
456
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arc_challenge.py,sha256=pLZG8oZJ-Rmc2midYKwFCL6X7kfejszEcZRlVKIaPf0,4024
|
|
457
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arc_easy.py,sha256=L7nRJaojsxhKA9q8YJr1dqvcWepuzBt_4bz0KQXLtMY,3979
|
|
462
458
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arc_gen.py,sha256=Eokj_PknnpqUK264I68i0DiAjQVcCQxH5lhDPIZ_zes,3881
|
|
463
459
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arc_mc.py,sha256=TXvAaLY4wAsHuozHBJ4Dp7ryOG9bA4B_AyhYzS-8WRY,4121
|
|
464
460
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/argument.py,sha256=GJt9XdLoXcnJ7_Obat9nK-CenPZNvIaFva7e5XeeXf4,5494
|
|
465
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arithmetic.py,sha256=
|
|
466
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/asdiv.py,sha256=
|
|
461
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/arithmetic.py,sha256=38DtqaahEE--j8ZgSPaJzrCYf3FyWNlWm2Eo52Pmw_M,3826
|
|
462
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/asdiv.py,sha256=NIJyDHcKGAUYjp68MVDIlp7WVBJtfKQkMsrDvT9HyKU,4161
|
|
467
463
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/assin.py,sha256=w0CEpwyxBfHa5SDXEUc-rTbogw9f6vqT7gPiND-XNa0,4158
|
|
468
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/babi.py,sha256=
|
|
469
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/basque_bench.py,sha256=
|
|
464
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/babi.py,sha256=VrYfjZXZBk9RuDdqytZKMV9lnvw9GbWc9GkHdF-Ux6w,6105
|
|
465
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/basque_bench.py,sha256=89rrlIBniuODiwhU4r0y2kIZ4RudOH5pTgSfHWU4tTQ,5967
|
|
470
466
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/basque_bench_gen.py,sha256=Er8ufToEqS5vRAbl5eHTz7Ihwrv7WYCHdm_WN-GOqWI,5983
|
|
471
467
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/basque_bench_mc.py,sha256=F_dnN_Yips5nEX9ZW-nOM4HvA5a6XQ4-WCkeUsig_Ac,5383
|
|
472
468
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/bbh.py,sha256=QyL31K5p1pSAoOeaThMXcqjXvn5ARZeyn458y6wIpVw,4730
|
|
473
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/bbq.py,sha256=
|
|
474
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/belebele.py,sha256=
|
|
475
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/benchmarks.py,sha256=
|
|
476
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/bertaqa.py,sha256=
|
|
477
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/bhs.py,sha256=
|
|
478
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/bhtc.py,sha256=
|
|
469
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/bbq.py,sha256=zprXP8p3zKRTPtGWjPO-GVcrpdf6nzrGssonw9AgZlM,6632
|
|
470
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/belebele.py,sha256=yID74I8e0QJIBHS5XfMpaaRQ6B88P8uhqUTvtsKZcv4,7155
|
|
471
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/benchmarks.py,sha256=5qTiZKdLlpJ2NInL3JrtbeevVC5Vdf8s2vgV3wg-WYw,5954
|
|
472
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/bertaqa.py,sha256=gENly4KQM11xUc7JplTO9tpEsecDwGx7EI8saNuDCoI,6463
|
|
473
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/bhs.py,sha256=CEVXu-cfKba-SArF0Z3-48UzLjIkAZa4P9we0dII-Dg,5884
|
|
474
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/bhtc.py,sha256=VzOGeGDLyJhhDfJiY29Kl1Fp0gFEGU2vVTpk7mLJJU4,5666
|
|
479
475
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/bigbench.py,sha256=Yww82fQuUbEANLotw7vP7m_EDoA9CNRWPvgrB6B-wvM,6613
|
|
480
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/blimp.py,sha256=
|
|
481
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/blimp_nl.py,sha256=
|
|
482
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/boolq.py,sha256=
|
|
476
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/blimp.py,sha256=FWLTaIqd4TuTBkLSLyu_ygHoPkbmvQhB-06mTJ6alDg,6656
|
|
477
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/blimp_nl.py,sha256=LlLs75FCg2sbxbULNiiCAGbU8GZrkZNXOXEiHGQ_EK4,5865
|
|
478
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/boolq.py,sha256=NA7TnsMmr887DKQoCRwgq84-veJ-VQdXPPfg09_IkdA,3966
|
|
483
479
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/boolq_seq2seq.py,sha256=-B7CD59m5m7WmL6ed3Ior9Zt57kl4jTOlbOkv9p_iFY,3998
|
|
484
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/c4.py,sha256=
|
|
485
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/cabbq.py,sha256=
|
|
480
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/c4.py,sha256=gangKka_3u7PoivPFCpa_iCSk2TfO86XcGD2ysUwiWs,5684
|
|
481
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/cabbq.py,sha256=9qX7C6QfAmaepqc89FLkaXlCinNk7W1iiphSlfurZco,5840
|
|
486
482
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/cabreu.py,sha256=_dS87XtZBWSvjTyzvBRjaK-dN0Fv6kDihux5PEj7neQ,5046
|
|
487
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/careqa.py,sha256=
|
|
488
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/catalan_bench.py,sha256=
|
|
483
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/careqa.py,sha256=GDW61WgODlfcgcIhuP5BuCXDbQ-XHAtT4pDmq7yUGmA,6677
|
|
484
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/catalan_bench.py,sha256=M0Ms2i5mOJFw9ayF2qySwSTqrKDJwIVht2im6eGUWkg,5977
|
|
489
485
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/catalan_bench_gen.py,sha256=vYrbmDvEWetRTxFYa00e-EPmcG698rWSNTj6abBxUs4,3976
|
|
490
486
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/catalan_bench_mc.py,sha256=U27A3A9nSYqKmqSPWeVBU66eIDiw4Y7UjA0YttcELEc,4150
|
|
491
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/catalanqa.py,sha256=
|
|
492
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/catcola.py,sha256=
|
|
493
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/cb.py,sha256=
|
|
494
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/ceval.py,sha256=
|
|
495
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/ceval_valid.py,sha256=
|
|
496
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/chain.py,sha256=
|
|
497
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/chartqa.py,sha256=
|
|
498
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/claim.py,sha256=
|
|
499
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/click.py,sha256=
|
|
500
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/cmmlu.py,sha256=
|
|
501
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/cnn.py,sha256=
|
|
502
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/cocoteros.py,sha256=
|
|
503
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/
|
|
504
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/
|
|
505
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/codexglue.py,sha256=qeZu8Lzj_aXbWBQYTtuhEwor2ZO9n7V_WelVLLX1zIw,4288
|
|
506
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/coedit.py,sha256=jHan7PwlX3wyQjsW49qzAw-P7DlJPYjZQ-tEoNiU-l8,5875
|
|
487
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/catalanqa.py,sha256=7GigYh1OrjB29b8E5UAbRZlWT2_IuS-ZZc8JyukRxgk,7158
|
|
488
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/catcola.py,sha256=Q2zzNtKybvSQAQlyAJusubSur64W1eFEVyqO5e0vFRs,5411
|
|
489
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/cb.py,sha256=25a1mv3hRta1zna4r34nbUcaygCWLMXLm88XEa98Cis,4026
|
|
490
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/ceval.py,sha256=Gx3Iw_TwdT_QK7i4iW0anY5IRjRMa5N09a1UlpKDXbM,8542
|
|
491
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/ceval_valid.py,sha256=EDuO2CXJAeOE8CQylKY2MTKhH8NCwJFnP9WMZPyNskw,6224
|
|
492
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/chain.py,sha256=b0b7oclVtf9sqxlVODN76UFG5Skua1zxfyBs_bXy1_8,4249
|
|
493
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/chartqa.py,sha256=lh25ISyWo1LRUoIGrSMsOm90PJzdqVu2zoo6SYfhGAY,9215
|
|
494
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/claim.py,sha256=dKNl-GGM7Hb2KBMoJA3hng9Vnu3jGATmfgG4clDnn2U,6132
|
|
495
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/click.py,sha256=v_qtf7BlJYh3stuKA1964i1OWnF8DfEOvlKcdwi01rA,5840
|
|
496
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/cmmlu.py,sha256=J1RwrSTizqoEoSBpR8gYQLbVVL8MBM48Jj7IOvIdcDE,6563
|
|
497
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/cnn.py,sha256=rOBp8Lavy-H-x6C85C1CxZaInNDkxGGmSQT1yoHte4Q,5740
|
|
498
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/cocoteros.py,sha256=zBoML4lLS2jSKtUKvgcdtmEEgemMSUaqDaAkUp52pEg,5936
|
|
499
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/code_x_glue.py,sha256=D14EUwniYnfUP7Z5mU5zRfkPAd1bCtYwEMd0tAavAE0,4511
|
|
500
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/coedit.py,sha256=iavlWyD1b2i5cRTJNiPVH7FzgadL8_BoHOVTHXZc3ms,5777
|
|
507
501
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/cola.py,sha256=dRnZPR63cbrzVyiklwJX05cMB2fUTujZhNpQC6IVG6c,2996
|
|
508
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/commonsense.py,sha256=
|
|
509
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/commonsense_qa.py,sha256=
|
|
510
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/copa.py,sha256=
|
|
511
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/copal_id.py,sha256=
|
|
512
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/coqa.py,sha256=
|
|
502
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/commonsense.py,sha256=Z2TFnlZL--wWUWfRTaxHluiO3YgyPOB2T0BmvOkKryc,4198
|
|
503
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/commonsense_qa.py,sha256=dw_8F6yZxbr-Vf6v0yDNTqq4WdLOQQNEz2GALmuhuvc,4467
|
|
504
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/copa.py,sha256=xK9HQShXUwMxzLSaTRDfRgYEEDlKjTIK7HeFIXSBvo8,4089
|
|
505
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/copal_id.py,sha256=vK6mFf1mXehRsWqzXDDfr4MxLYRBv2pmSX5Qk6wgT5I,6727
|
|
506
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/coqa.py,sha256=wL2jO8QEO6F6XmVLKGbKKOcUAjisX0mo3M_899LL8T0,5711
|
|
513
507
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/coqcat.py,sha256=ebeI1P36JuauSiy2cuk8-BZahZfc8ylxeumXkh1me0c,4241
|
|
514
508
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/crows_pairs.py,sha256=IMDNwLFfzLxzFlF3TIdINstY4-XIrUfrMtUNmDn7g8w,6042
|
|
515
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/csatqa.py,sha256=
|
|
516
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/cycle.py,sha256=
|
|
509
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/csatqa.py,sha256=4CX8ew2lcE60_CgEc-595xyc2YTS14H5cBjyLdBPq6I,5849
|
|
510
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/cycle.py,sha256=plRdY59xzT0UYRLSw6v2_MZD31aHBNZIcxy9AwO5cn0,4174
|
|
517
511
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/cycle_letters.py,sha256=MUH1UEnt0ox2FCkDWrfatN1uoxNm43ut1SaToBYmJRg,3166
|
|
518
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/darija_bench.py,sha256=
|
|
519
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/darijahellaswag.py,sha256=
|
|
520
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/darijammlu.py,sha256=
|
|
521
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/dbpedia.py,sha256=
|
|
522
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/discrim_eval.py,sha256=
|
|
523
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/doc.py,sha256=
|
|
524
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/drop.py,sha256=
|
|
512
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/darija_bench.py,sha256=I8DTdKhuNbNH2_BxCdACA4VO7hdn5zeEE7BW7KoOM8M,9044
|
|
513
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/darijahellaswag.py,sha256=zKa7oglGaoydRfFUs3ZdDye3H2l42aHU8dWOrEWs-gM,6679
|
|
514
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/darijammlu.py,sha256=yq2opVGKVbjSn-nN4scVUwBqrb3VYNYkwRyKblkLjYU,5885
|
|
515
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/dbpedia.py,sha256=6bW_HnrKD2zXP4FbHKyjeZqLYbPN1W9DfvYbjpTi0ug,6025
|
|
516
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/discrim_eval.py,sha256=kpv5zLpZDwisrGPh4DcDZ1iaVGiC0ahsJQhVp0C32f8,5901
|
|
517
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/doc.py,sha256=ZNq54kLCLbZWlqymCWxSTbrQQNSgYLgFCy95jXIxaqQ,4166
|
|
518
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/drop.py,sha256=Cm-vVcnTFP4FCxWspNCJIMslKTEOsZ2MeP3qgMWcJrQ,4307
|
|
525
519
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/egyhellaswag.py,sha256=44eoNICcU6-zYrmpUl4YGuJqSqBJ9KTew6Wzj-qfH-k,4577
|
|
526
520
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/egymmlu.py,sha256=Jtia9IzuQm_FU_3vk0o0BG7za_TNP_YvSiFk10J3IqA,6369
|
|
527
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/epec.py,sha256=
|
|
528
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eq.py,sha256=
|
|
529
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eq_bench.py,sha256=
|
|
530
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eq_bench_ca.py,sha256=
|
|
531
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eq_bench_es.py,sha256=
|
|
532
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/esbbq.py,sha256=
|
|
521
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/epec.py,sha256=7_kFNMaMeBUNGv0sLo6zeRFm6NCAGmA9FuTbB7gYqtg,5615
|
|
522
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eq.py,sha256=oMj8G_mavAIPwneiAj45sEdZtGxCv-OnF_EYGd-J5H0,4162
|
|
523
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eq_bench.py,sha256=trjP3M1F8mCS-olXBCwYmOwnZCbRIh3e22Adt_paqtE,7947
|
|
524
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eq_bench_ca.py,sha256=FLWrFZ6YvKvc4YbiP1V2gTpxcHdwMO7qwyKgEDOA4oI,5890
|
|
525
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eq_bench_es.py,sha256=7frvhFFJZbbM1k51Pa7EF9T4RC2zhYP6aej10Y4CLzU,5890
|
|
526
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/esbbq.py,sha256=dhZU355vFqg9sxaum2oY5yE6xBluZyA-kYTprZw5lio,5840
|
|
533
527
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/escola.py,sha256=cDZkmuv0TXe4ShayNiLxMnaXP3B_9W7cxAOb-z3UO2I,3121
|
|
534
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/ethics.py,sha256=
|
|
528
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/ethics.py,sha256=PR6tReNsGQTvsh0aiRXpVSW6X4VBdZemC3aE_5PldtM,5473
|
|
535
529
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/ethos.py,sha256=TcDYU5eG0Ti4UumMVDt_RqjohJf9nESuxsXIhqyPCXU,3860
|
|
536
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eus.py,sha256=
|
|
537
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eus_exams.py,sha256=
|
|
538
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eus_proficiency.py,sha256=
|
|
539
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eus_reading.py,sha256=
|
|
540
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eus_trivia.py,sha256=
|
|
541
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/evalita_llm.py,sha256=
|
|
530
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eus.py,sha256=tiSAOFOwVOt2vLcya-CHb2BuMvIVwUYrVnbP5LzFuFM,4166
|
|
531
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eus_exams.py,sha256=0vIbmOjebDq61eY55U53QtMmyL1c-kiMaRZElQHUSiQ,8633
|
|
532
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eus_proficiency.py,sha256=Ci966oYVevN0GvojhEtPwFVV41Cww0fIkJLzSAle6kI,6242
|
|
533
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eus_reading.py,sha256=TKpnuAYGBKtT8Zg-dXu-WCP1gdUBKBvWQn-tttYND8Q,6194
|
|
534
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/eus_trivia.py,sha256=rAviUzX3XBRX3DC1BzjRKJvkx-TSAj46KHs15fpi7pw,6214
|
|
535
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/evalita_llm.py,sha256=r0bOBF8hDE94f3dI55-wwFU_8mvHodsBE5h5WMzL9jk,6498
|
|
542
536
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/evalita_sp.py,sha256=rvmw3MJpPHln4p2FdA8b1n9lcd-x1wvBJcUALH5nHm8,3970
|
|
543
537
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/fda.py,sha256=WsQZGYDZUwb_Krhy9RjO6c1eSjIMdLif4osWB8eAq30,3944
|
|
544
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/financial.py,sha256=
|
|
545
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/flan.py,sha256=
|
|
538
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/financial.py,sha256=G1Q1R7OtQnNYPgHGhPKNDj82QprGs8urN9BBJP2JAGY,4190
|
|
539
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/flan.py,sha256=J5vWx4ToYRa_HHELcCLDDFhNnE3i96-VymOKMbOsdFk,4479
|
|
546
540
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/fld.py,sha256=GA7Jlu4XtE0nbS0lGCjx50lt8eJk5ZlT3bTtFyUX-v4,5216
|
|
547
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/french_bench.py,sha256=
|
|
541
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/french_bench.py,sha256=T53Zno0Wl8YX-CUHa7ZEgxfxVMb4RZbzJ3yJF7ZzV_s,7722
|
|
548
542
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/french_bench_mc.py,sha256=H7BUHk857ioHCu9KhCjX6OTasagalE3_tk_Nw3Y1e2k,3616
|
|
549
543
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/french_bench_perplexity.py,sha256=ZWiytkj1TlCmKfouvpfJHz2dVmGMZ6ScDrOFXVcdPOA,3119
|
|
550
544
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/galcola.py,sha256=0ORvzlWMGi-9ybDKWSPG5pDe74gPTyigiHlMcB1fG6w,3960
|
|
551
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/galician_bench.py,sha256=
|
|
545
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/galician_bench.py,sha256=ctDWeenE6krvghsqse5tcgGUCzhhb6KioO1qW5P7Te4,6024
|
|
552
546
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/galician_bench_gen.py,sha256=3-GQBmOcYU_AH4kkVuudC-0i3z8zUR7gGMFH6SU8M0E,3956
|
|
553
547
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/galician_bench_mc.py,sha256=uuFVeFyNfEp-YUpNJshadahCvG8c5AAlr0ebxHAO7gc,4159
|
|
554
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/gaokao.py,sha256=
|
|
555
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/glianorex.py,sha256=
|
|
556
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/global_mmlu.py,sha256=
|
|
557
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/global_piqa.py,sha256=
|
|
548
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/gaokao.py,sha256=o2ExOEuontJ6GXY6ZzTaZ5wMcGkYhr42gMNYDKDgruU,4793
|
|
549
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/glianorex.py,sha256=mR11nyPK30FI87QTY28KkchHX38FMOhfUjOS_ZYDgFI,4467
|
|
550
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/global_mmlu.py,sha256=FJD58ydy1HKlh1xV2lmu8_chrP89BvxafT2Z-2uunwQ,6346
|
|
551
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/global_piqa.py,sha256=SAHydNoxdWBTBptZ9GzaDVgMemeJxn4twxn03F1d2l0,5892
|
|
558
552
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/glue.py,sha256=zIk_KN6wOCs-1ZBNvWr2VAGaRK2-0rX2pmFBQYWyIas,3739
|
|
559
553
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/gpqa.py,sha256=OnRcBqQks1j0d2wz-Lwv1kt1HRdzo9v8djF50yWxO2Q,5641
|
|
560
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/gpt3.py,sha256=
|
|
561
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/groundcocoa.py,sha256=
|
|
554
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/gpt3.py,sha256=gdCB1n7nQLgFbJ_8dDYmb_jRdMc74dx6iO1M251CqPw,4256
|
|
555
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/groundcocoa.py,sha256=wRRmgtI49KjYNeeAncqbphuRc3wz1PyIX-xRtk6PQnY,7148
|
|
562
556
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/gsm.py,sha256=JlretZyrsYcmJ0KyPYFWGLYFx8Cvt3-TvhgUOjahEmc,3830
|
|
563
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/gsm8k.py,sha256=
|
|
564
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/haerae.py,sha256=
|
|
565
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/headqa.py,sha256=
|
|
566
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/hellaswag.py,sha256=
|
|
567
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/hendrycks_ethics.py,sha256=
|
|
568
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/hendrycks_math.py,sha256=
|
|
569
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/histoires_morales.py,sha256=
|
|
557
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/gsm8k.py,sha256=zGkwC5Tevv7B8RBA-3D9EOykU_XLoJ7BNfiZrtX0vlE,4598
|
|
558
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/haerae.py,sha256=60CPOeY7U3EfYtHO3q9jQzkxZaAy5laSTsjwFD4cQdQ,5849
|
|
559
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/headqa.py,sha256=Iq2e9XUwIQGMLDjI1xTSPEBwOMac2Qbm4XfiwGJh4_4,3821
|
|
560
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/hellaswag.py,sha256=B0LblxA_p9RvfrNU0xtnfmqMQD_d0gnap-HfiyQVcQQ,4358
|
|
561
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/hendrycks_ethics.py,sha256=igjBc-aZvR9_TtDWXb95_6DyHHRfaIROyAFon_p5UP8,8949
|
|
562
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/hendrycks_math.py,sha256=VO3w2xgWNmoP4F0wUnogeNdfpOKdWEBOniPy99Vo5A0,8752
|
|
563
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/histoires_morales.py,sha256=Dg99_Dm3_o5Aq-zD6cTnOyU73D1nenJIJLSwYfZuHVg,7138
|
|
570
564
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/hle.py,sha256=l0PNHf3taiF-UhE5VO7_GFXwtD9ReR9h1B9-eJ-ukyA,3791
|
|
571
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/hrm8k.py,sha256=
|
|
565
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/hrm8k.py,sha256=VQmK_k7LvfDCd8lIdDIorixI17hGwFp91AutrXC9A6g,7613
|
|
572
566
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/humaneval.py,sha256=FBNiL5EvqxbtnNurZDKAgiTb_P28_S0DVQN3QEKBGgY,4377
|
|
573
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/humaneval_infilling.py,sha256=
|
|
574
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/icelandic_winogrande.py,sha256=
|
|
567
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/humaneval_infilling.py,sha256=byUM6QcTKPuRaYAWI7De9JX66hOVydYCod13XLaV2wc,5964
|
|
568
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/icelandic_winogrande.py,sha256=Jo30iNd2em2VqkMqw0wXOeBQMZwIa8aW9ObdkY-oCno,5973
|
|
575
569
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/ifeval.py,sha256=J7AHYgnEKuePzvIR9pmMsCoaJNs6QIaSIt5MHLIHjUo,4225
|
|
576
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/inverse.py,sha256=
|
|
577
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/inverse_scaling.py,sha256=
|
|
570
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/inverse.py,sha256=n1PN49RGM4tfX8-UWPkaH--HhiIhued36iyPfKJM1e4,4182
|
|
571
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/inverse_scaling.py,sha256=K-8CHHaaLvw-EqBHc0Gn4Lnr8XDryhx4JisoV9RNzbA,7582
|
|
578
572
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/iwslt2017.py,sha256=noRk2FxmCjnk2RgGHWuvaoT3PqnjF9H-V1b8fogqKQ0,4444
|
|
579
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/ja.py,sha256=
|
|
580
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/japanese_leaderboard.py,sha256=
|
|
573
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/ja.py,sha256=9T8MhKPLo6xrUrxiAZZ_dqRY64kAymKu8fBj6sj69tg,4162
|
|
574
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/japanese_leaderboard.py,sha256=6IIqSgI-UUO-KbrP5rjvDBNNDLa9qCKI9tFJBmXLJHU,6052
|
|
581
575
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/japanese_leaderboard_gen.py,sha256=K3abgi4Mywn9BQMSQz_V4Hg8etbLHrBE-NpJa3LIivg,8857
|
|
582
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/japanese_leaderboard_mc.py,sha256=
|
|
576
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/japanese_leaderboard_mc.py,sha256=Ay9u6qetRNMElAD09upugrgVe-zEyHrGDxoNfHaMtCA,4993
|
|
583
577
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/jsonschema_bench.py,sha256=q-smnHB3IBpuSUebVPkcZGCqwZc6UEGD7p4MpvVNW4A,4687
|
|
584
578
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/kbl.py,sha256=ZTQ_2CF5Rj1xgU7bnZAVrDvv9F2sVORrCCmR9ZjOjEA,5179
|
|
585
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/kmmlu.py,sha256=
|
|
579
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/kmmlu.py,sha256=WaK0OCbwvTrLN9KNoaEPDNxvQ9rMHaazp2XNSQIuJWY,6553
|
|
586
580
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/kmmlu_cot.py,sha256=CvAVl1xMmvKOhpMd5INKXGjZs7wolf-hyLD-oBsH6a4,3291
|
|
587
581
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/kmmlu_mc.py,sha256=v2KK3DCmTkZyVmkw9gSTHElHV28AAp9Dji2vGizd_kE,4086
|
|
588
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/kobest.py,sha256=
|
|
589
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/kormedmcqa.py,sha256=
|
|
582
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/kobest.py,sha256=gyr3ovj-XiL-8mHLFXuKAqi7m8swhY5BmOmwkhj3aeo,6527
|
|
583
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/kormedmcqa.py,sha256=rCEJUWUHqLIILlFWwlGJsaWml2Fx2dl7bd0wdA_FIt8,4922
|
|
590
584
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/lambada.py,sha256=kFbqrlO0SSn8QBhVvFd4SvoQzr79efmHBrVOBgDM9VA,4892
|
|
591
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/lambada_cloze.py,sha256=
|
|
592
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/lambada_multilingual.py,sha256=
|
|
585
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/lambada_cloze.py,sha256=EWi9aPHaDCB-ENFw5qPtXuRouO5t5MFV1lEKmF_4PUg,7112
|
|
586
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/lambada_multilingual.py,sha256=pV_oP5ZPtulZOWbMvbJf3BCpy2_msFps81f9rObB1TE,7199
|
|
593
587
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/lambada_multilingual_stablelm.py,sha256=S8IBwsTM5yRzE2RRfjF4XakO9QxcIF_vmLbUceh1v4A,5157
|
|
594
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/law.py,sha256=
|
|
595
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/leaderboard.py,sha256=
|
|
588
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/law.py,sha256=O9ppiN_atyGsui7s0_Z2yyW8Lw5gy-TaGsc70Qk9HE8,4166
|
|
589
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/leaderboard.py,sha256=qPopTbVEHUAlto9jdXKfOXnpB_kpdIZRB-zxAhxT0qA,7977
|
|
596
590
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/libra.py,sha256=le4wRHUc2Dpq0gTzS_lQKCZ8zBvlYMVFq0OMkzkdrck,6107
|
|
597
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/lingoly.py,sha256=
|
|
598
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/
|
|
599
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/
|
|
600
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/lm_syneval.py,sha256=3N2Bt-aAaxugVmQGwt0MdQZ1qKzm8i_qWuqeQJ28zZ8,5981
|
|
591
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/lingoly.py,sha256=YIs_p-KVcRoumvs4QDSHV7dpHD5YBpTSMaMSsCZTUvE,7654
|
|
592
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/llama3.py,sha256=PCFYQ1atDy_8gWAG31zca-mtDtfqVyHm8nO1MRYbWyY,5849
|
|
593
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/lm_syneval.py,sha256=efyC-bmiBxJbcSNcNm2w23ZB7pt_TW5i6BKJbqDoaUw,5883
|
|
601
594
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/logieval.py,sha256=b8mWP5I0RUsmLSDE0UyYg9VC87C_qGQWn8Uq78G_dAE,2932
|
|
602
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/logiqa.py,sha256=
|
|
603
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/logiqa2.py,sha256=
|
|
604
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/longbench.py,sha256=
|
|
605
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/longbenchv2.py,sha256=
|
|
606
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mastermind.py,sha256=
|
|
595
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/logiqa.py,sha256=oBfvYiaEcWFnVRjqMbMgZtUbbOdQpRoQuRsZhuB2qz4,3935
|
|
596
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/logiqa2.py,sha256=EE8M804oNuftutfk2Ex-GHxQpU70_og24eDvkIYbXaI,3846
|
|
597
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/longbench.py,sha256=LSP40aDEXGFCK3PxkmMe28j4E3p49EoPFv4We9nLGQ8,5876
|
|
598
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/longbenchv2.py,sha256=B9zYsogZNQKWAXrjA03tQLtijXX42fnmzwohrsFu9nw,5894
|
|
599
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mastermind.py,sha256=ZF1dsVeI5HCtgf57XXkIW2KCMo7aiaWjhcUt1Yxo3V0,7911
|
|
607
600
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mathqa.py,sha256=Pd-E5D6pRWjN7J8rMVy3IbnU4DuEd-20tAyHrMkxiYc,4779
|
|
608
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mbpp.py,sha256=
|
|
609
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mc-taco.py,sha256=
|
|
610
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/med_concepts_qa.py,sha256=
|
|
611
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/meddialog.py,sha256=
|
|
612
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/medical.py,sha256=
|
|
601
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mbpp.py,sha256=qkCmDbZcE5gOYMMeJrvoxjtZxq9wa7bHiEGpi1Sp1EE,6035
|
|
602
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mc-taco.py,sha256=JLSBGNYt7oCT1-_-IE8y4MiVTxWgoEw7PAC5TXZr8v8,3916
|
|
603
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/med_concepts_qa.py,sha256=74Br8u-kBnBTHh0LhoqVXHJ6vMBJGPtXfim33A-a9SI,8677
|
|
604
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/meddialog.py,sha256=ilYrl8A_YWPGZS3A3-leh-h57tXr4gdqZBXNg-Rc_f0,6984
|
|
605
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/medical.py,sha256=EOrfPnejfA257_Fn9CuXWgf9-0_8M2AunW6DmjLLrOs,4182
|
|
613
606
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mediqa_qa2019.py,sha256=W34U00Bk3jwolmds8-P2X-3fSULK4Eo2k0hACs5Qf_8,4796
|
|
614
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/medmcqa.py,sha256=
|
|
615
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/medqa.py,sha256
|
|
607
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/medmcqa.py,sha256=Sz2cFTbHTzKWa9xxWrVnw0XkAm0xlL7NKmpZOXiXBAI,6613
|
|
608
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/medqa.py,sha256=-aOWbDE6OzeXbjBiAWAnaR5v-gmsAsPRd3j32k78xhw,3972
|
|
616
609
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/medtext.py,sha256=OeKPSgBPfz7XjboeW3KGVmSq19xjAFp6dYz0tASwujA,4143
|
|
617
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mela.py,sha256=
|
|
610
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mela.py,sha256=uhfXLPsl8bGp2PpepmlGOBZPU0PV4xBMBZDNVVvrUMk,3774
|
|
618
611
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/meqsum.py,sha256=C1DZEn4peQm9GVfMs4fE0yKkMzwCXReZ88rsFzDSigk,4259
|
|
619
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/metabench.py,sha256=
|
|
612
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/metabench.py,sha256=_fBlmz9305jGNkEYNCbA_r_03d-WZMq2z45Mgkh2_uM,5943
|
|
620
613
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mgsm.py,sha256=K11m-ohBZ5Pxflp9ZaL8rXIeHbKmpHj2rX-uba72lcA,5060
|
|
621
614
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mimic_repsum.py,sha256=VjHLEhKwuHkHo8s8gnLg_5qR5XE3wdnizdzxQVGOG64,5351
|
|
622
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/minerva_math.py,sha256=
|
|
615
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/minerva_math.py,sha256=pUXHtXk8qkOFKOKMuFN8fzqPjdko5i9a585OwWjwO24,7115
|
|
623
616
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mlqa.py,sha256=VSx6TrBBLl125o4tF_m6o8e4huRInd8-dKs4lMkTdEA,5659
|
|
624
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mmlu.py,sha256=
|
|
617
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mmlu.py,sha256=wtnv8mUk50QhOKOgjq7T-OTv8UUMFhVt2V4bGpanY1E,5377
|
|
625
618
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mmlu_cot.py,sha256=5wtrR3gLHlhf6qy_yA7rQZOl6zxumrMbd59LqMSw7EM,3284
|
|
626
619
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mmlu_mc.py,sha256=MI_L-X1QK9OglTbxNYRhkL-nBRumVXGPk_nLRZpt700,4079
|
|
627
620
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mmlu_pro.py,sha256=A1xG34WxJmIkrRsGtFX_Bfr8rKFIjFl3kLlJnYplO9w,5353
|
|
628
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mmlusr.py,sha256=
|
|
621
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mmlusr.py,sha256=XKr1C6Q_Z1e0wjcQnxp5q5uhoiy5xILeWGwiFFuDBX8,7847
|
|
629
622
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mmmu.py,sha256=3Hh2-BdiHZpz528vPniN9f0Ac5dhuoo0J6_wRg2grN8,5606
|
|
630
623
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mnli.py,sha256=tZvZzsyp2Gxk18KEECx8uX2JLvB4VFKyJgTI0S6CGLQ,4241
|
|
631
624
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/model_written_evals.py,sha256=y-NGZVAl2AA0mN2kaFwZoNV6TouR6L-3kAWatld5q74,4591
|
|
632
625
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/moral_stories.py,sha256=cUK-aNA25X-hJsv415dz_J8I35ChcinYMYAPMbP4y08,5957
|
|
633
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mrpc.py,sha256=
|
|
626
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mrpc.py,sha256=Xr0putTvWkF0K-e1yJ_7TZflcaJG0ziyPnMr7uqJK7E,3772
|
|
634
627
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mts_dialog.py,sha256=x54oU2Wr1cg_7X1NYO-gBSV9iEbI9pRykEwR9Zlsg1o,4308
|
|
635
628
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mts_dialog_perplexity.py,sha256=o3ZsLcemHjPb2qCJlv7i7kFKLFkKKbRIIshjwmPTdcI,3622
|
|
636
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/multiblimp.py,sha256=
|
|
629
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/multiblimp.py,sha256=WRQn49f2dV_aF0H5qoeoQiM5cFk9KSnKRwwYL1rmGpY,6056
|
|
637
630
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/multilingual.py,sha256=9VBd8kU21XX5P733a1qf8JkID1sdo6m7myZJJcq1kJc,3722
|
|
638
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/multirc.py,sha256=
|
|
639
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mutual.py,sha256
|
|
640
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/non.py,sha256=
|
|
641
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/noreval.py,sha256=
|
|
642
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/noreval_exact.py,sha256=
|
|
631
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/multirc.py,sha256=euSnkmCq0i8kZULtd36kSr3Eb-cfX2RGU37oI46rQLw,3890
|
|
632
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/mutual.py,sha256=-74jVzJ5_Fk5WImwjSHjIBSXfxG4NZl9WT8saZh2hE8,3799
|
|
633
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/non.py,sha256=pGsL8VhdqMCRqhYz4Z0fczdebv8vNxeYcSnuVuxMB1w,4166
|
|
634
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/noreval.py,sha256=B1PTCgZd6b_LTTf4pAorQuxubvEjMQtuZzmr383M3Ic,6875
|
|
635
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/noreval_exact.py,sha256=r1k-0QnTMhvLHffjSd1KEa-vDGQ7YbeG3ax9u23t9Ms,6042
|
|
643
636
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/noreval_gen.py,sha256=KROJgvdvAtd_Otrnss_EzPxF6upZiBmRRAYzvxJzVsE,11344
|
|
644
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/noreval_gen_exact.py,sha256=
|
|
645
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/noreval_mc.py,sha256=
|
|
646
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/noreval_mc_log_likelihoods.py,sha256=
|
|
637
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/noreval_gen_exact.py,sha256=VHXF9nZypig9k6ARHqLj7EVjM1dNQI6vpCuQudWiRyk,6374
|
|
638
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/noreval_mc.py,sha256=UUmYAQ3h9Rp2HTZN0Ahel9bx_mr-QWRFn1j1p_rMEEA,9347
|
|
639
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/noreval_mc_log_likelihoods.py,sha256=vGVHM16g4CzZkFe5flLJxTIPbaNTQe-GcLZSaERYU6Y,9136
|
|
647
640
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/noticia.py,sha256=fBvmsoMiGB-N5FZ3t39ZnTW44cKPIrXYpKZ-iBrWLjs,4896
|
|
648
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/nq_open.py,sha256=
|
|
641
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/nq_open.py,sha256=pBHE0l28uUO0a9vuo_w5oZM6OAmhqp5bVLUTYcaY4MI,4578
|
|
649
642
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/okapi.py,sha256=WiABcd4en7SjqkTsKq9ACWB_-tPULj6myzrjqNCevKk,864
|
|
650
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/okapi_arc_multilingual.py,sha256
|
|
651
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/okapi_hellaswag_multilingual.py,sha256=
|
|
652
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/okapi_mmlu_multilingual.py,sha256=
|
|
653
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/okapi_truthfulqa_multilingual.py,sha256=
|
|
654
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/olaph.py,sha256=
|
|
643
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/okapi_arc_multilingual.py,sha256=-j6fmTQ-atZwLdX9A9h7ATYbum59fs8Z86PelUpe2xs,6737
|
|
644
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/okapi_hellaswag_multilingual.py,sha256=XZlWDfBQKfGT6i9ZvilsTdDaB7vusrkXon_Lzp3mAqc,7326
|
|
645
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/okapi_mmlu_multilingual.py,sha256=hBQc0zzirsYrYSPqQS75ogDry11ESli1tAYN2OPrwWQ,6520
|
|
646
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/okapi_truthfulqa_multilingual.py,sha256=cIluL4k-oM8GGfJjbAolExdiBfmmiG3MUjPucmlH1j4,9298
|
|
647
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/olaph.py,sha256=7Z5MpTlpyQNcr0Hfo8znYYEy-Nx9bP-1iRQaN8Lt9mM,7181
|
|
655
648
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/olaph_perplexity.py,sha256=3aff3dr8ZHWw4_FRVqweVQNL16VmHokKlmsoTyBSuVc,3594
|
|
656
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/openbookqa.py,sha256=
|
|
657
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/option.py,sha256=
|
|
649
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/openbookqa.py,sha256=qEYzfmDme-kv6GoA2y6bh8mPVZLi1rSx5KKX9Pc_nj4,4054
|
|
650
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/option.py,sha256=UvciLPmH-M2o-4W8WsyiMnpkIpCyLRxy0tSWPMC_Uz8,4178
|
|
658
651
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/paloma.py,sha256=Y7vKEU051LHAtmzb7lAO7LgNm4orDmWLb0D1AVBxrHA,7904
|
|
659
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/parafraseja.py,sha256=
|
|
660
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/parafrases.py,sha256=
|
|
661
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/paws.py,sha256=
|
|
662
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/paws_x.py,sha256=
|
|
663
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/pawsx.py,sha256=
|
|
664
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/persona.py,sha256=
|
|
665
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/phrases.py,sha256=
|
|
652
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/parafraseja.py,sha256=Aw2j-xLLlyGKTJv1v-SWAK0XFZuEmPqVF7sDVXQy0OU,4268
|
|
653
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/parafrases.py,sha256=aPWJeY0t5oEanOrtDx4-KhBGNZmGyUZW0lf9nHL10jQ,4266
|
|
654
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/paws.py,sha256=k6hOYMIAHJ3AlAcCv3LHnwO--2P8KEwfY2bD3EBeJJM,4170
|
|
655
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/paws_x.py,sha256=bA5RBuW_7QlRQ0ocnZKWxUjIr2s3vFgGBBuj0OoJq2Y,5911
|
|
656
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/pawsx.py,sha256=UB1mAqWRmSsjG3qQ8taVztSDWeOTUOTHW4QSJfMaBKc,4016
|
|
657
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/persona.py,sha256=TWPFa2XT1AQm3bZBGfQybN1_rnUAmKoxZnuSZY_H7PA,10957
|
|
658
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/phrases.py,sha256=36-y7OkqgCDaRNZoI1eDI47gMGdYQvIVn-PR9ztaJL0,6032
|
|
666
659
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/phrases_ca_va.py,sha256=F3p14GK8kpSsknnl88JYFY0ezuZmgWit8iel7QBtIc0,2986
|
|
667
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/pile.py,sha256=
|
|
660
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/pile.py,sha256=I8ckihfe3j1GS6N6L8sL_Yc5eyL1ZiKay7invbCcM4U,6334
|
|
668
661
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/pile_10k.py,sha256=K5diNndk9obpncxS2h2pJ3WeFpceZTlCO7d1QXeKCYA,4845
|
|
669
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/piqa.py,sha256=
|
|
662
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/piqa.py,sha256=oJiOSW9B6mcwB4vBbuULMHBrgG5FPa1Rz4ZSZ0KWyMg,3838
|
|
670
663
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/polemo2.py,sha256=8WYXV84sPbNLxwfnPLSVTDKY_suFlJPLp9ffbs9wnZ8,5179
|
|
671
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/
|
|
672
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/portuguese_bench.py,sha256=Jg3foz6stbTDqr9Fi2B1YUd2ktH_PRvfi3-VfCazs98,6105
|
|
664
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/portuguese_bench.py,sha256=A9x_WfzoVetzN7lctFF3sHAne0CgxcaouggZvk-Ug2c,6007
|
|
673
665
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/portuguese_bench_gen.py,sha256=hGLtogrXR_yib9riVQZAkqpwCsMbhb7F8K-AR0uKFgU,4191
|
|
674
666
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/portuguese_bench_mc.py,sha256=u02jIQXUOuwbjfCrDtd1rIEvPq4e9CPvvsa7De8DSYk,4133
|
|
675
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/prompt.py,sha256=
|
|
676
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/prost.py,sha256
|
|
677
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/pubmedqa.py,sha256=
|
|
678
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/qa4mre.py,sha256=
|
|
679
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/qasper.py,sha256=
|
|
680
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/qasper_bool.py,sha256=
|
|
681
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/qnli.py,sha256=
|
|
682
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/qnlieu.py,sha256=
|
|
683
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/qqp.py,sha256=
|
|
667
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/prompt.py,sha256=0u24XuKiwfGonvzaZe30-TBZixmDI2gDJAPcUyuLvrk,4178
|
|
668
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/prost.py,sha256=FckuTbXhBhxwJ1MZfL7I6CiIfLnIExyhz1xbXDBYbnc,4006
|
|
669
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/pubmedqa.py,sha256=eJWfNKxW-yjPQ1GvN3waO5WjKUQoOal-vEX9RHrRETA,3923
|
|
670
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/qa4mre.py,sha256=EiuU5mCn_HFLbYG-qbMt43h6jrJz-xmAHLl5Lgtpzvc,4100
|
|
671
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/qasper.py,sha256=lvKfMu49ZSuLgSfmoURMIL9itWxK0n8mRrK7gtPEWIo,3922
|
|
672
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/qasper_bool.py,sha256=ZeDBo-byUQuHDV0WYgPZ9I641rBp7xZgN2GjmA3jzNA,3800
|
|
673
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/qnli.py,sha256=Bgl3kpP6kWQGFDvB-pZl0uESF0c3N1i6ufHdpYXx1PI,3749
|
|
674
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/qnlieu.py,sha256=JX9aJXGzZ0p2Uv1VSnbU5krHoNBNLt0aGuOE_dZdb4g,4178
|
|
675
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/qqp.py,sha256=lk2tFRew4E4f2O-DxnfUKOib8BiMnDXqEQy_pu1rxqM,3748
|
|
684
676
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/quac.py,sha256=M7HVhIic8RB3LvV0LCsDdMqEZCPBK7sWb_fkH-Y8HGY,3797
|
|
685
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/race.py,sha256=
|
|
686
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/random.py,sha256=
|
|
677
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/race.py,sha256=QlFL2jsBV7XwoVo4FiuqUqBYE-6TYboCSQT1xschwqA,4087
|
|
678
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/random.py,sha256=mFaACpCJMJhNCa2zj7WZWYRkgPxQAvQ8apaJBFJEnlU,4178
|
|
687
679
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/realtoxicityprompts.py,sha256=1r13H8HW4N4J9eSDmFCAmdoKGhShjxjZ1PCJzhSLTcg,4575
|
|
688
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/record.py,sha256=
|
|
689
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/reversed.py,sha256=
|
|
690
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/rte.py,sha256=
|
|
691
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/ruler.py,sha256=
|
|
692
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/sciq.py,sha256=
|
|
693
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/score.py,sha256=
|
|
694
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/scrolls.py,sha256=
|
|
695
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/scrolls_mc.py,sha256=
|
|
696
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/self.py,sha256=
|
|
697
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/sglue.py,sha256=
|
|
698
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/sglue_rte.py,sha256=
|
|
680
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/record.py,sha256=IElbX-S3xDVEjnDOtMAgq4-PtO7tUbXnLfrotzMehUo,4207
|
|
681
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/reversed.py,sha256=uy40cjl6s-E89Jg40GmdK1Rw1NEg2X0_9LHTTG5_ROM,4255
|
|
682
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/rte.py,sha256=sj4eviWxZo5Cqyo4CG21-DBa3ZeKR8RnE-mihLlv1bg,3733
|
|
683
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/ruler.py,sha256=t0UTzPFmnLYt82X1TeWzDdngDJV5HVWNu-TFbEdXg14,6731
|
|
684
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/sciq.py,sha256=brMvk3IkbUbqnVzoToqjIjcLWye8ipEG7JuFufTYtJI,3853
|
|
685
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/score.py,sha256=D34PY7yyMzyYZrDnTHRfsWSzb_lm9zeSaSqvPSzXN_o,6689
|
|
686
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/scrolls.py,sha256=4HgI2jViwUAIhIXs44kEP7mD6-C0Ju7BIS7YNfXB2QU,6033
|
|
687
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/scrolls_mc.py,sha256=lMNuCvmRq5MZa9Xd_EfsVite0qDhoN6nD3RfYpPRBTs,5944
|
|
688
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/self.py,sha256=NrPDLq_VjFL-ipnKts2MQGr4JDnhf8gk5it768xTPlQ,4245
|
|
689
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/sglue.py,sha256=FVFIMSMHZyVD1PFIxRq1PpHIgGj1BQQIjN2QK_MkvNQ,5270
|
|
690
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/sglue_rte.py,sha256=eHTrAnSwEeBTvb66XJQYYAxgIoyjRzwr39WY3a1NPx8,4191
|
|
699
691
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/simple_cooccurrence_bias.py,sha256=pipWwa2PNQVTfJeqU1xi_lPbv1XVUdgedKXsku2Lrpo,4490
|
|
700
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/siqa.py,sha256=
|
|
701
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/social_iqa.py,sha256=
|
|
702
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/spanish_bench.py,sha256=
|
|
692
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/siqa.py,sha256=2GqKb6ccsjWn5wzPrSmH9xmIfurxX3veocy2vmEGxFo,8028
|
|
693
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/social_iqa.py,sha256=O3GSl56G6wUZ1iYRQETcY0gvfQ5l2ifReAVLvtyduG8,4001
|
|
694
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/spanish_bench.py,sha256=MaaLf_FbtiF0DxjTDyY_LsihaSMx77paPAZ91eLwCKc,5977
|
|
703
695
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/spanish_bench_gen.py,sha256=N878fSFoeO3334gnht8zg5Gfb_sy1lbsZcsj0D5ENck,3919
|
|
704
696
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/spanish_bench_mc.py,sha256=izYHAzjLmdFVfmUMB21ZZZhiUtDIMUdyKo9yNfPm404,4128
|
|
705
697
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/squad2.py,sha256=vMQezYU6gN0aD5oiLItMCjRAxxXa1_GBYc6VBCSeJMs,4602
|
|
706
698
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/squad_completion.py,sha256=qrkVhWAw-gKGfwNCqglqFP1TCU1_LPJQmIr6qd2i2iQ,4410
|
|
707
699
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/sst2.py,sha256=eqpA1VNI08nMdxF4ltNq333RJLICvENxSS7svQY57Z4,3851
|
|
708
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/storycloze.py,sha256=
|
|
709
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/summarization.py,sha256=
|
|
710
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/super.py,sha256=
|
|
711
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/super_glue.py,sha256=
|
|
700
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/storycloze.py,sha256=jphtZcg9VIYZ3krgknrNtPQIPwEM5nV0bdEag0tTJyY,9406
|
|
701
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/summarization.py,sha256=TWOeNTmE1lfa2ks3Ook9uphU3Z6jBFa82vS0kTyiBnc,4206
|
|
702
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/super.py,sha256=rRp5VEcz7_ltUWTJOUwL_gPiNZzX-OH-qYP0r8ZUviM,4174
|
|
703
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/super_glue.py,sha256=hdKqmtrqaCiSfLqCTIPp9xiRc65HTDJVLKK4rpHVdr8,5951
|
|
712
704
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/superglue.py,sha256=NosWWhOPRF45WkNCgJFJXI4x132tFwRX102DcdrXf0E,3827
|
|
713
705
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/supergpqa.py,sha256=4hIJpmgdVxZf2xsFOkbvgIkfyFAXF0vbnwlCNyoYNJU,3827
|
|
714
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/swag.py,sha256=
|
|
715
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/swde.py,sha256=
|
|
716
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/sycophancy.py,sha256=
|
|
717
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/t0.py,sha256=
|
|
718
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/teca.py,sha256=
|
|
719
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tinyarc.py,sha256=
|
|
720
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tinybenchmarks.py,sha256=
|
|
721
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tinygsm8k.py,sha256=
|
|
722
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tinyhellaswag.py,sha256=
|
|
723
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tinymmlu.py,sha256=
|
|
724
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tinytruthfulqa.py,sha256=
|
|
725
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tinywinogrande.py,sha256=
|
|
726
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tmmluplus.py,sha256=
|
|
706
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/swag.py,sha256=0ZB8PvzKVhZiZaq_HS133xj3-5MqucudKZQysq6IVLo,3892
|
|
707
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/swde.py,sha256=0m0WMPiUMzjDfc1wuLFtpBzDU4l3twvPLl8lg3R1dH4,6880
|
|
708
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/sycophancy.py,sha256=ldHakmbs_ChOCzgfAF1EtOngoy9edmXDdpmhuZlkUFY,4277
|
|
709
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/t0.py,sha256=2DKa1BmS6iZLLcN3Z-IoJsYYXiJlrEnAR-5Q6HN5h9Q,4223
|
|
710
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/teca.py,sha256=VDg_po-TKD8gwF8naWmOea6ec8_OO72f0BhRtSebYKc,4233
|
|
711
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tinyarc.py,sha256=W0usZ9riBei7km4WV8_eXTnfL2IamGls8ZegisqBlmk,4248
|
|
712
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tinybenchmarks.py,sha256=8CK5WIiWLQte7KW-afuRKrcK-MIZggf1Z00BJsmt8dY,5994
|
|
713
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tinygsm8k.py,sha256=GLP3EObZ_9j_-Sf62ucgwHNkmsRHDG9ycR3CP5_mMlQ,4253
|
|
714
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tinyhellaswag.py,sha256=3dGc6qhDISKjNACTU1bXVJToQHlsh756AD_kwtVGxlg,4278
|
|
715
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tinymmlu.py,sha256=4JyBUFl3O8Gdlh6Wija9JV2lUwEhcEQr_62rJWtCAK8,4253
|
|
716
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tinytruthfulqa.py,sha256=El-fPGj0szWZlRK0V9SjCySm9llvQQObVXzg0Ri_-gU,4315
|
|
717
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tinywinogrande.py,sha256=3_-EFzulS2GxI2E4RbmGd6MYHdhQoy16jlLtvlX_lFM,4283
|
|
718
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/tmmluplus.py,sha256=ItfpZdnxKoiONGUHiBZMmMKRK4lS9FoK4s6UVZjWLCo,8108
|
|
727
719
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/toxigen.py,sha256=wyr9CDq4LupITsRR327vGhIfcgjXdtDgcZBPS0EexDc,3270
|
|
728
720
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/translation.py,sha256=rHNpXKyLCl5qUtTw0nMjg0jW4sFOK9SOKkawc0UBH3g,5167
|
|
729
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/triviaqa.py,sha256
|
|
730
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/truthfulqa.py,sha256=
|
|
731
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/truthfulqa_mc1.py,sha256=
|
|
732
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/truthfulqa_mc2.py,sha256=
|
|
721
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/triviaqa.py,sha256=6Hc1IkZXfBtDAN7qrcFtsLcssnPnKdCXZRa6c1HHHWM,4360
|
|
722
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/truthfulqa.py,sha256=nO4LRVeTJXKkjXvDRZJ3WK4onJSYRNKx-kmYqXSIdvo,4382
|
|
723
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/truthfulqa_mc1.py,sha256=70Tuawb5FTrhWOKeAezoWthVf81A5FrATeiIX-_AhGM,4004
|
|
724
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/truthfulqa_mc2.py,sha256=PW686J9_AAdPyLBlsYeMQ6XROczPb1IcEjeTP_f6g6Q,4998
|
|
733
725
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/truthfulqa_multi.py,sha256=oCWC6hY3RI9Nj04Rij71fDZCT-L17kXirkGE9fyob-I,4945
|
|
734
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/turblimp_core.py,sha256=
|
|
735
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/turkishmmlu.py,sha256=
|
|
726
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/turblimp_core.py,sha256=Cg3edq6WfVd6444Ap6YUEmKNiU4mnaqFv_HzZ3g4QEQ,5910
|
|
727
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/turkishmmlu.py,sha256=WN8weWS1TNyNy3qw9coM_vknHYSsCnb40yVEq1CvjOI,6240
|
|
736
728
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/turkishmmlu_cot.py,sha256=nD7B0tA1rMd80eazkrnGjXS1VemkEp-pvqMweyGMphg,3871
|
|
737
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/turkishmmlu_mc.py,sha256=
|
|
729
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/turkishmmlu_mc.py,sha256=sSMEhTucmkxhtrqSD85suP4ZjIOJ14nk9uTNDvmux0k,3702
|
|
738
730
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/twenty_newsgroups.py,sha256=_mAy170d7m1SlPtbNNkToyr5zFasvyEUlWgJyuNZK38,4563
|
|
739
731
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/unitxt.py,sha256=OhhhQJfwBTSjWipi3nPIelpjrSpvI3vCZ1FmYPH5WGc,4592
|
|
740
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/unscramble.py,sha256=
|
|
741
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/vaxx.py,sha256=
|
|
742
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/webqs.py,sha256=
|
|
743
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/wic.py,sha256=
|
|
732
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/unscramble.py,sha256=3LyrHvUVZwlas6vVriIh28vJUYVKzM32_UnlBRst7G4,5950
|
|
733
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/vaxx.py,sha256=TfckjIy-_sV9_tLjPxmgpdPa0kO3esG0h7Yf_o7ms88,3527
|
|
734
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/webqs.py,sha256=GHzoWid4Epw7-lL4oygxfoT_oaBK_kiNAoX86MGzKVw,4384
|
|
735
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/wic.py,sha256=HEE7qyKyEMoJlXUKD88iWpqrsCA6bnVsbSxiwkgDXtw,4041
|
|
744
736
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/wikitext.py,sha256=r2izxF9w-LsQg3erIk3v8vGQttc7nxpqi0KHkYe_cPc,5000
|
|
745
737
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/winogender.py,sha256=1CoZe0Btrt06gu6TCfcPnobbewPgY2EOdijKISq0bgE,4766
|
|
746
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/winogrande.py,sha256=
|
|
747
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/wmdp.py,sha256=
|
|
738
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/winogrande.py,sha256=deTEUw0oT86cl_8xq6rqEbPKGjZnOazDTcYZAlE4QDw,4062
|
|
739
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/wmdp.py,sha256=OWnnlt6Ng5RayIxvUsB0HstVFti_-pROBxzaMNfnQkI,5932
|
|
748
740
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/wmt14.py,sha256=_zHPAk_V9VyigtVcpTLpbLgFoNrHeASloddh9lQLUGU,4043
|
|
749
741
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/wmt16.py,sha256=pX8F91Um3kUbsKgxJZDdRBfFzlmCr5WUx-OFBYGF5CM,4446
|
|
750
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/wnli.py,sha256=
|
|
751
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/wsc.py,sha256=
|
|
752
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/wsc273.py,sha256=
|
|
753
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/xcopa.py,sha256
|
|
754
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/xlsum.py,sha256=
|
|
755
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/xnli.py,sha256=
|
|
756
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/xquad.py,sha256=
|
|
757
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/xstorycloze.py,sha256=
|
|
758
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/xwinograd.py,sha256=
|
|
742
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/wnli.py,sha256=ZjvaIwrqGk1CiP9Q7j0-9LabEnov47vpR53tcbGhslg,3803
|
|
743
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/wsc.py,sha256=aY_bzRuWwDu2sUb_YTXafZvO8c1_9E5E5m4aP9dCuLg,3932
|
|
744
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/wsc273.py,sha256=yhslwubim0colqpT6t84EOrp844RfDeRrXFKDT-kuqw,6976
|
|
745
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/xcopa.py,sha256=-xGIiysi_c_mht3MEZwX3dPabfi7kYnTXNM7x9afrPw,7365
|
|
746
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/xlsum.py,sha256=fViGmOE9bi0o5T6K5yXwdHfqZ7B-FWhuecFdpuNVCps,5273
|
|
747
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/xnli.py,sha256=4q2n2eWy00QAU238ruA057f8pfwOYp4dTfUKcZmAEcQ,4127
|
|
748
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/xquad.py,sha256=VI448Ro_eDF-rzPdmQlCuoCkQIFWs-Hoe6d_sC30NOw,7637
|
|
749
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/xstorycloze.py,sha256=gr39S_zUyO0llrS_y43j-S8CqgIj86saTBpsZwIyiiU,4416
|
|
750
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/xwinograd.py,sha256=2lsXdPSVTzcuhGWK8Gx8bXmRh0xTqWcoLRKA3KrDBW4,4054
|
|
759
751
|
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/yahoo.py,sha256=oI2VKhoGTIVPrJGv4L7-o2H-8CauckVDql1wRMs_WWw,3949
|
|
760
|
-
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/zhoblimp.py,sha256=
|
|
752
|
+
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/zhoblimp.py,sha256=U13gF5-nYth4L9gIIlbpLlbvA10dXYbUwjPKcaUXUO4,5934
|
|
761
753
|
wisent/core/data_loaders/__init__.py,sha256=VAcOq6wRL3oihqeJz6Pk23u1enwEkM8w2lShv0V8Sik,8667
|
|
762
754
|
wisent/core/data_loaders/rotator.py,sha256=hlahoJz_cvl7pxsFwVDcF1fc9Uj690rb7aWpqdfq9HU,3794
|
|
763
755
|
wisent/core/data_loaders/core/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
@@ -765,7 +757,7 @@ wisent/core/data_loaders/core/atoms.py,sha256=26vJ1B35_8EoQrFOEdNvXHcJRGxSfqsYpF
|
|
|
765
757
|
wisent/core/data_loaders/loaders/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
766
758
|
wisent/core/data_loaders/loaders/custom.py,sha256=Xe1sOHH3_dRjBnQg9vwMM-XA8ROn65dUr9TeT-nuNtQ,4144
|
|
767
759
|
wisent/core/data_loaders/loaders/huggingface_loader.py,sha256=AvMG2DpEAOMfzz339WlDJ3qeqLjvcqY7P4P7lVnjKTE,5147
|
|
768
|
-
wisent/core/data_loaders/loaders/lm_loader.py,sha256=
|
|
760
|
+
wisent/core/data_loaders/loaders/lm_loader.py,sha256=_uPsvYXGApETcvn9hooT3rDdgrvE8gfXw3bDyewKL4Y,63150
|
|
769
761
|
wisent/core/data_loaders/loaders/lm_loader_special_cases.py,sha256=-Ku7dOZIBgJjbNAbP5ihXvRn5KCStzSmk8_nLsshmzs,18885
|
|
770
762
|
wisent/core/data_loaders/loaders/task_interface_loader.py,sha256=QGDfqMvdTFfogF9P533b-Gw52uHe0GnsS64AfnVVlek,11771
|
|
771
763
|
wisent/core/errors/__init__.py,sha256=DX-T4zW2PwNvTcyXyt1T_-oZ_xXl4WhzqaOZKiDaWFo,5535
|
|
@@ -777,7 +769,8 @@ wisent/core/evaluators/steering_evaluators.py,sha256=3b2voLO9BzRzNmEjhiw2GzOuHLy
|
|
|
777
769
|
wisent/core/evaluators/synthetic_evaluator.py,sha256=odKzYAHp1pIIvZtvRpodfVbnCK_E_LEMg7Z4TJG2O9I,14284
|
|
778
770
|
wisent/core/evaluators/benchmark_specific/__init__.py,sha256=hTcHcv3GEQQWZ7Z_puSUbI8LlQuzljr_-GtMA19wiro,1432
|
|
779
771
|
wisent/core/evaluators/benchmark_specific/aime_evaluator.py,sha256=3VD6C0MsEyIO7i744QmSoZk5uuqE_OnhvkhG8hweKzk,3062
|
|
780
|
-
wisent/core/evaluators/benchmark_specific/
|
|
772
|
+
wisent/core/evaluators/benchmark_specific/apps_evaluator.py,sha256=_BoQjf6IouWWWMoiKk83-woZA7a73dBZC_qKKYEs9v0,4322
|
|
773
|
+
wisent/core/evaluators/benchmark_specific/conala_evaluator.py,sha256=z2tlm9mnMbglnnfEn2h_d9X1Z9D0KWSjFBKAB7oh0AY,6475
|
|
781
774
|
wisent/core/evaluators/benchmark_specific/exact_match_evaluator.py,sha256=rc-QfiAYOzAkd5MAfghj7kQ6pEEYFtr4630pt-HRXmE,2756
|
|
782
775
|
wisent/core/evaluators/benchmark_specific/f1_evaluator.py,sha256=6_9_U3mUKBSBpOFq7HGXnN3xrmGOSV-H2agTE_s1I_g,6608
|
|
783
776
|
wisent/core/evaluators/benchmark_specific/generation_evaluator.py,sha256=6XNmp774qI9PqzybqQEwKgI_gn3ui3mIZc71GT5JXcY,20052
|
|
@@ -789,7 +782,7 @@ wisent/core/evaluators/benchmark_specific/polymath_evaluator.py,sha256=bZfGRp_ad
|
|
|
789
782
|
wisent/core/evaluators/benchmark_specific/coding/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
790
783
|
wisent/core/evaluators/benchmark_specific/coding/solution_generator.py,sha256=PX3RdwhrrYG_2nx10GVvQjdq-_6AFP-Q-yEGFA9rYpc,9329
|
|
791
784
|
wisent/core/evaluators/benchmark_specific/coding/metrics/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
792
|
-
wisent/core/evaluators/benchmark_specific/coding/metrics/evaluator.py,sha256=
|
|
785
|
+
wisent/core/evaluators/benchmark_specific/coding/metrics/evaluator.py,sha256=KHlWIMkQcuKnES8H3qEo9IHMPAlsbhnF5yGCde-mUHQ,15313
|
|
793
786
|
wisent/core/evaluators/benchmark_specific/coding/metrics/passk.py,sha256=WCkdt9a1KG2qoHNQtXdKPupVNQtppPyUGeq5yF6ZO7M,2059
|
|
794
787
|
wisent/core/evaluators/benchmark_specific/coding/metrics/core/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
795
788
|
wisent/core/evaluators/benchmark_specific/coding/metrics/core/atoms.py,sha256=I4wwOUTDjJ_4Jo6Bbpl8Tkv0Uz9zpwNjzeWBrXru-9g,1001
|
|
@@ -825,43 +818,44 @@ wisent/core/evaluators/custom/examples/__init__.py,sha256=Jho4mJgB6eGc5CaRjtcyrO
|
|
|
825
818
|
wisent/core/evaluators/custom/examples/desklib_detector.py,sha256=1ysygPE-TpO7sKqOEZtOvdGMv5nLp6n57MawU7mH3Ic,5566
|
|
826
819
|
wisent/core/evaluators/custom/examples/gptzero.py,sha256=El4Sypuee0a6QMv7HrPhfqfTeJbaEXQRLjuV_clPlgg,6129
|
|
827
820
|
wisent/core/evaluators/custom/examples/humanization.py,sha256=bNTDLNqckkCgq_T7elG5EdqBsidWzRh-ncbCKNibvMo,2677
|
|
828
|
-
wisent/core/evaluators/custom/examples/humanization_coherent.py,sha256=
|
|
821
|
+
wisent/core/evaluators/custom/examples/humanization_coherent.py,sha256=4jad6VsPs9QSyDH0PKwhyjsxTvIM6a0tfZsOseeF46I,6628
|
|
829
822
|
wisent/core/evaluators/custom/examples/roberta_detector.py,sha256=mq9MHdm6sosuzV8qRt-rj6gaYFaWsodgfBt1ZpCqwFM,6107
|
|
830
823
|
wisent/core/evaluators/oracles/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
831
824
|
wisent/core/evaluators/oracles/interactive.py,sha256=f3v2_N17fKzGyeOxONRJbrbn8i5uMeZmRvMmF0ShNf0,2638
|
|
832
825
|
wisent/core/evaluators/oracles/nlp_evaluator.py,sha256=KxbnF-I2IFbBQpoYyjQKGbYh4NErsEuhTCRYX_Tob8o,18220
|
|
833
|
-
wisent/core/evaluators/oracles/truthfulqa_gen_evaluator.py,sha256=
|
|
826
|
+
wisent/core/evaluators/oracles/truthfulqa_gen_evaluator.py,sha256=fUejtchm8bWFQitW-xIPkvo2BYvpyjGVFU-FR_s60EE,5954
|
|
834
827
|
wisent/core/evaluators/oracles/user_specified.py,sha256=V1dKrNj3Oq7UC_I7DT0WGnktP7R_DSW6UAwDdrA8SnE,2360
|
|
835
828
|
wisent/core/evaluators/personalization/__init__.py,sha256=t3lWkNFXA27eDzEQIZnkpasjGJ0w6UaZee4dJEQpFEQ,311
|
|
836
829
|
wisent/core/evaluators/personalization/alignment.py,sha256=UcF5ismNElPbWkJNb-EuUKZraYE5aI46SAXoniQxQwE,5449
|
|
837
|
-
wisent/core/evaluators/personalization/coherence.py,sha256=
|
|
830
|
+
wisent/core/evaluators/personalization/coherence.py,sha256=f_0VHXm2GbS68JnQkYXS7tuR1sH6vsuLqSvjRB6M9kM,13641
|
|
838
831
|
wisent/core/evaluators/personalization/difference.py,sha256=8D9azBdqciYo4IJt2lwrFGrwpm7q3Kyze6K_yBYPHoo,2649
|
|
839
832
|
wisent/core/modalities/__init__.py,sha256=jtowcmTMQ_kOYai7FKwXY0vqSYQ8vews84VSMH73XFM,20138
|
|
840
833
|
wisent/core/models/__init__.py,sha256=G9JfaVU_CXCG_wnz5D5gjDJ-_G7zqHFmjaixDpbCixM,456
|
|
841
834
|
wisent/core/models/inference_config.py,sha256=0n8647avNb4w0o0UsbWnU_eh6cMU23ppdJ-FDYx8mAY,3704
|
|
842
|
-
wisent/core/models/wisent_model.py,sha256=
|
|
835
|
+
wisent/core/models/wisent_model.py,sha256=sweOiwBMsPaA1AZ3zGPn6ao-oI2kbbtTs-T5DMkWDd8,36566
|
|
843
836
|
wisent/core/models/core/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
844
|
-
wisent/core/models/core/atoms.py,sha256=
|
|
837
|
+
wisent/core/models/core/atoms.py,sha256=XsasyE6Ki7jIwmsn5n1r9sOHPhOpKGdMfvD_MRSDSx4,16170
|
|
845
838
|
wisent/core/opti/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
846
839
|
wisent/core/opti/core/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
847
840
|
wisent/core/opti/core/atoms.py,sha256=7D6TxhEcBKxCplajICCfpZQ0g2rsKB6iWoRB0Mwr7yg,5438
|
|
848
841
|
wisent/core/opti/methods/__init__.py,sha256=AJmvQZqWRAJ_EYzrF28uA1mN37C-AtVnUgCKfXaD0qQ,365
|
|
849
842
|
wisent/core/opti/methods/opti_classificator.py,sha256=qVnpA57ncSsPLOby-rXvEOI_c_cRp06pJSsOLtO-tuw,6864
|
|
850
843
|
wisent/core/opti/methods/opti_steering.py,sha256=Lr8dYKpqgGvuJauvYl7FNUMtR1cUAl93aepiqPIeslw,5407
|
|
851
|
-
wisent/core/opti/methods/opti_weights.py,sha256=
|
|
844
|
+
wisent/core/opti/methods/opti_weights.py,sha256=0dUN0lqMsRfB0Fcv851Kv-alseuS9N0Z4O1B12Y-qyU,21104
|
|
852
845
|
wisent/core/optuna/__init__.py,sha256=efbr9QeNaeWMle9pppWBJXs5ObiPti9QZBQGBvuli-s,2250
|
|
853
846
|
wisent/core/optuna/classifier/__init__.py,sha256=vv2wCAbw8ccZxq3vxrQt9plUdbr7VJj-t2rRnh6jBR8,819
|
|
854
|
-
wisent/core/optuna/classifier/activation_generator.py,sha256=
|
|
847
|
+
wisent/core/optuna/classifier/activation_generator.py,sha256=9zV4qEGVovBP_3HYQq0UXArZ_xPSIdjHEiGHzBveikY,14432
|
|
855
848
|
wisent/core/optuna/classifier/classifier_cache.py,sha256=Q8PNBJ2rpHWvAQRVPR_ax0zvnrbRKN0yUjOhCwXf9jw,17439
|
|
856
|
-
wisent/core/optuna/classifier/optuna_classifier_optimizer.py,sha256=
|
|
849
|
+
wisent/core/optuna/classifier/optuna_classifier_optimizer.py,sha256=VmqEGNjM-omYEQmsneQs7uhZGsdOPfExSCTd4XLogH4,25511
|
|
857
850
|
wisent/core/optuna/steering/__init__.py,sha256=C1O9Y2AMFsFvLq6fmTW_wJ5vnRXKVGftykRw3NaiHwM,508
|
|
858
851
|
wisent/core/optuna/steering/bigcode_evaluator_wrapper.py,sha256=ZVp159jbcdUAf8A2q5AwINak0n6YqBUuq0iDLvXObyQ,7157
|
|
859
852
|
wisent/core/optuna/steering/data_utils.py,sha256=PUQ8Gqu8oPfoGGFi_lTfaPXhTZ5MRQO2Gf73vRa7NDU,12431
|
|
860
853
|
wisent/core/optuna/steering/metrics.py,sha256=6UbW9AMrRpT1pgvDVK9rb1-ieqqOq1I1KdVh6MtB4CI,16394
|
|
861
|
-
wisent/core/optuna/steering/steering_optimization.py,sha256=
|
|
854
|
+
wisent/core/optuna/steering/steering_optimization.py,sha256=V5iu5uttoT1Uq6Lj5jiUfnJ9-vIXVyAVD6UzXHdvXWA,45016
|
|
862
855
|
wisent/core/parser_arguments/__init__.py,sha256=MpBsnsPcZQ8cqAn1tN4OYfb3oMQraNW-23g3Z5gSqeg,299
|
|
863
856
|
wisent/core/parser_arguments/agent_parser.py,sha256=PG3V-F9xKE53guiiQ2GudGKZnjvtoAbdyMI8Qhm_sZw,4971
|
|
864
|
-
wisent/core/parser_arguments/check_linearity_parser.py,sha256=
|
|
857
|
+
wisent/core/parser_arguments/check_linearity_parser.py,sha256=82a6WJCUdPyM95rb4NrtUMhd-XQ2lNYq3NByxm4k4Yw,2392
|
|
858
|
+
wisent/core/parser_arguments/cluster_benchmarks_parser.py,sha256=QvEjOIRZswffCNMcEsIgCt1a7V-CzaHbFVWTaDF2-7U,889
|
|
865
859
|
wisent/core/parser_arguments/configure_model_parser.py,sha256=LmsS0mYF7eP-zpYB7SdEbtFZLVtPtcbkEi9CMkYqMVo,350
|
|
866
860
|
wisent/core/parser_arguments/create_steering_vector_parser.py,sha256=GvyHt0fqwVk5dDmAsilOttsybZ3jj5Z6dQWzE8EUj-Y,1735
|
|
867
861
|
wisent/core/parser_arguments/diagnose_pairs_parser.py,sha256=i_kV0sEYkpWEur0BK32Y3nMMRwjz7bAjUY9BbhqSDws,591
|
|
@@ -873,12 +867,13 @@ wisent/core/parser_arguments/full_optimize_parser.py,sha256=BTd2Wc_qUkrdwvaPeoXk
|
|
|
873
867
|
wisent/core/parser_arguments/generate_pairs_from_task_parser.py,sha256=wEZLIXocqgLduufNMYTNm4YcQwerq53zp5YseCqiCbY,924
|
|
874
868
|
wisent/core/parser_arguments/generate_pairs_parser.py,sha256=nDTQ63bvjl-GcSrMdtcR_Pdh1dzbqtRnGaSCFhPO-4Q,1918
|
|
875
869
|
wisent/core/parser_arguments/generate_responses_parser.py,sha256=LnjIx7gOdysEMGwUIHFHlaEOE306qr4rXto9gzBSjkg,1345
|
|
876
|
-
wisent/core/parser_arguments/generate_vector_from_synthetic_parser.py,sha256=
|
|
877
|
-
wisent/core/parser_arguments/generate_vector_from_task_parser.py,sha256=
|
|
870
|
+
wisent/core/parser_arguments/generate_vector_from_synthetic_parser.py,sha256=MvwLJYm-23pAwAocJqrjWS12RlAMW70ATCEWa2VfJ2w,4225
|
|
871
|
+
wisent/core/parser_arguments/generate_vector_from_task_parser.py,sha256=95jOVRH22aFcngJJYrLvpj-SFAPZaTSlAeh277NuWbg,4889
|
|
878
872
|
wisent/core/parser_arguments/generate_vector_parser.py,sha256=bf2PHAdvNZetXaSe3sKarvK6McIODPdmRSNRQN_rHto,3622
|
|
873
|
+
wisent/core/parser_arguments/geometry_search_parser.py,sha256=-ytDrseoIRJnjMq8pvh6jE9fxn5IXDCVmZB_5wlub8Q,1739
|
|
879
874
|
wisent/core/parser_arguments/get_activations_parser.py,sha256=pCBET7CsFz-8WFE3mb677o4W-vVa09wz-3YDMx-8ukA,2445
|
|
880
875
|
wisent/core/parser_arguments/inference_config_parser.py,sha256=-TAcjy8yTzDKWFc42JCmVtGq1MowQI-IauRNFNj_se0,1853
|
|
881
|
-
wisent/core/parser_arguments/main_parser.py,sha256=
|
|
876
|
+
wisent/core/parser_arguments/main_parser.py,sha256=6RPGpcf5eXqMpSK4adVVU_vJit3pICZMoAzgjpcb29c,12789
|
|
882
877
|
wisent/core/parser_arguments/model_config_parser.py,sha256=RlcSyQkj0uDlmJJE8sMq_CjvJ1VdCcjf8_BqspsSHd0,3210
|
|
883
878
|
wisent/core/parser_arguments/modify_weights_parser.py,sha256=077Gz6GLk1aR2k6rboU4tcVBgxHaTB01sSRx7ZqlzPU,9336
|
|
884
879
|
wisent/core/parser_arguments/monitor_parser.py,sha256=qo3vyyVmdZBkhGuhlHqbEzTiIKcdFIvG3IIuc-DIRQE,1234
|
|
@@ -888,11 +883,11 @@ wisent/core/parser_arguments/optimization_cache_parser.py,sha256=R54XzVY4GUgpXu8
|
|
|
888
883
|
wisent/core/parser_arguments/optimize_classification_parser.py,sha256=tzHAvOPIbXP8risT6eMICpsRfO6RETwP4s8qIAe60ms,4170
|
|
889
884
|
wisent/core/parser_arguments/optimize_parser.py,sha256=HTuhFspCAZkNcYhP69-JmaT91CRm_wV9IaF-BFvg_I8,4603
|
|
890
885
|
wisent/core/parser_arguments/optimize_sample_size_parser.py,sha256=OJEY2y89-9pbA7FnTgDvxoa3SXvogL5yM2QqStbpBCA,2836
|
|
891
|
-
wisent/core/parser_arguments/optimize_steering_parser.py,sha256=
|
|
892
|
-
wisent/core/parser_arguments/optimize_weights_parser.py,sha256=
|
|
886
|
+
wisent/core/parser_arguments/optimize_steering_parser.py,sha256=fRG64w-eb0ezUp9T5-zsMJ8X8L4Z6C9myeg21R8DTuI,28731
|
|
887
|
+
wisent/core/parser_arguments/optimize_weights_parser.py,sha256=7SEOhgBs9GWGLyPzNfZHQztt4o24HHUPgCf7sbW1kVo,13904
|
|
893
888
|
wisent/core/parser_arguments/synthetic_parser.py,sha256=99fGg_k9vQl80COuVZw5LOYLRQ0sDlZ4ozwsx0T--Qs,5135
|
|
894
|
-
wisent/core/parser_arguments/tasks_parser.py,sha256=
|
|
895
|
-
wisent/core/parser_arguments/train_unified_goodness_parser.py,sha256=
|
|
889
|
+
wisent/core/parser_arguments/tasks_parser.py,sha256=MNSijAG6zzinuwy9lIOwJxrL0JavM7MKx443Nwe7uEs,22440
|
|
890
|
+
wisent/core/parser_arguments/train_unified_goodness_parser.py,sha256=DQF46sBOAvYCdzzdQlGvKhKgsyZPiR8sdZuCmonuWV0,4977
|
|
896
891
|
wisent/core/parser_arguments/utils.py,sha256=XTtssIt05HlAyO6kMPZvu4l_UIZSMDaV-gl50NO7qOw,3543
|
|
897
892
|
wisent/core/prompts/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
898
893
|
wisent/core/prompts/core/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
@@ -905,15 +900,16 @@ wisent/core/prompts/prompt_stratiegies/multiple_choice.py,sha256=L4dOtocXte91Mn2
|
|
|
905
900
|
wisent/core/prompts/prompt_stratiegies/role_playing.py,sha256=Bl_4A-OJgepDB33iRLB-fTdCLmy4QvfGKJ7kIq1ApUE,1101
|
|
906
901
|
wisent/core/steering_methods/__init__.py,sha256=ULxu5kHL5jCyrGoPAUiOYtuxU_iTYYY7e0frABdflfk,1364
|
|
907
902
|
wisent/core/steering_methods/preflight.py,sha256=26Pxx7b3TBRSHfnKF2NWhYN2mjTCnbnd3k7advIqjfU,12009
|
|
908
|
-
wisent/core/steering_methods/registry.py,sha256=
|
|
903
|
+
wisent/core/steering_methods/registry.py,sha256=t7gvgCa294HhY__Nb_swt1TvfEWNRXqh578LJxNuWWc,24066
|
|
909
904
|
wisent/core/steering_methods/rotator.py,sha256=Lt_IW2I1u9h79KLyiTtLIocGhdW0DxcQylMyqC8gClo,4053
|
|
910
905
|
wisent/core/steering_methods/core/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
911
|
-
wisent/core/steering_methods/core/atoms.py,sha256=
|
|
906
|
+
wisent/core/steering_methods/core/atoms.py,sha256=kDN-lvaQnMi9UTCdz-4rZ8x5baqrsVGVYGO-P2EpVUY,5377
|
|
912
907
|
wisent/core/steering_methods/methods/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
913
|
-
wisent/core/steering_methods/methods/caa.py,sha256=
|
|
914
|
-
wisent/core/steering_methods/methods/
|
|
915
|
-
wisent/core/steering_methods/methods/
|
|
916
|
-
wisent/core/steering_methods/methods/
|
|
908
|
+
wisent/core/steering_methods/methods/caa.py,sha256=EsodLtBV66YR7ROngU7-9fJFhzWcmzo7HFjZCNE28Ko,1717
|
|
909
|
+
wisent/core/steering_methods/methods/hyperplane.py,sha256=NeLbFoxlDrnJ_8PTQ6J3BGXtNSTRbaLpwXtpifNgCP8,2976
|
|
910
|
+
wisent/core/steering_methods/methods/prism.py,sha256=Cb18ip7tl57hz7KW6br4EsLWxYP5__bMYppsyBEPzIY,23995
|
|
911
|
+
wisent/core/steering_methods/methods/pulse.py,sha256=aowQtMONcBkNaO99gT7qVClifKyyEdWPQqKMv-PwjSE,25801
|
|
912
|
+
wisent/core/steering_methods/methods/titan.py,sha256=OVj02CrOlO_YVKxiOK6kBZUiViLZL3ot2709J91tFf8,41521
|
|
917
913
|
wisent/core/synthetic/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
918
914
|
wisent/core/synthetic/cleaners/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
919
915
|
wisent/core/synthetic/cleaners/deduper_cleaner.py,sha256=XI19V8IpX5lGWasW43Qa2peEEcxsrAfmB_W9uKzw11U,1571
|
|
@@ -931,7 +927,7 @@ wisent/core/synthetic/db_instructions/mini_dp.py,sha256=XElWJGkIG9DR5q4wcY11kJDJ
|
|
|
931
927
|
wisent/core/synthetic/db_instructions/core/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
932
928
|
wisent/core/synthetic/db_instructions/core/atoms.py,sha256=jBazuD37hyBMIsbFNDjpwlGnxECAOuh4YT0fmpH8C6o,748
|
|
933
929
|
wisent/core/synthetic/generators/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
934
|
-
wisent/core/synthetic/generators/nonsense_generator.py,sha256=
|
|
930
|
+
wisent/core/synthetic/generators/nonsense_generator.py,sha256=JqgJKUU6prgT62R5OzNy-8DIAlgkWE9jRp5uExrqnTo,6156
|
|
935
931
|
wisent/core/synthetic/generators/pairs_generator.py,sha256=VgxeXwTe_Ctvms8b5oBZL-H5l2ck9rExfQf0FHxeIVE,12927
|
|
936
932
|
wisent/core/synthetic/generators/core/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
937
933
|
wisent/core/synthetic/generators/core/atoms.py,sha256=9wL0v38BCqn3y9LtoRkQsK_X3egjdYcPmFXH0mgFSWg,2290
|
|
@@ -955,22 +951,39 @@ wisent/core/tracking/__init__.py,sha256=rda2gaV_tFP6CChzx8TBQUrh_PObqvX35-BHJCxi
|
|
|
955
951
|
wisent/core/tracking/latency.py,sha256=uKibYRodOurQoCh5MqfJwo_k5Ho4H5dFQ0p_nddHGOg,21909
|
|
956
952
|
wisent/core/tracking/memory.py,sha256=Fwg92c_M997uToNLIZvFlHbp3F5TTrUZsA_X25J-QfM,13201
|
|
957
953
|
wisent/core/trainers/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
958
|
-
wisent/core/trainers/steering_trainer.py,sha256=
|
|
954
|
+
wisent/core/trainers/steering_trainer.py,sha256=hTtEP--odC_SfXaVQ8O0i66f6isDKyN5koeaZ5WMxUU,15091
|
|
959
955
|
wisent/core/trainers/core/__init__.py,sha256=zkv6f6Auk4dbJ5PTQP96gP2TUM55W3tc1flHLWBvI4M,1246
|
|
960
956
|
wisent/core/trainers/core/atoms.py,sha256=ycWk0G-7EIAEOnQL-o5_V5B8KTQ7CQUilGF4ibjighM,1536
|
|
961
957
|
wisent/core/utils/__init__.py,sha256=ee4tMv5W_qxtTwRS-n8ZCl69CgBUqPGjugrkomOhzhE,1419
|
|
962
958
|
wisent/core/utils/base_rotator.py,sha256=5seiluDYXeOARs7Z5RIHlfW__9nUbxir6KGCs0wUHwI,10018
|
|
963
959
|
wisent/core/utils/dataset_splits.py,sha256=1G8TTiNFbjLcf17LjVh9xxlAqC1oyCMnOTQckHxPN6E,5937
|
|
964
|
-
wisent/core/utils/device.py,sha256=
|
|
960
|
+
wisent/core/utils/device.py,sha256=Ohe-WbVUDHJpOBn8NtxkFJ2lDgklokDk3Oi_HlNuZf8,9283
|
|
961
|
+
wisent/core/utils/layer_combinations.py,sha256=3zyQqxiSJM8vpJOkU5Y2AXewUjESwmeLeYU3v6IA4l0,2462
|
|
965
962
|
wisent/core/weight_modification/__init__.py,sha256=UrQh_lVfQIAddYQDOkmVWY3BP4X6uuvltHY6KHPDu0g,4329
|
|
966
963
|
wisent/core/weight_modification/additive.py,sha256=USpIfiz2K486qisbs8nubhyfaGgMGzT4CJnGjAB17sU,11375
|
|
967
964
|
wisent/core/weight_modification/directional.py,sha256=GLcbn7IRQp2uqgl1t5uRA0IE9QukfyiZGNxt-YVdK4s,49253
|
|
968
965
|
wisent/core/weight_modification/export.py,sha256=zikHU9dGDswa61ZPd_xo61kAdNt46O1VOQm3HOSYfNY,10266
|
|
969
966
|
wisent/core/weight_modification/multi_direction.py,sha256=tpnEG54GHIzWmytt3ajUmwTbl2_ClpZS7AebJHHrkfA,12858
|
|
970
967
|
wisent/core/weight_modification/utils.py,sha256=h6QM5FrpvOu29_6YZNvs5bwBuJBvVgtBo18RQ_MW3_o,6907
|
|
968
|
+
wisent/examples/__init__.py,sha256=gaDcawBaga7CMOkxnu9cTGP2-Xq0bN1IkWZiDEPPCoM,18
|
|
971
969
|
wisent/examples/contrastive_pairs/humanization_human_vs_ai.json,sha256=7D6GpW-B99nXnhLj2q7WYZp5DWu8AMFzk3uyq7ambV0,247507
|
|
970
|
+
wisent/examples/scripts/__init__.py,sha256=HmFOUP_4AjzolMRK2FXhLzz_u29L-GxpppYUjW7M-Kw,30
|
|
972
971
|
wisent/examples/scripts/benchmark_tags.json,sha256=JjZGitGdgbJPXxk6PXGDsEaQBvAKlwJOAcET4rucRWA,29279
|
|
972
|
+
wisent/examples/scripts/count_all_benchmarks.py,sha256=WjgyFCV07QgOQfxV0_04GcQYi7eRaEfb3CipPYjAcHM,3913
|
|
973
|
+
wisent/examples/scripts/discover_directions.py,sha256=3KJjksYda9UB_GrFV3pNmgTfTi3u_Gxz0zpgZkncyD8,17532
|
|
974
|
+
wisent/examples/scripts/extract_benchmark_info.py,sha256=3JME-s-6UUBuQRBOlM5TgVyMu9pkLbF4jdm_QB9Dfuk,2243
|
|
975
|
+
wisent/examples/scripts/generate_paper_data.py,sha256=zKHG54r-gYtqvdhJJONXjtBsGtVeMpOEu2RbFOG-74I,14467
|
|
976
|
+
wisent/examples/scripts/intervention_validation.py,sha256=mrxM2E0DZgtxMuXi_LPJ0NFyGDSU0ZMwC1qk4I65Pv4,21962
|
|
973
977
|
wisent/examples/scripts/lm_eval_readme.json,sha256=X5bYjQrAUw031rjjFlrTlxxnllWGBSlqywF5kjh4mOw,89869
|
|
978
|
+
wisent/examples/scripts/search_all_short_names.py,sha256=brLUqAKTnmo4KA3v3vnou0BWOXUK2M0qpofPSXC0du0,1191
|
|
979
|
+
wisent/examples/scripts/test_all_benchmarks.py,sha256=oKwCgbSPQcQwRrjRjWdWn6Cz-JRBrRiWu7svwnWJc-g,4207
|
|
980
|
+
wisent/examples/scripts/test_all_benchmarks_new.py,sha256=4E1K_IuzC7Ut7dVYdd9lHZqa6dMMlsHPcbTz7JVhDCo,730
|
|
981
|
+
wisent/examples/scripts/test_contrastive_pairs_all_supported.py,sha256=FIQ6P6hXfLBArBp0OhliDaeqlbvRJafJiO9dMjBIkmw,8011
|
|
982
|
+
wisent/examples/scripts/test_nonsense_baseline.py,sha256=spdWAUb7sViAGpHOJyu3HThABcsJ_eolDxyhV5fkdBY,10254
|
|
983
|
+
wisent/examples/scripts/test_one_benchmark.py,sha256=_2iy1GB2CYXooZCuSo7vJ0sKBtjLZofsWSIO0lkEtu4,13624
|
|
984
|
+
wisent/examples/scripts/test_one_coding_benchmark.py,sha256=AXoD_E6kaNnTnI4Czi9ZYhd6aLrmjZP1PKDhKIUXb_A,10427
|
|
985
|
+
wisent/examples/scripts/threshold_analysis.py,sha256=Ugp5Whn7L_7C8S8JrskfdtOXIRz31Lt1232Uva77hgM,14906
|
|
986
|
+
wisent/examples/scripts/visualization_gallery.py,sha256=DP025fuVXEJ8-CPOB0O88IGQfek__TuHFo56Y-zfNv4,20243
|
|
974
987
|
wisent/examples/scripts/1/test_basqueglue_evaluation.json,sha256=4dmo2Mu7zZ_mFhrn1EWn5grPkOhNI4XjKUYmhCoICl0,1898
|
|
975
988
|
wisent/examples/scripts/1/test_basqueglue_pairs.json,sha256=yCLswgp9q3SDzhso-pB5jbIlTHzqS_GEBtwCQgVwlXo,650
|
|
976
989
|
wisent/examples/scripts/1/test_bec2016eu_evaluation.json,sha256=rVRPrb-pot0bCu1p69ks2ltQiW_grUtRvxZonYupUY4,1897
|
|
@@ -1032,635 +1045,17 @@ wisent/examples/scripts/2/test_babilong_pairs.json,sha256=OOWUdyqtMXUv2_WWIqTTEY
|
|
|
1032
1045
|
wisent/examples/scripts/2/test_bangla_mmlu_evaluation.json,sha256=OtR2JvARwR99QphQDprHiyv7wjLPK9583gR_rCM9RQU,2073
|
|
1033
1046
|
wisent/examples/scripts/2/test_bangla_mmlu_pairs.json,sha256=GR9eXDwYdp0CBOyOZ9XF_yHv07KlDcpv8BpPF5wovXw,1340
|
|
1034
1047
|
wisent/examples/scripts/2/test_basque-glue_pairs.json,sha256=yCLswgp9q3SDzhso-pB5jbIlTHzqS_GEBtwCQgVwlXo,650
|
|
1035
|
-
wisent/examples/scripts/results/
|
|
1036
|
-
wisent/examples/scripts/results/
|
|
1037
|
-
wisent/examples/scripts/results/
|
|
1038
|
-
wisent/examples/scripts/results/
|
|
1039
|
-
wisent/examples/scripts/results/
|
|
1040
|
-
wisent/examples/scripts/results/
|
|
1041
|
-
wisent/examples/scripts/results/
|
|
1042
|
-
wisent/examples/scripts/results/benchmark_pair_totals.json,sha256=4QxerUtba3olSFBdFyjaY5DLXuc5Ml_TWP7_Z0s5AqU,5745
|
|
1043
|
-
wisent/examples/scripts/results/benchmark_tags.json,sha256=X_ouWT0yAz5tXEcoe6mEK2z8FoMxl3hyFKQFa6DFJtA,18479
|
|
1044
|
-
wisent/examples/scripts/results/benchmark_test_summary_nov4.json,sha256=Alj610XpssUmA4TUIBA8XahaPkZhygpW9Qxxp31Kw50,1248
|
|
1045
|
-
wisent/examples/scripts/results/coding_benchmarks_test_code_status.json,sha256=fdK0WRug8ZIc0xUVhc_6Qzik92BF_BWoaoHbGEbfyXI,5550
|
|
1046
|
-
wisent/examples/scripts/results/failing_benchmarks.json,sha256=q1QOAIFU5oUvU3YEQvIluTIaRAnyQbm1fi7wsrJjw9g,36471
|
|
1047
|
-
wisent/examples/scripts/results/failing_benchmarks_list.json,sha256=yLjh4irOrwutzpF6OQGwC3lxLJRGpvfrZxsEMHjIIuE,1625
|
|
1048
|
-
wisent/examples/scripts/results/failing_benchmarks_test_results.json,sha256=ziouxsa8VO_f5AuVuJtWmTgz_v4Zuh9nIDHnqigaU4c,18149
|
|
1049
|
-
wisent/examples/scripts/results/missing_benchmark_tags.json,sha256=UoXptlWIEX3edEJbAiJ06Do8-H3uHOMgioO9tUZyr10,4706
|
|
1050
|
-
wisent/examples/scripts/results/test_20_newsgroups_evaluation.json,sha256=UJXxIGeFmb-qoQCL1V12X5csTiGMA7yMPvk4pNHCWWU,916
|
|
1051
|
-
wisent/examples/scripts/results/test_20_newsgroups_pairs.json,sha256=w7GNDUp6hf-FSGR8Z2djvnuYDKZZHynnnBZb-kg-Agg,1124
|
|
1052
|
-
wisent/examples/scripts/results/test_AraDICE_evaluation.json,sha256=2lniZTUZ-g5TQFjW-_daDD_Zl7HaFiqzpDzcGOXSPUY,2447
|
|
1053
|
-
wisent/examples/scripts/results/test_AraDICE_pairs.json,sha256=ZcTWPtrbEnTABLf1t8MRVuMW6UP4zdJ5FuC7BBEnwus,1076
|
|
1054
|
-
wisent/examples/scripts/results/test_ArabCulture_evaluation.json,sha256=dDToZso53F7E2NT-rWxgPtSqqrBoNWRC5q-4KsbDes4,5664
|
|
1055
|
-
wisent/examples/scripts/results/test_ArabCulture_pairs.json,sha256=0WKa_XqsgWS3NrPuzg_bwTFW3xcm4D7BTsGaiOSMMnw,2742
|
|
1056
|
-
wisent/examples/scripts/results/test_Tag_evaluation.json,sha256=diHsOMTBW4AVNg-GU6CaF6etSofZLEVdWa9cRPrN-s4,1073
|
|
1057
|
-
wisent/examples/scripts/results/test_Tag_pairs.json,sha256=anAOb_Saxi_l_RZ8cE78KMEwMQIn0dX3zsWN_ipsPrA,384
|
|
1058
|
-
wisent/examples/scripts/results/test_aclue_evaluation.json,sha256=dlh3Nch72S0a4qyf-YzaM4VxCR2-DaViH_EH5VJrZCw,4111
|
|
1059
|
-
wisent/examples/scripts/results/test_aclue_pairs.json,sha256=-YrdFc_L2OzAmtkM0BAus1qfhGJfYl7pYL3Gvssy-to,1859
|
|
1060
|
-
wisent/examples/scripts/results/test_acp_bench_evaluation.json,sha256=h5D1gkKgKVY9ieT4jwcYjnBGF_1VajJ7fiIvaGI2uhY,1589
|
|
1061
|
-
wisent/examples/scripts/results/test_acp_bench_hard_evaluation.json,sha256=9Vb7T7ChOs_TBsHS7piJ-x1scgJyJ7kwilMFTmIuiy8,2804
|
|
1062
|
-
wisent/examples/scripts/results/test_acp_bench_hard_pairs.json,sha256=ZT8S5GIgWwPyfNtf8jHEO1_SAApmVx5dt6TgLei_W0o,2544
|
|
1063
|
-
wisent/examples/scripts/results/test_acp_bench_pairs.json,sha256=D3L4hYxhS0J3JBsk2izEmXhxt5SSWbng76vsA6sfI-4,1652
|
|
1064
|
-
wisent/examples/scripts/results/test_advanced_ai_risk_evaluation.json,sha256=0rbRqeXUxYIIk-QxNva2WMYoFzpATSHgGnfJufACaUM,1604
|
|
1065
|
-
wisent/examples/scripts/results/test_advanced_ai_risk_pairs.json,sha256=i7Sg5QIV1_E8bb4jT6AXkNvvyBrNeW9PVl6YdxFJb5U,590
|
|
1066
|
-
wisent/examples/scripts/results/test_aexams_evaluation.json,sha256=fCdtf1V6lf-qviXWgsN-bnq9t7WeQ-3jvhAkxJsrMO4,2768
|
|
1067
|
-
wisent/examples/scripts/results/test_aexams_pairs.json,sha256=1evSD_zurT_bTUQkdqBYq-xt4KoPeFcUB5Z20-BACpI,1138
|
|
1068
|
-
wisent/examples/scripts/results/test_afrimgsm_direct_amh_evaluation.json,sha256=bDPS5GxmsmKRb6sAxErR4nogXmgSOxzIP_BOzzf9EQ8,1271
|
|
1069
|
-
wisent/examples/scripts/results/test_afrimgsm_direct_amh_pairs.json,sha256=xtGe0bshz2iLAbIuI12IUeOI-6LpugfhSbXUWi8dYfQ,1000
|
|
1070
|
-
wisent/examples/scripts/results/test_afrimmlu_direct_amh_evaluation.json,sha256=eM0Rp54yfE6xswWrx4CCXRHj7Wo7ZJA5Q8i0V0lOz-0,1190
|
|
1071
|
-
wisent/examples/scripts/results/test_afrimmlu_direct_amh_pairs.json,sha256=DLJ7qHdvIdpzAFTDDlGqdFqYQLmdjHsVbq5PgjnrrjU,669
|
|
1072
|
-
wisent/examples/scripts/results/test_afrixnli_en_direct_amh_evaluation.json,sha256=qNsSpTnnRG8yVEfYeYV4sixnxg1XrSzrj0I0Rkkesag,1080
|
|
1073
|
-
wisent/examples/scripts/results/test_afrixnli_en_direct_amh_pairs.json,sha256=BKbzJUR8HjFLi7IGYudSXIx94pGh9x4AvO-ZkOndsRc,386
|
|
1074
|
-
wisent/examples/scripts/results/test_ag_news_evaluation.json,sha256=9oF_oOxv8M4X4pszreBA3V6wvvdO2mBxuqyMzH4flbI,894
|
|
1075
|
-
wisent/examples/scripts/results/test_ag_news_pairs.json,sha256=gjrHIcGIAjlYhn4a2ebIwER6BxA_7Y7Xp9XczzOFfTs,479
|
|
1076
|
-
wisent/examples/scripts/results/test_agieval_evaluation.json,sha256=S2pRGt0RfH5roC6wRVyYjZcpa3ZG4Om9dSTLEiVd784,1628
|
|
1077
|
-
wisent/examples/scripts/results/test_agieval_pairs.json,sha256=us7zfgCQMGb4ZGSxdSLgR89P-25_Uop_RgdYQt1E0Ls,664
|
|
1078
|
-
wisent/examples/scripts/results/test_aime2024_evaluation.json,sha256=iG-4CFZRQZI6N2PM-_DQAwht9D10IOaOkBf3ZG5YHtY,867
|
|
1079
|
-
wisent/examples/scripts/results/test_aime2024_pairs.json,sha256=16Oxx8g2g21iKaUADksGSPKVY00i7I7C3PcczBoWbcA,221
|
|
1080
|
-
wisent/examples/scripts/results/test_aime2025_evaluation.json,sha256=zeuyGWCDGicdpXctuf13NhgG34O9CIMnkqpBg7UvoUM,867
|
|
1081
|
-
wisent/examples/scripts/results/test_aime2025_pairs.json,sha256=16Oxx8g2g21iKaUADksGSPKVY00i7I7C3PcczBoWbcA,221
|
|
1082
|
-
wisent/examples/scripts/results/test_aime_evaluation.json,sha256=lPUpLNXGLc2mIv7J7M-rDEXeiy5PR8vNrq1l_I88KeU,863
|
|
1083
|
-
wisent/examples/scripts/results/test_aime_pairs.json,sha256=16Oxx8g2g21iKaUADksGSPKVY00i7I7C3PcczBoWbcA,221
|
|
1084
|
-
wisent/examples/scripts/results/test_anagrams1_evaluation.json,sha256=9WCkRaLkJdLe-l3B3EkGM962EK_d_IXA99EyoWpcPAk,798
|
|
1085
|
-
wisent/examples/scripts/results/test_anagrams1_pairs.json,sha256=4JPuIVLPonmZp1aryksfHTy7yvq5TilpRjgBlfsHGD4,124
|
|
1086
|
-
wisent/examples/scripts/results/test_anagrams2_evaluation.json,sha256=VpI6UcF9XjvcL_8FIoJ-BpwiO9MNhzyRQRQcdGKot4U,828
|
|
1087
|
-
wisent/examples/scripts/results/test_anagrams2_pairs.json,sha256=KxxhxCgmBPi6zob3r__7kMGrI2mQtXw1Y-cq3qYQltw,137
|
|
1088
|
-
wisent/examples/scripts/results/test_anli_evaluation.json,sha256=9abyL6Jh4J9wM8dW0g-FvtqoNHqTLFqv0DMPHBa4790,885
|
|
1089
|
-
wisent/examples/scripts/results/test_anli_pairs.json,sha256=3CaPgA3zSy6PaHucuK4paSX411Gx18N2LOZftJ_OpPE,525
|
|
1090
|
-
wisent/examples/scripts/results/test_apps_evaluation.json,sha256=yuOyofvIOBv7zCu328X5rRcskb7YrJHezwvNWnDNqUM,9529
|
|
1091
|
-
wisent/examples/scripts/results/test_apps_pairs.json,sha256=qym_IuMoP3pbBSWplvQ0cMnAwl0z-0kcRmheUQUH5Ao,5746
|
|
1092
|
-
wisent/examples/scripts/results/test_arabic_exams_evaluation.json,sha256=F6IVmGHJsRGI1AhpG25N_zQdrWy5FoF8cT0GDobtNhk,1123
|
|
1093
|
-
wisent/examples/scripts/results/test_arabic_exams_pairs.json,sha256=9mUDUuSksBUB1L1DzAyYlcIL8OSxY552i5v2L59WRFI,446
|
|
1094
|
-
wisent/examples/scripts/results/test_arabic_leaderboard_complete_evaluation.json,sha256=04MoEweDm8ghjHplVEl4F7v8yib_ATO1XhJ3aBcFftw,2266
|
|
1095
|
-
wisent/examples/scripts/results/test_arabic_leaderboard_complete_pairs.json,sha256=epwwxpn8d7LRlTUZg_aAa15hCxEx3_enKgRlMUeNxkI,989
|
|
1096
|
-
wisent/examples/scripts/results/test_arabic_leaderboard_light_evaluation.json,sha256=ZFFMu6-QFGXl32-Sjnbo8Eb4pckd9U9QfBOqhQgKhbc,2036
|
|
1097
|
-
wisent/examples/scripts/results/test_arabic_leaderboard_light_pairs.json,sha256=1kQfNNeVRMPyBTinXK9ka1kWSHyNCR6H9QSddSNRP1o,762
|
|
1098
|
-
wisent/examples/scripts/results/test_arabicmmlu_evaluation.json,sha256=hcxHHt2_dzZHr5YNjQikEl8mg8CDzAAugARjgcNSP3Q,4028
|
|
1099
|
-
wisent/examples/scripts/results/test_arabicmmlu_pairs.json,sha256=qJzEIlg4SDZsL5QCDmfSqxnrVqwa7RIwFjKFZ3Vm4Cw,2092
|
|
1100
|
-
wisent/examples/scripts/results/test_arc_ar_evaluation.json,sha256=siu_sO29iLp7Dz_K475pps8TPYTwBfmxr7bPzfG6zXw,2358
|
|
1101
|
-
wisent/examples/scripts/results/test_arc_ar_pairs.json,sha256=dN5eXC6lL2WF3cpuZKOJEtTXM7P7EpFHvSkheFrMw8M,1188
|
|
1102
|
-
wisent/examples/scripts/results/test_arc_challenge_evaluation.json,sha256=gAlZ2puwR8LqvMC7nFUSzdBJke5K-wx1hD4XO8YTwRo,1070
|
|
1103
|
-
wisent/examples/scripts/results/test_arc_challenge_pairs.json,sha256=i_ZNQATvJAvvUh3IyoEZaVz2PPK3e9qakj96jTkX4jw,415
|
|
1104
|
-
wisent/examples/scripts/results/test_arc_easy_evaluation.json,sha256=u6Fz5JyIp3XNxOqgyCuK322JCSKKpsOAeyV7NznaqDQ,938
|
|
1105
|
-
wisent/examples/scripts/results/test_arc_easy_pairs.json,sha256=ILijbNk0MRN8QVigMTJj20iWI-cT0htqemvDRbo8NSU,225
|
|
1106
|
-
wisent/examples/scripts/results/test_argument_topic_evaluation.json,sha256=n2rP_sHh-8uT4z49Vn6j_jiCrepM89sSPZCPPd_DdqA,959
|
|
1107
|
-
wisent/examples/scripts/results/test_argument_topic_pairs.json,sha256=K89ZeRQQPd5Y8GxfsVXFiDQl8rJ86FU9VhiDj-LNfnk,1630
|
|
1108
|
-
wisent/examples/scripts/results/test_arithmetic_evaluation.json,sha256=2DZcnt5HyiWLiGq1nf-IC036lb5Sz3iVE2jPk0-RpkQ,1514
|
|
1109
|
-
wisent/examples/scripts/results/test_arithmetic_pairs.json,sha256=c31tGjv2mG7qqbymz5DneDxlYO4wMbhrVUUQUDeRrw4,334
|
|
1110
|
-
wisent/examples/scripts/results/test_asdiv_evaluation.json,sha256=HAwj7V8cHtyM4j7GwWbasl6zXZepW0mYZNj0OWycq2k,859
|
|
1111
|
-
wisent/examples/scripts/results/test_asdiv_pairs.json,sha256=9uIoQJXdSnpn2HYFH_sYeUz78vpeRi7Nz8VS5Zrj7q8,221
|
|
1112
|
-
wisent/examples/scripts/results/test_assin_entailment_evaluation.json,sha256=ogZaWg1VDrmYs8xjubr_yGtwmjPmpXgsrtD3ewzxq04,2146
|
|
1113
|
-
wisent/examples/scripts/results/test_assin_entailment_pairs.json,sha256=0Qt0R3rGcSzEciIbX8fFJxZTsdtdnYTGXS2p55l9WKI,633
|
|
1114
|
-
wisent/examples/scripts/results/test_atis_evaluation.json,sha256=pv1lWUOHOPfQUxhu8S5dvfoypxSBTPxaknMv2D9baNc,1365
|
|
1115
|
-
wisent/examples/scripts/results/test_atis_pairs.json,sha256=EieW893xtNjVBpJrJxJuTy1OvHnnZzJKPctnH1TevVE,1916
|
|
1116
|
-
wisent/examples/scripts/results/test_babi_evaluation.json,sha256=2O0czob2UoLANSIBO0BEAVNe4-gTOPdPH3sFcDA3u0k,899
|
|
1117
|
-
wisent/examples/scripts/results/test_babi_pairs.json,sha256=SjxpSXlWLOHx26XEozN6rTiYfwrkBG8rqies72sekLw,222
|
|
1118
|
-
wisent/examples/scripts/results/test_babilong_evaluation.json,sha256=sBiv35EeORDv4TOQRx3yd_SoB99LblbsTznrFbeEWUk,1454
|
|
1119
|
-
wisent/examples/scripts/results/test_babilong_pairs.json,sha256=OOWUdyqtMXUv2_WWIqTTEYX9okJXGVzIgnSYgAGljuc,41866
|
|
1120
|
-
wisent/examples/scripts/results/test_bangla_mmlu_evaluation.json,sha256=OtR2JvARwR99QphQDprHiyv7wjLPK9583gR_rCM9RQU,2073
|
|
1121
|
-
wisent/examples/scripts/results/test_bangla_mmlu_pairs.json,sha256=GR9eXDwYdp0CBOyOZ9XF_yHv07KlDcpv8BpPF5wovXw,1340
|
|
1122
|
-
wisent/examples/scripts/results/test_banking77_evaluation.json,sha256=4qs2s_yVg7iYEp9u5O58tCAUHxg7qQqBkkyHovV89w4,982
|
|
1123
|
-
wisent/examples/scripts/results/test_banking77_pairs.json,sha256=26xg0AmI1Z4DPKwdvCZt2jwjVpOnMmMv3Rs6cyV4y0o,1991
|
|
1124
|
-
wisent/examples/scripts/results/test_basque-glue_evaluation.json,sha256=WRLIktFz9oQIcpHp0zd4HCStK9G-LzFX3t8LNao6zFU,2955
|
|
1125
|
-
wisent/examples/scripts/results/test_basque-glue_pairs.json,sha256=I5cwPeJcJXsaRrao0X_Q8iJCcCAzBPjNOaQxQIymgRA,1228
|
|
1126
|
-
wisent/examples/scripts/results/test_basque_bench_evaluation.json,sha256=qbmcyxku2K_K14Jh7pjT593oiRLX11c3pnqZNGUc_hc,2956
|
|
1127
|
-
wisent/examples/scripts/results/test_basque_bench_pairs.json,sha256=JzsmkN33b71HOLaZZAyBX9pdfgRZlDf_bIM-frz4a00,1228
|
|
1128
|
-
wisent/examples/scripts/results/test_basqueglue_evaluation.json,sha256=0KYY8wMMpHuvdtlsV9CmQjEW1xJ9-zOEnzEZIsSQzLg,2954
|
|
1129
|
-
wisent/examples/scripts/results/test_basqueglue_pairs.json,sha256=YzUEnHI38ZhDKsbBNOsnYy1OmjKTF3gZdgJSa5a-IAk,1228
|
|
1130
|
-
wisent/examples/scripts/results/test_bbh_evaluation.json,sha256=XcZ_04q_bB-0vgGoE0hiqB_nppKvnISTpcja_H0dvFo,2135
|
|
1131
|
-
wisent/examples/scripts/results/test_bbh_pairs.json,sha256=7KCwuccPW3lugOJWvUUlHpxhr4wZ3UzFf_wy_ssbC_A,1311
|
|
1132
|
-
wisent/examples/scripts/results/test_bbq_evaluation.json,sha256=-Lo6RQXt_XkMhWzwOzHBI39dbVlSRa7jspBuxSAXod4,954
|
|
1133
|
-
wisent/examples/scripts/results/test_bbq_pairs.json,sha256=26v1q-03Pb42IVkyfhgNLxSWh34AZ_atA9HGzo-EvyQ,331
|
|
1134
|
-
wisent/examples/scripts/results/test_bec2016eu_evaluation.json,sha256=DfqUQphUbPLSFnMRRo4yy07qSoQG7T79uRR8FhnMJ_A,2953
|
|
1135
|
-
wisent/examples/scripts/results/test_bec2016eu_pairs.json,sha256=7lNJz42y25-SMuIrhUlfJ7BHyek5x36r8aHcNhmSYSs,1228
|
|
1136
|
-
wisent/examples/scripts/results/test_belebele_evaluation.json,sha256=xxQkvL-kBvLKhhsNsSCEni7Dw7BFoEaUMY69uJO99w0,2214
|
|
1137
|
-
wisent/examples/scripts/results/test_belebele_pairs.json,sha256=h9RypNbw7geXsg7fWcBUwgJB5bS5gy0eDPGDizbouPQ,944
|
|
1138
|
-
wisent/examples/scripts/results/test_benchmarks_evaluation.json,sha256=MAOCk2IdwkhJ_uDtTSNl1CrO2HxhXLwNSMTAUgZZ9Lc,1812
|
|
1139
|
-
wisent/examples/scripts/results/test_benchmarks_pairs.json,sha256=KlTcdNMmXAlwArOmV3qLdfjTTSygO8Elu_eZWK3k-5A,1086
|
|
1140
|
-
wisent/examples/scripts/results/test_bertaqa_evaluation.json,sha256=kto40P6Jo5UuPWvxjjLvTr_bN7MRSbATwIoWHff4BbY,1604
|
|
1141
|
-
wisent/examples/scripts/results/test_bertaqa_pairs.json,sha256=7OtQCoFqK1_29r4zL8FSsF2c91KUKN4FYBeomdwfPL4,391
|
|
1142
|
-
wisent/examples/scripts/results/test_bhtc_v2_evaluation.json,sha256=izOv-P-hWlmm-d27yPmscDSVLZ9UzLnX3E5nztZK10Q,904
|
|
1143
|
-
wisent/examples/scripts/results/test_bhtc_v2_pairs.json,sha256=KZRti9y-wFKygQkcTM7LuimkUhcHd4qpgEGwCgPuw_0,427
|
|
1144
|
-
wisent/examples/scripts/results/test_bigbench_evaluation.json,sha256=JyskONgf5iIJu-_klbZ4xMHO9XSV0_Z8z_VwkVM7fjU,1664
|
|
1145
|
-
wisent/examples/scripts/results/test_bigbench_pairs.json,sha256=rrh2TwJtjMmU2HoIUCAWWgaJQ5qDCyhBz4d2XvVDWNU,1799
|
|
1146
|
-
wisent/examples/scripts/results/test_blimp_evaluation.json,sha256=k-t20pwFwWEamVh8UGzPgKQCrYEVUiFYLsxZ7VhW0nE,2251
|
|
1147
|
-
wisent/examples/scripts/results/test_blimp_pairs.json,sha256=yiDwzVlle_cyQ6Ro9jnjcRohtoFMsXTNHqivjIOv3ao,558
|
|
1148
|
-
wisent/examples/scripts/results/test_boolq-seq2seq_evaluation.json,sha256=T4qMKma5AtYicG6xFccx03GLYnLAyA-Wa-qmvACbIc4,872
|
|
1149
|
-
wisent/examples/scripts/results/test_boolq-seq2seq_pairs.json,sha256=YZiJJSLsFTIRMfctwiXSEStI3YaznaWTbF58-eGE8OQ,1583
|
|
1150
|
-
wisent/examples/scripts/results/test_boolq_evaluation.json,sha256=b4iXD4lHIrUZjntmXJSXQ-ONFpsdQ_nh7zLSiev-HlA,864
|
|
1151
|
-
wisent/examples/scripts/results/test_boolq_pairs.json,sha256=jK_jGZrMSaJVwiBYYmG9FxYaQhpn4-J9HH5lflr0lZ4,1554
|
|
1152
|
-
wisent/examples/scripts/results/test_c4_evaluation.json,sha256=WWCj0Hx4tbJ5cfQBpMRHY4gop2l4ofhLG7h0Q6M0I5M,1288
|
|
1153
|
-
wisent/examples/scripts/results/test_c4_pairs.json,sha256=WT3CZayRSj_RMC_Uoi057gj5WrsArkpQZx0nDS5t2xw,371
|
|
1154
|
-
wisent/examples/scripts/results/test_cabreu_evaluation.json,sha256=LOrsAwYzppKWpoClOyTxBKDcpIP8Gqf6-vxbkMo85ys,7307
|
|
1155
|
-
wisent/examples/scripts/results/test_cabreu_pairs.json,sha256=PF0Ml8b3oo2-KEHpmYOFa_aZirNeK-woqOAwtZ3f6OE,6895
|
|
1156
|
-
wisent/examples/scripts/results/test_careqa_evaluation.json,sha256=B8C75kicOK3quYBZCDhFkh-LHJV7hkINoI_6NwGu-g4,1672
|
|
1157
|
-
wisent/examples/scripts/results/test_careqa_pairs.json,sha256=Of0zuMtBLEafqCEKR5ffqC-PghQCzykMCT9N3Rp4NwI,731
|
|
1158
|
-
wisent/examples/scripts/results/test_catalan_bench_evaluation.json,sha256=sJWE9OcP2gFWTyaDJiim_O4O6BIY0XQmTUR46_Ve9lI,1829
|
|
1159
|
-
wisent/examples/scripts/results/test_catalan_bench_pairs.json,sha256=ybJuUti0sCeyZuGFSdsTCfkKtiNSCjksSHc1VeLczys,1883
|
|
1160
|
-
wisent/examples/scripts/results/test_catalanqa_evaluation.json,sha256=bomYcxWdkdabZ7ptvrPWpugAJcVNpSbKtHlfW-JXuLs,918
|
|
1161
|
-
wisent/examples/scripts/results/test_catalanqa_pairs.json,sha256=9zue9ntmKjFwKJetuLz3BX0HpBCL72000sjWT4IdkjA,952
|
|
1162
|
-
wisent/examples/scripts/results/test_catcola_evaluation.json,sha256=w2zfhB6YQ7l8szinoIni_zi8ncbIGiUuIolXa9JDrDA,918
|
|
1163
|
-
wisent/examples/scripts/results/test_catcola_pairs.json,sha256=DES1F-Bavgy_-7fl420bSb32fuSa-JQBjBwKuv1hMmE,240
|
|
1164
|
-
wisent/examples/scripts/results/test_cb_evaluation.json,sha256=4RdWDmJ3xDINLKxeyIf09kqcGWWcnenUs8O2qpnSjfQ,881
|
|
1165
|
-
wisent/examples/scripts/results/test_cb_pairs.json,sha256=QKViqRnSVeb-nQgJL1zRvNVZ2r_UcgXgX3yrePZx7Es,329
|
|
1166
|
-
wisent/examples/scripts/results/test_ceval_evaluation.json,sha256=wcjDYFj5B8R7UcHxLMLFQR-7w97eIk0nRVl3lf1tPuc,2283
|
|
1167
|
-
wisent/examples/scripts/results/test_ceval_pairs.json,sha256=dk4jGjqCE_HZLAWz6lIivYWRAt6rz0cao2GhhElzGVg,872
|
|
1168
|
-
wisent/examples/scripts/results/test_chain_of_thought_evaluation.json,sha256=NIsj71ylbuDJqB_dEAmcnGf2hwvFjb4UxgwHbYwTZrY,1582
|
|
1169
|
-
wisent/examples/scripts/results/test_chain_of_thought_pairs.json,sha256=Hj0R614SWLTerw8Z-TtuY_ezknF4xVmt2RD1m7beZek,553
|
|
1170
|
-
wisent/examples/scripts/results/test_chartqa_evaluation.json,sha256=DJacdQkemuDjwuFuqhXjznhWLWPhnea9C-f4_GYcCSE,819
|
|
1171
|
-
wisent/examples/scripts/results/test_chartqa_pairs.json,sha256=lVc_WfpfxUY6JWT1f8hcQQlOA0kRLq5BDRKD-sTrdHU,163
|
|
1172
|
-
wisent/examples/scripts/results/test_claim_stance_topic_evaluation.json,sha256=r43kMchm9NeoBqvrwRGSmdf_RQ8DkR8k-CiPnpu_COY,917
|
|
1173
|
-
wisent/examples/scripts/results/test_claim_stance_topic_pairs.json,sha256=Q4DP2sKyGgPqnerSfkLpmjGeYjUuEqdkaHLbs6GfADM,1910
|
|
1174
|
-
wisent/examples/scripts/results/test_cmmlu_evaluation.json,sha256=kD3YFj90X3YPDM8xYyHCVSZtINHXxa54n-W4jY6ad4I,3085
|
|
1175
|
-
wisent/examples/scripts/results/test_cmmlu_pairs.json,sha256=3CR0KaZccsrT3UBuox-T4xI3DGfZMWheFOT9rmSzOjU,1932
|
|
1176
|
-
wisent/examples/scripts/results/test_cnn_dailymail_evaluation.json,sha256=2xdFLCuLrI7Jhqu04QyhSPSjXPrwjKbPGhMV4kSjEl8,1710
|
|
1177
|
-
wisent/examples/scripts/results/test_cnn_dailymail_pairs.json,sha256=S1c_5HNR7YMIRy7z0fjMsRlCd5KhbPpmYXdgbl1WUIs,4727
|
|
1178
|
-
wisent/examples/scripts/results/test_cocoteros_es_evaluation.json,sha256=ahXlptFbAil4kf2iknnu8qPQG5Auklb_xbCeYIKjgSI,1181
|
|
1179
|
-
wisent/examples/scripts/results/test_cocoteros_es_pairs.json,sha256=x1XUZXKbohHuJcouIezJFi_1d_Ok8iGkuIVdtHVSo2A,385
|
|
1180
|
-
wisent/examples/scripts/results/test_codexglue_code_to_text_go_evaluation.json,sha256=T7k912Zo6CCp6KqP-uxv_wCltul3LdG3lzNdDNe8PwM,1144
|
|
1181
|
-
wisent/examples/scripts/results/test_codexglue_code_to_text_go_pairs.json,sha256=bE4f9bw6_bmzhDvBK7eUUcIp0YZdMUN4MLIABOjyReA,1271
|
|
1182
|
-
wisent/examples/scripts/results/test_codexglue_code_to_text_java_evaluation.json,sha256=eVluqR6mKYRYzBfUaY9vwg7vkwLkEtnBvHhcHxI9E2E,1146
|
|
1183
|
-
wisent/examples/scripts/results/test_codexglue_code_to_text_java_pairs.json,sha256=bE4f9bw6_bmzhDvBK7eUUcIp0YZdMUN4MLIABOjyReA,1271
|
|
1184
|
-
wisent/examples/scripts/results/test_codexglue_code_to_text_javascript_evaluation.json,sha256=t-DV2ml6tBNlxZCbZR85Mk6TLHPebVHp5XMF0mu4r0s,1152
|
|
1185
|
-
wisent/examples/scripts/results/test_codexglue_code_to_text_javascript_pairs.json,sha256=bE4f9bw6_bmzhDvBK7eUUcIp0YZdMUN4MLIABOjyReA,1271
|
|
1186
|
-
wisent/examples/scripts/results/test_codexglue_code_to_text_php_evaluation.json,sha256=wjaBRlJVk9FDqWLov8qhZSiGE5IX4ACCRfoycJqtpfs,1145
|
|
1187
|
-
wisent/examples/scripts/results/test_codexglue_code_to_text_php_pairs.json,sha256=bE4f9bw6_bmzhDvBK7eUUcIp0YZdMUN4MLIABOjyReA,1271
|
|
1188
|
-
wisent/examples/scripts/results/test_codexglue_code_to_text_python_evaluation.json,sha256=0vjJpfyI7YSiZk2cLDsRLKON62ekJ_yPpO-nLKBit6U,1148
|
|
1189
|
-
wisent/examples/scripts/results/test_codexglue_code_to_text_python_pairs.json,sha256=bE4f9bw6_bmzhDvBK7eUUcIp0YZdMUN4MLIABOjyReA,1271
|
|
1190
|
-
wisent/examples/scripts/results/test_codexglue_code_to_text_ruby_evaluation.json,sha256=iadmJqrfAQOrsoCGghFWi6uYfZWwQ2Y35Q4OQ-FK9m8,1146
|
|
1191
|
-
wisent/examples/scripts/results/test_codexglue_code_to_text_ruby_pairs.json,sha256=bE4f9bw6_bmzhDvBK7eUUcIp0YZdMUN4MLIABOjyReA,1271
|
|
1192
|
-
wisent/examples/scripts/results/test_coedit_gec_evaluation.json,sha256=oNucJ-YJW0OrWf8Jmlbf6ie3lCvM_HcYY1nddcvpIN4,1762
|
|
1193
|
-
wisent/examples/scripts/results/test_coedit_gec_pairs.json,sha256=80t6Cfu9be8TpPNaF0WOsRME6YbfLVyIBJyLGEuqM9o,687
|
|
1194
|
-
wisent/examples/scripts/results/test_cola_evaluation.json,sha256=4TOycnPImbfXliX05dKc8CUTW2MR8cKihmH0DRKR7OY,915
|
|
1195
|
-
wisent/examples/scripts/results/test_cola_pairs.json,sha256=8a5Dd84Qbeuy2a3CVpNfDwX4PGhYuw60j7YsM_5YwYE,249
|
|
1196
|
-
wisent/examples/scripts/results/test_commonsense_qa_evaluation.json,sha256=Dh2RPjf8vmF3Sqn4a83tPWUAX282KQ92NVj5UHmKpE0,889
|
|
1197
|
-
wisent/examples/scripts/results/test_commonsense_qa_pairs.json,sha256=GElMRlEYrHO2foSLcNMeYFZq_ILowHYV-ITl-RLkCcI,254
|
|
1198
|
-
wisent/examples/scripts/results/test_conala_evaluation.json,sha256=vFtN0a3pDm6tWG_0FxyYtKE4mX5Tl0NmvThkkP4YRfE,1153
|
|
1199
|
-
wisent/examples/scripts/results/test_conala_pairs.json,sha256=6HjJa_c-InK2aVa8TXyV5y0gwkldcKZdsw2PCBqrC88,307
|
|
1200
|
-
wisent/examples/scripts/results/test_concode_evaluation.json,sha256=jDU3G7zrHjeGL84AwJ9S6cgrFcQ6W0aHX_eJrrEN_gw,1126
|
|
1201
|
-
wisent/examples/scripts/results/test_concode_pairs.json,sha256=bE4f9bw6_bmzhDvBK7eUUcIp0YZdMUN4MLIABOjyReA,1271
|
|
1202
|
-
wisent/examples/scripts/results/test_copa_evaluation.json,sha256=7ds_h7aX0DclM-UT3kbFtfy5BTcC61-_GLj_PTa6tsk,1021
|
|
1203
|
-
wisent/examples/scripts/results/test_copa_pairs.json,sha256=9vZ5qZCZzMSLoLkSL2dW7JtvuaJ61INwowtMNJno6Mc,266
|
|
1204
|
-
wisent/examples/scripts/results/test_copal_id_evaluation.json,sha256=E00472fSXkOsrghGgu-ZOE3BLV5CK4L37_wHzDXDDps,1049
|
|
1205
|
-
wisent/examples/scripts/results/test_copal_id_pairs.json,sha256=oBZB1hq3BZkAudQyPIc2KAaaz7iQ6ZpWB1ceRkbjWgY,286
|
|
1206
|
-
wisent/examples/scripts/results/test_coqa_evaluation.json,sha256=Dbmjef69NmeTGM4F0b1FlCrSQES_scoQtxtUZXJpXqw,863
|
|
1207
|
-
wisent/examples/scripts/results/test_coqa_pairs.json,sha256=n2RU3_euUIwPzk1qCThIojrOo_z9JUIwNQwBQixs2mI,2348
|
|
1208
|
-
wisent/examples/scripts/results/test_coqcat_evaluation.json,sha256=i5pKT9mUk6iS2ubiq_mkW4utZIP15oVFqCK76a-adpE,978
|
|
1209
|
-
wisent/examples/scripts/results/test_coqcat_pairs.json,sha256=GWzqrA3XI7CK6VElef36IanFOOS7uJU-uKJSQ_8lQgg,1414
|
|
1210
|
-
wisent/examples/scripts/results/test_crows_pairs_evaluation.json,sha256=5LU5q4oHbHYTLzDz6_RL33WWzIimkY5FBI3jilhYNvo,2223
|
|
1211
|
-
wisent/examples/scripts/results/test_crows_pairs_pairs.json,sha256=DTMDM6kUAdiZb_osQFzBPJKW4ACLawbP91y_6O5pcE8,543
|
|
1212
|
-
wisent/examples/scripts/results/test_csatqa_evaluation.json,sha256=ZemydlxeR97I_NAsIWh4EvwfBInnJrqXYFP0PFD4VSU,2062
|
|
1213
|
-
wisent/examples/scripts/results/test_csatqa_pairs.json,sha256=EhaWZ6gF4iEZZiPdgmA57FT3Rjxm0BX69wUOHlv7NPY,16738
|
|
1214
|
-
wisent/examples/scripts/results/test_cycle_letters_evaluation.json,sha256=ynLm4vDWMSJKwbl-Xsemgz1m5Z1aEdQ3MB4n28RJONI,804
|
|
1215
|
-
wisent/examples/scripts/results/test_cycle_letters_pairs.json,sha256=Rn_PkojOpuiIDTHFBirHdfeia101K0EBo_GSpPPM1Ew,125
|
|
1216
|
-
wisent/examples/scripts/results/test_darija_bench_evaluation.json,sha256=mE-UlpD4_bpnlQt-rYW-4S4hS_HXOKpjup-f4pj20hw,2599
|
|
1217
|
-
wisent/examples/scripts/results/test_darija_bench_pairs.json,sha256=td8oZ9RFS5qeVx3gNdf6bgo3yjWGd6Tkz7jOa-8zByg,1711
|
|
1218
|
-
wisent/examples/scripts/results/test_darijahellaswag_evaluation.json,sha256=FGtUWgfmQsswahqXkE4LCSsHZz07gdJOiNdhkN9yCf4,2249
|
|
1219
|
-
wisent/examples/scripts/results/test_darijahellaswag_pairs.json,sha256=-buMWLczhUuoI2nWlszur0lhC7QkIh3jKfDMTKXpiYY,1075
|
|
1220
|
-
wisent/examples/scripts/results/test_darijammlu_evaluation.json,sha256=pPFB5GyxpL5la7L4g1fliScubibw7njgK1-oLvouaL8,4884
|
|
1221
|
-
wisent/examples/scripts/results/test_darijammlu_pairs.json,sha256=NGGpYIdGsT01HfjC0zYGOwBZWb8TYVEOk0s2WzOlCCU,4938
|
|
1222
|
-
wisent/examples/scripts/results/test_dbpedia_14_evaluation.json,sha256=9IKJ7skQ9IChdGin5YH2C8FD4dRZwb6zYG4IypiZ4eA,889
|
|
1223
|
-
wisent/examples/scripts/results/test_dbpedia_14_pairs.json,sha256=5DCuHnpY4v9-JNSoQwOh-UG9bFBNF2CJi9RBqVTIyBc,443
|
|
1224
|
-
wisent/examples/scripts/results/test_drop_evaluation.json,sha256=O0SvU8t-t35INLizNmLgYZoc3ToeySPEvRnn6VmRgqM,927
|
|
1225
|
-
wisent/examples/scripts/results/test_drop_pairs.json,sha256=_68MgtdAUN5y1_zQ5IdFGPXRjcbJhJcikbWU4FuQO9s,1140
|
|
1226
|
-
wisent/examples/scripts/results/test_ds1000_evaluation.json,sha256=5NTDhZcD_ni6XuXrxn3qI9l7JJ4FwSHiCujMpvURYTM,1314
|
|
1227
|
-
wisent/examples/scripts/results/test_ds1000_pairs.json,sha256=56SnkofYQiXDXYGjWYbKxOfUhW0hSew4GyZuaGgE9e8,1449
|
|
1228
|
-
wisent/examples/scripts/results/test_egyhellaswag_evaluation.json,sha256=Mnndav8dU-XSQSuhi62jix-O2XCTj50nJ6XW41Yrt_o,1776
|
|
1229
|
-
wisent/examples/scripts/results/test_egyhellaswag_pairs.json,sha256=p-3YQa3I76CEMxbrky9C5i1JqGLV_fB7-bMU-qAuOE0,605
|
|
1230
|
-
wisent/examples/scripts/results/test_egymmlu_evaluation.json,sha256=WoxCCYTlcCfJlSWlrYWnNNi_yjnJSBvJO3GWQCdYnWI,2817
|
|
1231
|
-
wisent/examples/scripts/results/test_egymmlu_pairs.json,sha256=aA_nRrn1UDmGT7MkXvgijhP9sa9Rnyfpfs-V2GJhHSE,1914
|
|
1232
|
-
wisent/examples/scripts/results/test_epec_koref_bin_evaluation.json,sha256=uptYxyqdNCvVAMXKVBzOe7MD-iagHcaPDDHzBPkeIJU,875
|
|
1233
|
-
wisent/examples/scripts/results/test_epec_koref_bin_pairs.json,sha256=_D4-SAq-KYq4Dh7Sz4Je_grkJs2A16XhYRcjWHMDBfM,395
|
|
1234
|
-
wisent/examples/scripts/results/test_eq_bench_evaluation.json,sha256=B-AqxREzlu0ECD_YtS---LdSKolwu70wwcu7AKE8HeY,1203
|
|
1235
|
-
wisent/examples/scripts/results/test_eq_bench_pairs.json,sha256=phvyjATGYJ1epmiCCdOBPxN1l_AO792udzCuAiZnWqY,1364
|
|
1236
|
-
wisent/examples/scripts/results/test_escola_evaluation.json,sha256=JKPRlQVkuaDLsLKzI5XxN4gwyOuJH04Qh37QDMB0TmA,939
|
|
1237
|
-
wisent/examples/scripts/results/test_escola_pairs.json,sha256=SiA_WBXRzwxUnQ2_j56d3t3MJyt7iklZguDmWl06rlI,177
|
|
1238
|
-
wisent/examples/scripts/results/test_ethics_cm_evaluation.json,sha256=MmzSjNpXgo2SRv37SDy9jm6uCP0C2gF73Z9B-oTVsdk,836
|
|
1239
|
-
wisent/examples/scripts/results/test_ethics_cm_pairs.json,sha256=00wwW87OJi4_RUt3AizJR6lMLTPYOkKhGzy7uwYlmhk,177
|
|
1240
|
-
wisent/examples/scripts/results/test_ethos_binary_evaluation.json,sha256=XeHT77YVOvGVUtIqu73B6FuxkxsdtWh8-C_U-5dYhsQ,939
|
|
1241
|
-
wisent/examples/scripts/results/test_ethos_binary_pairs.json,sha256=mfqI7rEbpZlnyMCufGG5QcCyq4iOSEJHZiKEbY7Mm7M,449
|
|
1242
|
-
wisent/examples/scripts/results/test_eus_exams_es_evaluation.json,sha256=eCeeKM0EKjAuyYuQo8iW7wDL0XlVuTFPl3n6cE5tVZw,4112
|
|
1243
|
-
wisent/examples/scripts/results/test_eus_exams_es_pairs.json,sha256=Bn3Xm1qJseSwhdAT8j3F4vu3u3K6e3smdMimdorX_JM,2025
|
|
1244
|
-
wisent/examples/scripts/results/test_eus_exams_evaluation.json,sha256=aMWHOmI1qOEPnUadmadu28pYLb4u-_Kxj2OHfHgXs4w,4109
|
|
1245
|
-
wisent/examples/scripts/results/test_eus_exams_pairs.json,sha256=Bn3Xm1qJseSwhdAT8j3F4vu3u3K6e3smdMimdorX_JM,2025
|
|
1246
|
-
wisent/examples/scripts/results/test_eus_proficiency_evaluation.json,sha256=cfm_4e8ZCArtf4t6c55JOSwgJ_N7EELQ9PsZ9zhq3T4,922
|
|
1247
|
-
wisent/examples/scripts/results/test_eus_proficiency_pairs.json,sha256=6JzoYrt_c26GokB3znOT7TgvY0O1EWLT_kqmKy26oJg,211
|
|
1248
|
-
wisent/examples/scripts/results/test_eus_reading_evaluation.json,sha256=IH05FVYgcDTVuTqddbdgzvmvBRIr1s4AuFjzqIz5x30,1385
|
|
1249
|
-
wisent/examples/scripts/results/test_eus_reading_pairs.json,sha256=PKa11xuBbOcI6FpAREUMesxjfIDhlSZmRdtbogECZLo,498
|
|
1250
|
-
wisent/examples/scripts/results/test_eus_trivia_evaluation.json,sha256=urYqWTWSYJcoaS1o1QRW_6e7vWfYRKsXUivmMxZSR4E,913
|
|
1251
|
-
wisent/examples/scripts/results/test_eus_trivia_pairs.json,sha256=sB3Pn-0utMG9Z1GrfATsLszoWobvY_Po51r3g2sRvxU,214
|
|
1252
|
-
wisent/examples/scripts/results/test_evalita-mp_evaluation.json,sha256=5MS0hwskRstAR2BhPOg-4-yl5J7AqFG8WfABkb4mYXE,1904
|
|
1253
|
-
wisent/examples/scripts/results/test_evalita-mp_pairs.json,sha256=HjC70ItXgdB5iE0LyEILkNb7JHsOrFsb3AGNhZc44zs,1785
|
|
1254
|
-
wisent/examples/scripts/results/test_evalita-sp_sum_task_fp-small_p1_evaluation.json,sha256=QfzE-7Sltc5ZiAn0HH66dgLNwLFtR3SgV_PW0p_FHiM,2869
|
|
1255
|
-
wisent/examples/scripts/results/test_evalita-sp_sum_task_fp-small_p1_pairs.json,sha256=BUTzfqVMdF-_emOOOn4cpvIEhiO4ggjs9tnak--DTNw,3268
|
|
1256
|
-
wisent/examples/scripts/results/test_evalita_LLM_evaluation.json,sha256=XAv0b6ZsY3FQTfePmAwZctCZKQjaTedZ5aDDMeGr_gU,1905
|
|
1257
|
-
wisent/examples/scripts/results/test_evalita_LLM_pairs.json,sha256=HjC70ItXgdB5iE0LyEILkNb7JHsOrFsb3AGNhZc44zs,1785
|
|
1258
|
-
wisent/examples/scripts/results/test_fda_evaluation.json,sha256=aP74kYT6BOD2qM05L4kRnAYuVw-tZvitE9caeG8e__M,998
|
|
1259
|
-
wisent/examples/scripts/results/test_fda_pairs.json,sha256=XZTBelsFlYkB0-valzK6W96-p-TE-8nlFq7zVhMCSa8,8182
|
|
1260
|
-
wisent/examples/scripts/results/test_financial_tweets_evaluation.json,sha256=SDmml0B30P1RSZiQY502QTV7fXyUH_YHlE0YJjy7Xm0,921
|
|
1261
|
-
wisent/examples/scripts/results/test_financial_tweets_pairs.json,sha256=JcsMYuLOrJ550nh_zrN8v2MxYNvIhtvReHFwD0OPVek,669
|
|
1262
|
-
wisent/examples/scripts/results/test_fld_evaluation.json,sha256=aiEXO4lqEdjtTzY4hFbFTH2CPZXeDPfKfme87WacMhE,842
|
|
1263
|
-
wisent/examples/scripts/results/test_fld_pairs.json,sha256=1L5jg_v5WHopxNJYpEplZXRowQ4hH3bKT3G2TMnW-CQ,1629
|
|
1264
|
-
wisent/examples/scripts/results/test_flores_evaluation.json,sha256=vDkapQOxi5g2qal8IEGF08szTWxM8ATQHRKiIfi4b-s,3915
|
|
1265
|
-
wisent/examples/scripts/results/test_flores_pairs.json,sha256=HRmZsjTuME55GRtXP5_KBPsxojNefPQPRs4l_QWc2_M,1910
|
|
1266
|
-
wisent/examples/scripts/results/test_freebase_evaluation.json,sha256=N3kgEsfL-mkSn4H6nyX5wUVlE8GSb7-H-X8XKnhBv3o,1048
|
|
1267
|
-
wisent/examples/scripts/results/test_freebase_pairs.json,sha256=29RyCFZUDEVuo9okvNWGWD4wvF-pvnTtV33F2gkV8wI,293
|
|
1268
|
-
wisent/examples/scripts/results/test_french_bench_evaluation.json,sha256=fleGxHmOfhe1_pVl_snl8CMfrqj4_QiL4UpIjQBPIHQ,2677
|
|
1269
|
-
wisent/examples/scripts/results/test_french_bench_pairs.json,sha256=Vb-FUJaL-wTV0cEgqpVmfJwegmeZniRRqirwT3HUuNk,1258
|
|
1270
|
-
wisent/examples/scripts/results/test_galcola_evaluation.json,sha256=3lMUcse5omV9hk17btflMTZnOq7y1TtAsr_krXbuQvw,982
|
|
1271
|
-
wisent/examples/scripts/results/test_galcola_pairs.json,sha256=D4ECFn7QtOstIXignhIHP9acClIrh0vpe_oKZdxGbNE,243
|
|
1272
|
-
wisent/examples/scripts/results/test_galician_bench_evaluation.json,sha256=3KKwdau0a-5knxgX6kkVrlPlxueTRwRBNravHkmwr2E,5047
|
|
1273
|
-
wisent/examples/scripts/results/test_galician_bench_pairs.json,sha256=srtHtUgyzmAOEqnJhWJisaKhSTRJYw4U7U6jNIQgmQE,2886
|
|
1274
|
-
wisent/examples/scripts/results/test_glianorex_evaluation.json,sha256=6CLnzisor1mMqlxpLvTgYTXQmY3UhHsk7Nf0zxb7UO8,1006
|
|
1275
|
-
wisent/examples/scripts/results/test_glianorex_pairs.json,sha256=mqwrGlAwyWtMzftOfO_4HQbKVGNSppP_iDbMU5AvGZQ,658
|
|
1276
|
-
wisent/examples/scripts/results/test_global_mmlu_evaluation.json,sha256=EQiG1RkHTLvR4VBEXiv8b5vHXOq_PajfNIij7_YmT7c,2133
|
|
1277
|
-
wisent/examples/scripts/results/test_global_mmlu_pairs.json,sha256=spLwFJkOGruG-i1Csn6RCpKLr0-a8CVpQg4mzvO0JFs,826
|
|
1278
|
-
wisent/examples/scripts/results/test_glue_evaluation.json,sha256=xXKAFKDXmg0xaCj369bPD570sNIjOeLOVtTbSUkABvA,1600
|
|
1279
|
-
wisent/examples/scripts/results/test_glue_pairs.json,sha256=mymkijh1I9vEaoiIzq39Lm0L73UShIxQFBMcayoB7j4,628
|
|
1280
|
-
wisent/examples/scripts/results/test_gpqa_evaluation.json,sha256=2fEW-8wj4TDoHXhCas_YPZ4Z_N7xJiAzjXry7C3-lCk,1840
|
|
1281
|
-
wisent/examples/scripts/results/test_gpqa_pairs.json,sha256=y-TOv-Lo40zSpXVo4MXPGZTkIu_u3WNs4FZjjsK6upc,1084
|
|
1282
|
-
wisent/examples/scripts/results/test_gpt3_translation_benchmarks_evaluation.json,sha256=IdcK2tguDuY_WUWj4odEan4Oqjy_FVUfiPJiiP7JLxc,4101
|
|
1283
|
-
wisent/examples/scripts/results/test_gpt3_translation_benchmarks_pairs.json,sha256=3dOdaSTHcX0ccOVYYIWkpq687tJwFL1eIFc6EHoIKww,1419
|
|
1284
|
-
wisent/examples/scripts/results/test_groundcocoa_evaluation.json,sha256=rV_veFpVK3OImuZyzulwmph6NAdy7pI156SfE_dOKeM,988
|
|
1285
|
-
wisent/examples/scripts/results/test_groundcocoa_pairs.json,sha256=CirRCcb2q2pmIu8e6ANHBuubuvtj2shGc0zDjg0lBZQ,5350
|
|
1286
|
-
wisent/examples/scripts/results/test_gsm8k_evaluation.json,sha256=_nNDLwwfjqOFihfMuv0O3ZF_Ew2_0k_D-2o-d_DcZ5o,867
|
|
1287
|
-
wisent/examples/scripts/results/test_gsm8k_pairs.json,sha256=yxW6_k2XylyEqPMPhZhwxyCnw-vwCYBedSkx1o5Zeg4,403
|
|
1288
|
-
wisent/examples/scripts/results/test_haerae_evaluation.json,sha256=uK5ol-97fU29DkV0Vrb9L_4KScnSJzGOP8UU2Q8MFrg,2215
|
|
1289
|
-
wisent/examples/scripts/results/test_haerae_pairs.json,sha256=ltoQ282NCuvZlRnxBxrSc0sp1XqbRDGDJVv1PlMIMHQ,1468
|
|
1290
|
-
wisent/examples/scripts/results/test_headqa_evaluation.json,sha256=0k3HEcKU7qSyNN7W79tHDxGZopq_kqzbRMFfUtmx1K4,1029
|
|
1291
|
-
wisent/examples/scripts/results/test_headqa_pairs.json,sha256=rGY9CijTDzGGL85pxKZXZe_M-Px_E-uGOPOxqU26_M8,351
|
|
1292
|
-
wisent/examples/scripts/results/test_hellaswag_evaluation.json,sha256=_-iilhXZXRsaWp7LlJMFTc-Qmh2xCK4GOEB5a2mB3f0,1074
|
|
1293
|
-
wisent/examples/scripts/results/test_hellaswag_pairs.json,sha256=rbSvCblmQGvUgw-kZL03kidiCfiTIVfLnt_0yvmSoZI,312
|
|
1294
|
-
wisent/examples/scripts/results/test_hendrycks_ethics_evaluation.json,sha256=0wHr0vhBm2i8_3lgqhGrwcM65YuPgs33G6cxVDF609w,1598
|
|
1295
|
-
wisent/examples/scripts/results/test_hendrycks_ethics_pairs.json,sha256=uBKdLhk00i6DAAtQut1B0tqxx19kiPBEjlGBxFTfTwM,458
|
|
1296
|
-
wisent/examples/scripts/results/test_hendrycks_math_evaluation.json,sha256=s2orwBnwfMYspX3_GD3FO5e8J2ZuEwdlQDOrMKCbgMU,1665
|
|
1297
|
-
wisent/examples/scripts/results/test_hendrycks_math_pairs.json,sha256=MyZHhACbkn0PkMmAChQh3wIXOWrXpWYiNyLpmtSgo_4,445
|
|
1298
|
-
wisent/examples/scripts/results/test_histoires_morales_evaluation.json,sha256=5e8X1La9oLlLkkRRnU5zoSuf8CuGondBEwXM7pWIJSo,1396
|
|
1299
|
-
wisent/examples/scripts/results/test_histoires_morales_pairs.json,sha256=g1rM_DrRSeTwOG7SDGknO2W6Nyqb5NSS0vHFQzxqpjA,565
|
|
1300
|
-
wisent/examples/scripts/results/test_hmmt_evaluation.json,sha256=8XB_yyMUQOuzkYX__vmQSos4vDNX6Yt_MaDc9anyX1k,867
|
|
1301
|
-
wisent/examples/scripts/results/test_hmmt_feb_2025_evaluation.json,sha256=OIDOuto4Qm9HCBCjX3CVUhDIBQp6Ml4SeJ4yAzlraWI,876
|
|
1302
|
-
wisent/examples/scripts/results/test_hmmt_feb_2025_pairs.json,sha256=bfe5YJsR1WMdMNkaMjYBGxU8hqZaKLguLY9afvlCfjA,234
|
|
1303
|
-
wisent/examples/scripts/results/test_hmmt_pairs.json,sha256=bfe5YJsR1WMdMNkaMjYBGxU8hqZaKLguLY9afvlCfjA,234
|
|
1304
|
-
wisent/examples/scripts/results/test_hrm8k_evaluation.json,sha256=6HYYFhWhpzq2Y0DYk6NfJOmvHFl_shwL_x7SCbx46CY,1875
|
|
1305
|
-
wisent/examples/scripts/results/test_hrm8k_pairs.json,sha256=lZN6MfCBQ6Bq1GKVsaNE-CcLbT7TmwkzVcw_LXMFlQU,839
|
|
1306
|
-
wisent/examples/scripts/results/test_humaneval_evaluation.json,sha256=HC7TbsZN7SrjpHUBpdEWM35wBQj6jGLlXJnovjcjyl4,4167
|
|
1307
|
-
wisent/examples/scripts/results/test_humaneval_pairs.json,sha256=qZXOhERJoMGYk8J5EFoKLyKYu49_l5OealvoML-RWmo,1541
|
|
1308
|
-
wisent/examples/scripts/results/test_humaneval_plus_evaluation.json,sha256=ldl3iyWRY4Sc7WEFj-hJ7BQD0-QRBbgHq9l4JGPF8GA,4172
|
|
1309
|
-
wisent/examples/scripts/results/test_humaneval_plus_pairs.json,sha256=qZXOhERJoMGYk8J5EFoKLyKYu49_l5OealvoML-RWmo,1541
|
|
1310
|
-
wisent/examples/scripts/results/test_ifeval_evaluation.json,sha256=gOtlvCuVrfBgSJ73Xa5Yfjuv3z5U7aI17SHk13fg4F0,1104
|
|
1311
|
-
wisent/examples/scripts/results/test_ifeval_pairs.json,sha256=TCi8sdQ9kbjF1Ob9MQaJf10JBTpUlYmN_BrudTWclHk,534
|
|
1312
|
-
wisent/examples/scripts/results/test_instruct_humaneval_evaluation.json,sha256=UMpGUa1qXuXRocy6eBl2swB3D_R9fwwrVchzb-uFCHY,2214
|
|
1313
|
-
wisent/examples/scripts/results/test_instruct_humaneval_pairs.json,sha256=-XPga07HK8oiOMD1i22smzUp1KAI5xqg81YQf6ofdi4,1836
|
|
1314
|
-
wisent/examples/scripts/results/test_inverse_scaling_evaluation.json,sha256=oHUzSzzhF-Lfb91VZX-r869qacnyifJxGcEswDrjOfg,1587
|
|
1315
|
-
wisent/examples/scripts/results/test_inverse_scaling_hindsight_neglect_10shot_evaluation.json,sha256=NJN-QphkJMpBo5FD8c6vMHWVwG7MJjq621fPSERLZaA,897
|
|
1316
|
-
wisent/examples/scripts/results/test_inverse_scaling_hindsight_neglect_10shot_pairs.json,sha256=dmiHcLpmP90-KaWrHXWcRFaLI51cl7wKJBS1OVvkBXk,3043
|
|
1317
|
-
wisent/examples/scripts/results/test_inverse_scaling_pairs.json,sha256=BGaTxMETM5oGL24Mukz2_EgsUmGwHphm5tJ5zrnh7oo,1973
|
|
1318
|
-
wisent/examples/scripts/results/test_iwslt2017-ar-en_evaluation.json,sha256=JUjNmv-0VSb3NeX2v5oYNCijgvSDiYsFawf7G-h0Bx4,2307
|
|
1319
|
-
wisent/examples/scripts/results/test_iwslt2017-ar-en_pairs.json,sha256=mHj6LEr0usvxdt5K4rbi64c0ZqTMmFi4i57JjDpCesw,1414
|
|
1320
|
-
wisent/examples/scripts/results/test_iwslt2017-en-ar_evaluation.json,sha256=VMZGv37Ji7PjjmlliajLVehPWbafzkq0TGzsjXQi_zA,2307
|
|
1321
|
-
wisent/examples/scripts/results/test_iwslt2017-en-ar_pairs.json,sha256=hnCYmmkPDL9fVosNOMKtwKuz64Zik26kn5z5NT__GVE,1414
|
|
1322
|
-
wisent/examples/scripts/results/test_japanese_leaderboard_evaluation.json,sha256=yHx8LLslijfskvgapcNb8DX5tTmz_rKNUo3uYxliEL8,1901
|
|
1323
|
-
wisent/examples/scripts/results/test_japanese_leaderboard_pairs.json,sha256=sQdfqPcDetEMeHbOAeyt5r5WxVC1h3b2Iat4ob7rLNo,613
|
|
1324
|
-
wisent/examples/scripts/results/test_jsonschema_bench_evaluation.json,sha256=Vnp1Ha2PyH-VA3IasJtKQ4w9AJKSZldqcV9voMAP980,893
|
|
1325
|
-
wisent/examples/scripts/results/test_jsonschema_bench_pairs.json,sha256=rTNcw8zRB8sino6WuO6P2lhKEiRG2VHXSh-a2mhJMdc,19480
|
|
1326
|
-
wisent/examples/scripts/results/test_kbl_evaluation.json,sha256=8kGpFhxjO8x_HRSvAg6-WbTez2E8A51ES0i1b0MOCCM,1980
|
|
1327
|
-
wisent/examples/scripts/results/test_kbl_pairs.json,sha256=LV-Ua4yLlHsewRWlSYsZwTQsd9Gph9iJlDyrgPTTGdo,1803
|
|
1328
|
-
wisent/examples/scripts/results/test_kmmlu_evaluation.json,sha256=_ipQsnbnlMqNAcya6x_1yaEukdv75GShBsduslKP6js,4367
|
|
1329
|
-
wisent/examples/scripts/results/test_kmmlu_pairs.json,sha256=k4ZJBgxx-gYI0LFrCHfO_b-8eCA2Q6l1jX-lua53Nxk,2216
|
|
1330
|
-
wisent/examples/scripts/results/test_kobest_evaluation.json,sha256=GazAN4Lllr17o1Xyy4KXpGSpLjxAqO_zGFsLTd-l88k,2251
|
|
1331
|
-
wisent/examples/scripts/results/test_kobest_pairs.json,sha256=IWkCy1MdcVYoEk6vKaRGG5rERbsUgig5B-H_w4Bojsg,1855
|
|
1332
|
-
wisent/examples/scripts/results/test_kormedmcqa_evaluation.json,sha256=j85PbuvVbOUZCiROCx5s6xGeaDEqGvJmY-zFzC-To-Y,1221
|
|
1333
|
-
wisent/examples/scripts/results/test_kormedmcqa_pairs.json,sha256=1zItWyoLhYMnSx5dEUSm62Wl47PTgM7IFA0vabZ7yNU,1133
|
|
1334
|
-
wisent/examples/scripts/results/test_lambada_cloze_evaluation.json,sha256=gvT47FFYyM9Z9Nh_Uko-hAaOd63B82MjHLkdT_hvPas,887
|
|
1335
|
-
wisent/examples/scripts/results/test_lambada_cloze_pairs.json,sha256=8RCMdUcaJRjHeayPWYdV_3uXiurW6zzwUWtAvAIzsyU,458
|
|
1336
|
-
wisent/examples/scripts/results/test_lambada_evaluation.json,sha256=beUxcF4FDT7j8ZqXMkiUOJjfR7FvN1oMwmJjO7SLK7o,881
|
|
1337
|
-
wisent/examples/scripts/results/test_lambada_multilingual_evaluation.json,sha256=DNICi_fRYNDqTwCKkTViMh5u2Tb9r2fMCvYAFDAKUhw,1648
|
|
1338
|
-
wisent/examples/scripts/results/test_lambada_multilingual_pairs.json,sha256=J_wDReRhKlfTCNowV9xqgU0ko4uewXp6VVEJhVvt5ro,930
|
|
1339
|
-
wisent/examples/scripts/results/test_lambada_multilingual_stablelm_evaluation.json,sha256=qDYpgEeyaeoQhDYWC9Vnb8n6-sQ6wl9Ii4ojl2maaJ0,1674
|
|
1340
|
-
wisent/examples/scripts/results/test_lambada_multilingual_stablelm_pairs.json,sha256=4CTyzbFCDFjq6wIzR30iL_TBjx9yYpm5rj1ZjTj7thw,827
|
|
1341
|
-
wisent/examples/scripts/results/test_lambada_openai_evaluation.json,sha256=tObl_eY7drZaVDK6GDdRaqN7clgcD45iBX5YozJK-UY,886
|
|
1342
|
-
wisent/examples/scripts/results/test_lambada_openai_pairs.json,sha256=xMGsuzVg68MYRlY390HChWBK0BcxeWiwAK4hobQ0NPc,451
|
|
1343
|
-
wisent/examples/scripts/results/test_lambada_pairs.json,sha256=wN49Lxh6CB442qrLeP2Jo2-F8clJtx1C5W9GJzXIt2o,452
|
|
1344
|
-
wisent/examples/scripts/results/test_lambada_standard_evaluation.json,sha256=jSewuBV9w-EIab_RpOIwFn6RxuLb4XKCJYa4ljwjfHk,885
|
|
1345
|
-
wisent/examples/scripts/results/test_lambada_standard_pairs.json,sha256=zh9Ru3R849fBwppp8UZoj7BscDjyxW8qfeyOtAroyzs,589
|
|
1346
|
-
wisent/examples/scripts/results/test_leaderboard_evaluation.json,sha256=Tpck6aCefnexgobcfXM3ji8hbwMJ0yxAfeVBZBEzjFA,1917
|
|
1347
|
-
wisent/examples/scripts/results/test_leaderboard_pairs.json,sha256=8B0GFqsopf9uyW0rf_M2-Tv7ufxm1NB5FzRt5AqOTT0,872
|
|
1348
|
-
wisent/examples/scripts/results/test_libra_evaluation.json,sha256=XvgFoua3CpIO7PNBVzKFgji9rsU83YIE4CHNUJW2jZg,2485
|
|
1349
|
-
wisent/examples/scripts/results/test_libra_pairs.json,sha256=QA0Vxch6FIOKpd17z1ytL9TTA2vGnp-qYFtmk3ePu7M,880379
|
|
1350
|
-
wisent/examples/scripts/results/test_lingoly_evaluation.json,sha256=i3to6V4qYutI9nyjx_7lowdPeTE6VDxbn0X4MRCE-KE,1114
|
|
1351
|
-
wisent/examples/scripts/results/test_lingoly_pairs.json,sha256=2iAkMsykDno2K4ZkCSn2QdSbBqxXtk6S68jtz2gtjfU,3397
|
|
1352
|
-
wisent/examples/scripts/results/test_livecodebench_evaluation.json,sha256=vwTMrFUwRRSp-P4eisuiyUzHfwUWSC8xpBk-d2YX7h0,3481
|
|
1353
|
-
wisent/examples/scripts/results/test_livecodebench_pairs.json,sha256=W3P0-akjy_5kbetws0yAvnGUSK-7BNk99w5affkdQo4,2463
|
|
1354
|
-
wisent/examples/scripts/results/test_livemathbench_cnmo_en_evaluation.json,sha256=xigdJBdMptJZ-6aLe8eDmEH6T7w7iTjYEqX09Xtaz-s,900
|
|
1355
|
-
wisent/examples/scripts/results/test_livemathbench_cnmo_en_pairs.json,sha256=McXMGtCz2UD2QUXqylo1sTf-a6iAmoo5qLIthtNHVWo,260
|
|
1356
|
-
wisent/examples/scripts/results/test_livemathbench_cnmo_zh_evaluation.json,sha256=BkFqTOBtPM9fuSsEPV-4mNzWhV2vWJmBu5YRGGqCeRU,956
|
|
1357
|
-
wisent/examples/scripts/results/test_livemathbench_cnmo_zh_pairs.json,sha256=rvpcmohMC5eBnL5im_-JdUPRHh7XFFJZ1gt1JPM0osk,272
|
|
1358
|
-
wisent/examples/scripts/results/test_llama_evaluation.json,sha256=iDVGx1269b7B8W2fdYPX0LPSnS_V-WOZZR8jnuFv9ns,1062
|
|
1359
|
-
wisent/examples/scripts/results/test_llama_pairs.json,sha256=i_ZNQATvJAvvUh3IyoEZaVz2PPK3e9qakj96jTkX4jw,415
|
|
1360
|
-
wisent/examples/scripts/results/test_logiqa2_evaluation.json,sha256=Za93i3cFpej8eA1jn62rHi1LMKQPe88QSm6_vC_Hy5o,1402
|
|
1361
|
-
wisent/examples/scripts/results/test_logiqa2_pairs.json,sha256=KVIfTmhyZdttg2ryAgrl-oO16VK4_kvSZM2WeL2bwig,908
|
|
1362
|
-
wisent/examples/scripts/results/test_logiqa_evaluation.json,sha256=C8iRLhxAXwTFy8ptdIZx-Lwie13NZ4-Sewa51BRDSfo,1691
|
|
1363
|
-
wisent/examples/scripts/results/test_logiqa_pairs.json,sha256=elVOWcg1jhq0dIF7RLnDA2MDK4NN_FnPZN-grM343qA,1272
|
|
1364
|
-
wisent/examples/scripts/results/test_m_mmlu_evaluation.json,sha256=PclJkewbHm3_Rw5qTC8NfOT2NgERpZmuYbn2oyzJV_g,3301
|
|
1365
|
-
wisent/examples/scripts/results/test_m_mmlu_pairs.json,sha256=wAAzpckbG1ZtJzULClaMmzjMb58vCexgJy04I3en6po,6160
|
|
1366
|
-
wisent/examples/scripts/results/test_mastermind_evaluation.json,sha256=f69woRnb2_yIiKm6JNTpM17z3YkisTqiYgwTgvv8Fzc,1846
|
|
1367
|
-
wisent/examples/scripts/results/test_mastermind_pairs.json,sha256=nZiJ_cPmiPfl799XB7t5vejrct1fZYCG_dWvHiGbKS0,1778
|
|
1368
|
-
wisent/examples/scripts/results/test_math500_evaluation.json,sha256=F8FHRWhePZGYu3k29BmDJEmwt14LDIfEkWk2yPOv6p8,1070
|
|
1369
|
-
wisent/examples/scripts/results/test_math500_pairs.json,sha256=h-g2WQ-86hoGHOly0_DD2fG7FJre0P8NUihhOI5NWkE,376
|
|
1370
|
-
wisent/examples/scripts/results/test_math_evaluation.json,sha256=-kzF9nksoli-AaMJRyvSw5qJK8c65XDcWZbQp3gABso,1067
|
|
1371
|
-
wisent/examples/scripts/results/test_math_pairs.json,sha256=h-g2WQ-86hoGHOly0_DD2fG7FJre0P8NUihhOI5NWkE,376
|
|
1372
|
-
wisent/examples/scripts/results/test_mathqa_evaluation.json,sha256=X-1i9Lz5YUamprD48dYZE5K9w9YjzyMutU0EpciTVWQ,867
|
|
1373
|
-
wisent/examples/scripts/results/test_mathqa_pairs.json,sha256=faRg8WeEewq6vGd6jl2p7vcrJ_tDUqAKjuVLyZ5bPYg,296
|
|
1374
|
-
wisent/examples/scripts/results/test_mbpp_evaluation.json,sha256=u52WM6boj2wKelvH8mdmDE5OTwvA3at1EdfQDGct6vk,2619
|
|
1375
|
-
wisent/examples/scripts/results/test_mbpp_pairs.json,sha256=Gkc2VORp4d11JV7OGQBSumeMSr6svf69Hc74ZiluKvY,840
|
|
1376
|
-
wisent/examples/scripts/results/test_mbpp_plus_evaluation.json,sha256=s1lIEhaqSsSnzCk-pXeuq4lK-PM-FvO9g4l67KI4SwA,2624
|
|
1377
|
-
wisent/examples/scripts/results/test_mbpp_plus_pairs.json,sha256=Gkc2VORp4d11JV7OGQBSumeMSr6svf69Hc74ZiluKvY,840
|
|
1378
|
-
wisent/examples/scripts/results/test_mc_taco_evaluation.json,sha256=1Y5oIUdsosSJoYLmur7l11epNgIE9EiGXGdTtx3wxOs,866
|
|
1379
|
-
wisent/examples/scripts/results/test_mc_taco_pairs.json,sha256=WPbTNx9ADn2LSU-P1jAs7-iarNG0Z-uCdHqwF3tnDzU,343
|
|
1380
|
-
wisent/examples/scripts/results/test_med_concepts_qa_evaluation.json,sha256=ouFMxeZaFneONKOFiCabnHUhi6GK5nqN0v0BLYwj_W4,1577
|
|
1381
|
-
wisent/examples/scripts/results/test_med_concepts_qa_pairs.json,sha256=QRn1FPe4dRcoE1E1DzIlg7hCqnVdeBZiXSeteJW44Kk,926
|
|
1382
|
-
wisent/examples/scripts/results/test_meddialog_evaluation.json,sha256=f4avjS3zlNiMbev2Bji9kVycJkXbOMEfC5LyTMvlDfs,1224
|
|
1383
|
-
wisent/examples/scripts/results/test_meddialog_pairs.json,sha256=Az1EqGbgyi-w-rLU0jdBN1KF1njqonbSowiY0dahbTU,2211
|
|
1384
|
-
wisent/examples/scripts/results/test_mediqa_qa2019_evaluation.json,sha256=Fvfph4eUhNd2jfrUjwFC71tl_b6SuG_yWvztP33maYQ,24657
|
|
1385
|
-
wisent/examples/scripts/results/test_mediqa_qa2019_pairs.json,sha256=7y_9xrpYvGk1D8A3oz6TLB481lH0vaemYR0WTDSCYvg,6176
|
|
1386
|
-
wisent/examples/scripts/results/test_medmcqa_evaluation.json,sha256=P__zH8WsY20aBMZvENbSzvv4dsm6kCsnjbMsx0BkpO0,1235
|
|
1387
|
-
wisent/examples/scripts/results/test_medmcqa_pairs.json,sha256=-RPjq5ws9WEHvDuA2kKb7PcLt_xO_pKHOmX9ZFo0vOA,429
|
|
1388
|
-
wisent/examples/scripts/results/test_medqa_evaluation.json,sha256=7Vit2oW56PIRdB7KIuc-0De1ViUZy_0mnCRxbK6krhw,918
|
|
1389
|
-
wisent/examples/scripts/results/test_medqa_pairs.json,sha256=r7IpFV92Er1y8qQG1uP3AgqMx43lKlHmS7ghSHuWuk4,580
|
|
1390
|
-
wisent/examples/scripts/results/test_medtext_evaluation.json,sha256=os6rwCha3MxiLHtb2K4_d2Pw8ETjsUUIz9gluDagaC8,3320
|
|
1391
|
-
wisent/examples/scripts/results/test_medtext_pairs.json,sha256=gCX_ukp2Vz3XHVvXbHesJrMClk-jAUpL_hGiHDPuoRU,1132
|
|
1392
|
-
wisent/examples/scripts/results/test_mela_evaluation.json,sha256=YdoMUr0kc9mRISC4VX2LqBTgvYhwj9lnhFVM0jxDza4,1943
|
|
1393
|
-
wisent/examples/scripts/results/test_mela_pairs.json,sha256=1NcEOC-CypJNCGS2Z25bf4TKEniHE4sLwY0nd8NAMYk,779
|
|
1394
|
-
wisent/examples/scripts/results/test_meqsum_evaluation.json,sha256=T5cQUUNtSigyJKEhnGZokz2u9cTSZWJY8g4_1XRBZMo,1070
|
|
1395
|
-
wisent/examples/scripts/results/test_meqsum_pairs.json,sha256=6iAKdPeN42vvxkbP8JEDcNYN8G6J0o6hYqgpSOzld70,357
|
|
1396
|
-
wisent/examples/scripts/results/test_mercury_evaluation.json,sha256=7__Lb975QG74ongFxumyhuNADJjEK8v4HKxlsfPo-i4,3149
|
|
1397
|
-
wisent/examples/scripts/results/test_mercury_pairs.json,sha256=qGSktBzVt_D5eEbUOw8q7buwpy9QlNynSHskgIf_EMU,1101
|
|
1398
|
-
wisent/examples/scripts/results/test_metabench_evaluation.json,sha256=_Djazx2oyBNDMjmYfobqs--ZS-VK2Y0LizaB8K8b16g,2011
|
|
1399
|
-
wisent/examples/scripts/results/test_metabench_pairs.json,sha256=4f698yHCNn45jWtvsi937vlDwXc_bc8keBR1t7_WwME,1370
|
|
1400
|
-
wisent/examples/scripts/results/test_mgsm_evaluation.json,sha256=FDIgggevW6B6v-LVpG35Adnqevu0rhzqpFLFYuBGgCg,1905
|
|
1401
|
-
wisent/examples/scripts/results/test_mgsm_pairs.json,sha256=awNlZYzMZAnpvqIYAsmYIpX__dNpyULkK8SXB2eWtg0,1247
|
|
1402
|
-
wisent/examples/scripts/results/test_mimic_repsum_evaluation.json,sha256=HEx6y6epZtVORZ5SUcddcW2QaPQ2RWDAVcQrOOUaBBE,8379
|
|
1403
|
-
wisent/examples/scripts/results/test_mimic_repsum_pairs.json,sha256=6xrehIiqBprm0UlbTXcjDiClhkVNR2OCplerG4FbHrE,2679
|
|
1404
|
-
wisent/examples/scripts/results/test_minerva_math_evaluation.json,sha256=C0KqtQDoDVvQUrBOQi71y8EDy5XGjgH8Jh842-699hA,1959
|
|
1405
|
-
wisent/examples/scripts/results/test_minerva_math_pairs.json,sha256=x1tDTGTuf1Yz_M5EHN5c_mQUZH98ZlVRu_mbsXhxEvY,635
|
|
1406
|
-
wisent/examples/scripts/results/test_mlqa_evaluation.json,sha256=DfvQWNrJc6dVzHIaAP6Cu6VafX5E88eCi6Ec2r3_FuI,2261
|
|
1407
|
-
wisent/examples/scripts/results/test_mlqa_pairs.json,sha256=_nGqCBrp3b3AB9jByXnn9EqyJkAMffEaXJrp0vH7LrY,12808
|
|
1408
|
-
wisent/examples/scripts/results/test_mmlu-pro-plus_evaluation.json,sha256=fr6x3pn8JXjm7j3ZTvdiFW__SZCxQJNiSlBgjgRhxqI,1673
|
|
1409
|
-
wisent/examples/scripts/results/test_mmlu-pro-plus_pairs.json,sha256=LYLIMLEPk26hTFGdPa9wC600Yr7BSdIdtFy5eBoJh4s,1281
|
|
1410
|
-
wisent/examples/scripts/results/test_mmlu_evaluation.json,sha256=tuLggxat1t0pZHRyKWc5-gI_doo0CTR7DPigcERrVn8,2224
|
|
1411
|
-
wisent/examples/scripts/results/test_mmlu_pairs.json,sha256=NR0RPFx7gpxLk10bK5JJW-OPEm3sKARkHdx1Au6egB8,1212
|
|
1412
|
-
wisent/examples/scripts/results/test_mmlu_pro_evaluation.json,sha256=3xCCgz2waH5GcaQ8ORKr8Cy6_kXDSz8OLzRNYQTM1oo,1703
|
|
1413
|
-
wisent/examples/scripts/results/test_mmlu_pro_pairs.json,sha256=gRzICeSFw9FmONXL85pDuInxkD5aqdaGygfSFWWNdRU,1476
|
|
1414
|
-
wisent/examples/scripts/results/test_mmlu_prox_evaluation.json,sha256=sk_jcTTRMZrbQLD8mpxrF6xncdC_DiV9FLsakIVAIIU,2536
|
|
1415
|
-
wisent/examples/scripts/results/test_mmlu_prox_pairs.json,sha256=VISvlVzvo7SbVtg9-Hq2XWhfRJyqjYJRxFciIZ6CRWU,2398
|
|
1416
|
-
wisent/examples/scripts/results/test_mmlusr_evaluation.json,sha256=cJKhoFSSdCYc5bVDqC0rVoifhyWlRwXZUu1E_-1GLh8,869
|
|
1417
|
-
wisent/examples/scripts/results/test_mmlusr_pairs.json,sha256=5apvFNyzubhlep2ARl_-g055Hfn-Hq-f7aiO8-a-5Yk,230
|
|
1418
|
-
wisent/examples/scripts/results/test_mmmu_evaluation.json,sha256=4MVDj3KlgJg_LKZvlcJUfDrZoulOog04iJDwpsqS4hg,1547
|
|
1419
|
-
wisent/examples/scripts/results/test_mmmu_pairs.json,sha256=GNM-Pm-LSoLuOAkpg1fC-xAnAHG7Yo_QJ_BE8I53k4w,406
|
|
1420
|
-
wisent/examples/scripts/results/test_mnli_evaluation.json,sha256=PlDAWmGKjIbhxq6t81vUMbXwx6ssLZOBk2w_LaahQ5k,888
|
|
1421
|
-
wisent/examples/scripts/results/test_mnli_pairs.json,sha256=Pap-Hwf-p65DEgSqim6tFbcuwAMXJvds9gB5vkqsT5M,233
|
|
1422
|
-
wisent/examples/scripts/results/test_model_written_evals_evaluation.json,sha256=5rcANb0-W_ckW5OOtzx6US4RqxSSzsYcHT9pSWWTFIg,1603
|
|
1423
|
-
wisent/examples/scripts/results/test_model_written_evals_pairs.json,sha256=8aGjw1tE7oaMBd6ac7_wG0cwHDZPeWbX5Keq9o6Fr7w,1163
|
|
1424
|
-
wisent/examples/scripts/results/test_moral_stories_evaluation.json,sha256=Rf_hHwFRkrKhhtPSN3BmZmCEhWp0Qmiw_3xnikMax9g,1238
|
|
1425
|
-
wisent/examples/scripts/results/test_moral_stories_pairs.json,sha256=pEI0KX8TcmEx8BoVQQTtcA-BKgDpNpuYKL973ice68A,415
|
|
1426
|
-
wisent/examples/scripts/results/test_mts_dialog_evaluation.json,sha256=8zti1z8b_djL1UB01BzNt4nZBfKJO1injNUa3hD9LM8,2544
|
|
1427
|
-
wisent/examples/scripts/results/test_mts_dialog_pairs.json,sha256=fi6mGGIcT_LjNHrRpr9NISMc_VPls6n0trSSXfjQ-No,1243
|
|
1428
|
-
wisent/examples/scripts/results/test_multiblimp_evaluation.json,sha256=Vp-rOHvLtqu051a2rX__hz-TwXiEZc2yqLh6d01t6PA,2641
|
|
1429
|
-
wisent/examples/scripts/results/test_multiblimp_pairs.json,sha256=o7VTB8oeu9E_SJFeW5vUydoyCmNeN50g8opvnCu_rIM,1008
|
|
1430
|
-
wisent/examples/scripts/results/test_multimedqa_evaluation.json,sha256=rY3Hy5wWLd47sESGw3GIUrdO_miKBWeVlkPCGM6MJUo,1661
|
|
1431
|
-
wisent/examples/scripts/results/test_multimedqa_pairs.json,sha256=z-r1cibi5LPUp5-O2C7oL0q-7DXHh7b7sicD2Zn9z0c,1094
|
|
1432
|
-
wisent/examples/scripts/results/test_multipl_e_evaluation.json,sha256=vlfKWPP0dK2QbZz5-uCQMh480At1yyWRkX0AkxcoRqI,4579
|
|
1433
|
-
wisent/examples/scripts/results/test_multipl_e_pairs.json,sha256=MzcZml2RBBD0DlAmP-vs3xZXtoT0m3wD2pGsCe6YukM,1668
|
|
1434
|
-
wisent/examples/scripts/results/test_mutual_evaluation.json,sha256=IGoKKW2kCb5XPm5l08w7Tk2hVc-aA_vBm6aBG3GWrt4,1347
|
|
1435
|
-
wisent/examples/scripts/results/test_mutual_pairs.json,sha256=8-u5J_cx_0IxYKaiJklBEuDreE8FLohc3JARCC4l52Q,1033
|
|
1436
|
-
wisent/examples/scripts/results/test_non_greedy_robustness_agieval_aqua_rat_evaluation.json,sha256=MUr_9WEOuunLgQeh7NSMwQQuRRDWu7WMZiGwKURFAqw,979
|
|
1437
|
-
wisent/examples/scripts/results/test_non_greedy_robustness_agieval_aqua_rat_pairs.json,sha256=hlfqPK1o0KodtMbH4q3nKZFU6j6erXUzz7lOGg_NQuk,514
|
|
1438
|
-
wisent/examples/scripts/results/test_noreval_evaluation.json,sha256=ine0Fxve9kpdESw67UIOwIFlRi8p6FdoLFVjdzvUgRA,1555
|
|
1439
|
-
wisent/examples/scripts/results/test_noreval_pairs.json,sha256=gnPbR9uHRjxueKc1d6zrCVZz6PD1_c_KrZsW0ExV4VU,362
|
|
1440
|
-
wisent/examples/scripts/results/test_noticia_evaluation.json,sha256=v9I8VwXLfjB2TMLf_zERIvmWUNuaNsxoRz75qi_ra6o,1114
|
|
1441
|
-
wisent/examples/scripts/results/test_noticia_pairs.json,sha256=P5O5Tc67RNV45A_DRJgLyPDngzKqWs_X8oxpy4w-wFw,2268
|
|
1442
|
-
wisent/examples/scripts/results/test_nq_open_evaluation.json,sha256=CZZNIoRpjNDbScxC9nxWwSn3v25httU0Zz065zrXNyU,975
|
|
1443
|
-
wisent/examples/scripts/results/test_nq_open_pairs.json,sha256=vmsi1wyYZMVYmxHMdDMGrWTGNk7McE4s9JA8SC8x7BI,258
|
|
1444
|
-
wisent/examples/scripts/results/test_olaph_evaluation.json,sha256=tlFZzxONRbkhJjUHEmOBPo06qx130O-piPVXu5GDnMU,3322
|
|
1445
|
-
wisent/examples/scripts/results/test_olaph_pairs.json,sha256=sLKs-cEEg8wOIcG7bL5-REel2UPfnofgTt2PtBNuydc,921
|
|
1446
|
-
wisent/examples/scripts/results/test_openbookqa_evaluation.json,sha256=YmXM2mR7WE5-7X6H5EwTiedo6QY8o-ozrJIZuQ7rPTg,927
|
|
1447
|
-
wisent/examples/scripts/results/test_openbookqa_pairs.json,sha256=L_VshVYJlou9bj8GfZQPpbgR5ycTVrV75UmMkajzdyU,258
|
|
1448
|
-
wisent/examples/scripts/results/test_openllm_evaluation.json,sha256=RA7y4wESjsBdEoXqBR7SjWVOnK1Ep8Tk7lf-McXYCS4,3589
|
|
1449
|
-
wisent/examples/scripts/results/test_openllm_pairs.json,sha256=gc3r1_eo3BdM_V_oiJ36hVXanyqCcj2AYP7wUc6MjhI,2068
|
|
1450
|
-
wisent/examples/scripts/results/test_option_order_robustness_agieval_aqua_rat_evaluation.json,sha256=JCpnuTyJTqhRNnMaz70-Ksfu31wDjkHOxXTP4Hczhkw,981
|
|
1451
|
-
wisent/examples/scripts/results/test_option_order_robustness_agieval_aqua_rat_pairs.json,sha256=hlfqPK1o0KodtMbH4q3nKZFU6j6erXUzz7lOGg_NQuk,514
|
|
1452
|
-
wisent/examples/scripts/results/test_paloma_evaluation.json,sha256=cTLr0S6bGMkkK6ywp-0YlTzdF2yzHIfUyOyReaAlBuU,13794
|
|
1453
|
-
wisent/examples/scripts/results/test_paloma_pairs.json,sha256=1NCnC87kemagr0Qv1Ec6u5YTsjpQSAy4IOv8QdY911g,4378
|
|
1454
|
-
wisent/examples/scripts/results/test_paws-x_evaluation.json,sha256=ZhxMHD8OqUw1xaM4UMlckSG5lgWJrm3Vm9KhbAXKOOo,1844
|
|
1455
|
-
wisent/examples/scripts/results/test_paws-x_pairs.json,sha256=QomDQVAjgmRiOYAtnuZkYevFjwPyNmLPZDgpYxiAv_k,887
|
|
1456
|
-
wisent/examples/scripts/results/test_penn_treebank_evaluation.json,sha256=whE__BRLDMW-cFr20TJ5za8A4wvLqFxZTBCLlmWaPdw,3722
|
|
1457
|
-
wisent/examples/scripts/results/test_penn_treebank_pairs.json,sha256=_AWjDaXjel4jaiFb1IOk-bZ3wqNi9Yg4e59dZSOYlPc,1565
|
|
1458
|
-
wisent/examples/scripts/results/test_piqa_evaluation.json,sha256=P6YyDegF8wSsyGmuzQsynkzbXA1LCTmBI59vbcwTqEk,1839
|
|
1459
|
-
wisent/examples/scripts/results/test_piqa_pairs.json,sha256=1wH2ylQidQpuy1UvxaBVONjjc7zC8Pa2cT3rvp_RT0Q,849
|
|
1460
|
-
wisent/examples/scripts/results/test_polemo2_evaluation.json,sha256=FOO99tAhAoQwthVaPUw5P9nUk31zkgPB2WHJoVgLKW8,911
|
|
1461
|
-
wisent/examples/scripts/results/test_polemo2_pairs.json,sha256=LjWnibwZ9GWrfZ5kSiNmi3nZXoWmtsEvW_Hcqf-kgvI,429
|
|
1462
|
-
wisent/examples/scripts/results/test_polymath_en_high_evaluation.json,sha256=PTCjnInzvE8JAblMzvmx8m5EudBMqrf74nBX1clNkkg,875
|
|
1463
|
-
wisent/examples/scripts/results/test_polymath_en_high_pairs.json,sha256=vXaNI8UtVGZo7ysrQGWYh47GcumeQF6_VQ4ngRg8zNE,225
|
|
1464
|
-
wisent/examples/scripts/results/test_polymath_en_medium_evaluation.json,sha256=jEX02vrP9l_ticRXaG13GKTxemhRxI00Ens0K88Mca8,979
|
|
1465
|
-
wisent/examples/scripts/results/test_polymath_en_medium_pairs.json,sha256=vjC0qByKtHt4xMFG9OUPu4pUGtLx415CFLZ4MJRjop0,290
|
|
1466
|
-
wisent/examples/scripts/results/test_polymath_zh_high_evaluation.json,sha256=f-z_ZxD12J45n-8Nz0Emno3lwvkuhXIla9M3EvthZjo,935
|
|
1467
|
-
wisent/examples/scripts/results/test_polymath_zh_high_pairs.json,sha256=t8i5ZriVIT_KyyatYwcvJ16NOcHrDxhN41Z_lY2A4V8,270
|
|
1468
|
-
wisent/examples/scripts/results/test_polymath_zh_medium_evaluation.json,sha256=AGapX04mz2KzDEVLtgC4EPq8wuRzEOhoFm-gEyfz7ms,1061
|
|
1469
|
-
wisent/examples/scripts/results/test_polymath_zh_medium_pairs.json,sha256=a2nLV56FBnLPNp3C5gctjoei6iUzLP4JTWJ3mp2CT8k,349
|
|
1470
|
-
wisent/examples/scripts/results/test_portuguese_bench_evaluation.json,sha256=8dsVknTWuTKda85YoVKmhi5YU-sqNoRJu2yXG7HQmgc,4000
|
|
1471
|
-
wisent/examples/scripts/results/test_portuguese_bench_pairs.json,sha256=0pwL4bTLRJ6uXbkIMnLWYoD4JPXqT2Fbcy1G0UG3BNQ,2190
|
|
1472
|
-
wisent/examples/scripts/results/test_prompt_robustness_agieval_aqua_rat_evaluation.json,sha256=JEQ_-iDoK5au-IVf2idaaxs5lLkRQkcfK9O2l0q93_E,975
|
|
1473
|
-
wisent/examples/scripts/results/test_prompt_robustness_agieval_aqua_rat_pairs.json,sha256=hlfqPK1o0KodtMbH4q3nKZFU6j6erXUzz7lOGg_NQuk,514
|
|
1474
|
-
wisent/examples/scripts/results/test_prost_evaluation.json,sha256=wJj51-v8JEpcMvROsItrMBmsV_Uh98KB7TnXQ2Hb4E0,883
|
|
1475
|
-
wisent/examples/scripts/results/test_prost_pairs.json,sha256=0UA-IVEhtaS7AQ_QrFC87qhXTnXSZNye_CQecxdPc2M,253
|
|
1476
|
-
wisent/examples/scripts/results/test_ptb_evaluation.json,sha256=Gz2JHDOGGd7jFdK8y-UgLxPK9CV42Rql0CbLsljXviM,3712
|
|
1477
|
-
wisent/examples/scripts/results/test_ptb_pairs.json,sha256=2XajZW4Db3MDXK4lkPxwwoWFZfQ8Sk3xmpxef36UpBw,1565
|
|
1478
|
-
wisent/examples/scripts/results/test_pubmedqa_evaluation.json,sha256=GM4Lrp6jQ7wqfKr3KC9pkA36XsHb6x8x0ZS1jaUYe4I,869
|
|
1479
|
-
wisent/examples/scripts/results/test_pubmedqa_pairs.json,sha256=krcgQCockT7B4fgDty68L_lqFa8IPSB85JsJROjIZYg,1557
|
|
1480
|
-
wisent/examples/scripts/results/test_pythia_evaluation.json,sha256=B4hBcCinToy7vucnVoH5Y2zrGzHu0-UYpHXkk1_7Yk0,1806
|
|
1481
|
-
wisent/examples/scripts/results/test_pythia_pairs.json,sha256=tm8oBMDIJ0Zb_x-V9H-fjc4MCdfHsK4-7jG8kaYz7og,413
|
|
1482
|
-
wisent/examples/scripts/results/test_qa4mre_evaluation.json,sha256=d91z1t8qpUPmcohmF60rbeVMXH3hVpcWbyWPV94IdHY,1023
|
|
1483
|
-
wisent/examples/scripts/results/test_qa4mre_pairs.json,sha256=8dzioTuq2j3ZeDRoYhKqzMHr1YolLu8bEGFN4nT-E4U,8745
|
|
1484
|
-
wisent/examples/scripts/results/test_qasper_evaluation.json,sha256=ins_h22cFfVkEzqnEUc6gBfzSbieI1QtKKst081Ya7M,1072
|
|
1485
|
-
wisent/examples/scripts/results/test_qasper_pairs.json,sha256=CdR7bklX5esyhk36hH8bvW7WDeBKKKElvnBTvHMwbn4,1477
|
|
1486
|
-
wisent/examples/scripts/results/test_race_evaluation.json,sha256=zCXDua0wj5kFSvgSb_N3KUo5eSQiKTxQugxyRGDjEVM,1049
|
|
1487
|
-
wisent/examples/scripts/results/test_race_pairs.json,sha256=uKxuV24iH5hD87fIe3A1_o9MIHBjapH7EPOIcTVNT3I,1888
|
|
1488
|
-
wisent/examples/scripts/results/test_realtoxicityprompts_evaluation.json,sha256=AliJVbmT2TzflHaNQ54XftN5KZqJvQ4I6wQ-cJFxmlA,1383
|
|
1489
|
-
wisent/examples/scripts/results/test_realtoxicityprompts_pairs.json,sha256=-ZRWtUI0qSAWOx7PP3uXBWtOvq32JsqQdxszgY-16UY,351
|
|
1490
|
-
wisent/examples/scripts/results/test_recode_evaluation.json,sha256=BkHn0HZlhc0P2YM9GB16S-Su-rOuI4VcSsiN3ML47WM,3389
|
|
1491
|
-
wisent/examples/scripts/results/test_recode_pairs.json,sha256=-P3lrMjLrU47kjK1A-DZTGE2oRVZ-UdttRGvblom6aY,1277
|
|
1492
|
-
wisent/examples/scripts/results/test_record_evaluation.json,sha256=cA02Mecr4Ygb050Jk3AjeM5j6_9c1FZ9j52snPqext0,897
|
|
1493
|
-
wisent/examples/scripts/results/test_record_pairs.json,sha256=AFNH1tSovcNwBtJlBKV9fSlVBCw-2FsrWPV4cfgOWwc,1427
|
|
1494
|
-
wisent/examples/scripts/results/test_ruler_evaluation.json,sha256=xo49T3t1QmjQS-k0mZbxSZeV79bOZwl7F_ros4-DN-E,1719
|
|
1495
|
-
wisent/examples/scripts/results/test_ruler_pairs.json,sha256=cBQbgenfSKJfoHKgaMNkfLvw_Ozm1i7WjDyCJ3zp4fk,28484
|
|
1496
|
-
wisent/examples/scripts/results/test_sciq_evaluation.json,sha256=dNqTNtGCGziK3A6b-uoL_Uz_h2K1-Nk1vUDvu8JonRc,909
|
|
1497
|
-
wisent/examples/scripts/results/test_sciq_pairs.json,sha256=CG9VCEWOT0S3gR3RzzUAGi7oUpC2yHoACfbUUsyAmtg,537
|
|
1498
|
-
wisent/examples/scripts/results/test_score_evaluation.json,sha256=j-liQQqy3apfNakCcgnt1I2f-ZUWF0I09KQx2U-lNYQ,1773
|
|
1499
|
-
wisent/examples/scripts/results/test_score_pairs.json,sha256=hoG_hQSfSEPveBILiGzXNjGyW9DOXTWtEl6fDvYKQFw,581
|
|
1500
|
-
wisent/examples/scripts/results/test_self_consistency_evaluation.json,sha256=B9ZoGJlhOIbhuFLt2zNG2rCKxow5tqHIn8U2NyRk864,878
|
|
1501
|
-
wisent/examples/scripts/results/test_self_consistency_pairs.json,sha256=yxW6_k2XylyEqPMPhZhwxyCnw-vwCYBedSkx1o5Zeg4,403
|
|
1502
|
-
wisent/examples/scripts/results/test_siqa_evaluation.json,sha256=1alziLCUyDX_7o0N5sbNndysZBEaYSzR7luyVLnvTnY,987
|
|
1503
|
-
wisent/examples/scripts/results/test_siqa_pairs.json,sha256=fEDTSRyrTHBW1zgfjmP6XhonINqLcwsMnQOGqRF3RDs,347
|
|
1504
|
-
wisent/examples/scripts/results/test_spanish_bench_evaluation.json,sha256=wCfI38yE6Aln-ZjEkQfe2kIYsbjYSwD8UXByG792u00,2663
|
|
1505
|
-
wisent/examples/scripts/results/test_spanish_bench_pairs.json,sha256=7CNMc4P5A5oxc-5PEF3hRvYU3lD8Az2VMzIL-1Zb2NI,1235
|
|
1506
|
-
wisent/examples/scripts/results/test_squad2_evaluation.json,sha256=FuhDnQzcmU_KCjB0XEF8TNLJ21rd-YIR8VHTIw5OvAY,969
|
|
1507
|
-
wisent/examples/scripts/results/test_squad2_pairs.json,sha256=lO_MW2N-KxNymjgIqdraiRx5814j2B5QJ-hGjpXAhmI,1055
|
|
1508
|
-
wisent/examples/scripts/results/test_squadv2_evaluation.json,sha256=Ptp6ftFeIaep_18jUQbnDooiWl_-Rb1oZL2H9HEBWBQ,978
|
|
1509
|
-
wisent/examples/scripts/results/test_squadv2_pairs.json,sha256=9gmSl12mrGAaXL0TDebZO0yFefvSTiduZT3MpUO0Akk,1063
|
|
1510
|
-
wisent/examples/scripts/results/test_super-glue-lm-eval-v1-seq2seq_evaluation.json,sha256=dHD9bopxO_oPFHdwVN-X5VkREK7_ba3XTU5s1E_ZkkM,888
|
|
1511
|
-
wisent/examples/scripts/results/test_super-glue-lm-eval-v1-seq2seq_pairs.json,sha256=YZiJJSLsFTIRMfctwiXSEStI3YaznaWTbF58-eGE8OQ,1583
|
|
1512
|
-
wisent/examples/scripts/results/test_super-glue-lm-eval-v1_evaluation.json,sha256=ETuEkyK8GwV09yd9OE8KmjWyZzpRxGnFvM9fWPHmBrE,1654
|
|
1513
|
-
wisent/examples/scripts/results/test_super-glue-lm-eval-v1_pairs.json,sha256=ASGZcutkQv-dqflNqC70xTf8c0vfqC-cCo8FO_A_VaA,2729
|
|
1514
|
-
wisent/examples/scripts/results/test_swag_evaluation.json,sha256=WbIntRdAMsRkgkVkhXH495RnEfLd8flMNVZd1XA_aiw,1043
|
|
1515
|
-
wisent/examples/scripts/results/test_swag_pairs.json,sha256=fj-KXPXdS4e2Lt8lTGYz7QkOxvQ5yDpfoOrA9CiYYys,288
|
|
1516
|
-
wisent/examples/scripts/results/test_tinyBenchmarks_evaluation.json,sha256=GCN4KDa9HwZctfgBdF_GWXD0-1aEGhh_LK3adzcX7II,1816
|
|
1517
|
-
wisent/examples/scripts/results/test_tinyBenchmarks_pairs.json,sha256=KlTcdNMmXAlwArOmV3qLdfjTTSygO8Elu_eZWK3k-5A,1086
|
|
1518
|
-
wisent/examples/scripts/results/test_tmmluplus_evaluation.json,sha256=epDgRWk1EOr0x3EyNP8GFPMa5-L6teec1VaW-b0dy6g,3438
|
|
1519
|
-
wisent/examples/scripts/results/test_tmmluplus_pairs.json,sha256=qiV2NvDXx1h6uvXzldM3vTL_3CR9BbmxmkViXtlw1n8,1590
|
|
1520
|
-
wisent/examples/scripts/results/test_translation_evaluation.json,sha256=ZHJimHvMjVMQCuAlWF2WSG2cV3LdVWLJzgqTldW6WTA,2483
|
|
1521
|
-
wisent/examples/scripts/results/test_translation_pairs.json,sha256=ET1sAjTY8owKBheIr_DHmGLKFb_3hQeIiHKrtpL8RoQ,798
|
|
1522
|
-
wisent/examples/scripts/results/test_triviaqa_evaluation.json,sha256=loiHb2Y7Bl08egPzV2vSLjXFKy_VpVKUEmNPdGjZXpI,923
|
|
1523
|
-
wisent/examples/scripts/results/test_triviaqa_pairs.json,sha256=Pry_8uSNJ43u6pJvBI8AHPsWkCMeHO_s8lqy7u7ilVY,222
|
|
1524
|
-
wisent/examples/scripts/results/test_truthfulqa-multi_evaluation.json,sha256=LREOfE9bp4OHZF8dMIyvHbyxCJCVGMp0guB7H6zF62o,2254
|
|
1525
|
-
wisent/examples/scripts/results/test_truthfulqa-multi_pairs.json,sha256=vE5O-aBu9t1_M6JGxEvKIs4y7zxjUaRw0xofP-PzYxI,597
|
|
1526
|
-
wisent/examples/scripts/results/test_truthfulqa_evaluation.json,sha256=B-Fjz1DmOb0SEw0ufyk-HmMIubojb09ArtNCohqK0BM,1374
|
|
1527
|
-
wisent/examples/scripts/results/test_truthfulqa_mc1_evaluation.json,sha256=BqBYV3CP7SPDGz_ZRJ95m_R0lNckDEA4dnyZ5Xgi4pI,1378
|
|
1528
|
-
wisent/examples/scripts/results/test_truthfulqa_mc1_pairs.json,sha256=9NXU1laojUaEQXtoKQDYEImMosgO4MF4dPtdy9dEpgs,557
|
|
1529
|
-
wisent/examples/scripts/results/test_truthfulqa_mc2_evaluation.json,sha256=AeMsc60T14qwt7TJDIpbJqzVO40poR9SWUZfPpMsxHc,1378
|
|
1530
|
-
wisent/examples/scripts/results/test_truthfulqa_mc2_pairs.json,sha256=9NXU1laojUaEQXtoKQDYEImMosgO4MF4dPtdy9dEpgs,557
|
|
1531
|
-
wisent/examples/scripts/results/test_truthfulqa_pairs.json,sha256=9NXU1laojUaEQXtoKQDYEImMosgO4MF4dPtdy9dEpgs,557
|
|
1532
|
-
wisent/examples/scripts/results/test_turkishmmlu_evaluation.json,sha256=AnkNpn32HNhA9ncKMpmhYkfTKbm5j5sPejnZEFBB-y8,2010
|
|
1533
|
-
wisent/examples/scripts/results/test_turkishmmlu_pairs.json,sha256=uZxUHPKY43RsghFDNvSRd6IL9xZUYa3EjvF8C12oei4,934
|
|
1534
|
-
wisent/examples/scripts/results/test_unfair_tos_evaluation.json,sha256=mjW_7wMPOJ4O-arUf16VbodEu3ogzfOBKknCV1AYkLg,918
|
|
1535
|
-
wisent/examples/scripts/results/test_unfair_tos_pairs.json,sha256=fkqUlW6y3QYhWyrQCwYAtOToFoGQjP2G2V73GxQnkkk,488
|
|
1536
|
-
wisent/examples/scripts/results/test_unscramble_evaluation.json,sha256=bu7yzHEYR_xO64FGVb8hkPGp6YYIp1xIOGY6NPoOKCE,1485
|
|
1537
|
-
wisent/examples/scripts/results/test_unscramble_pairs.json,sha256=CgDUkWIMU-TvIE3EHrN0t2bWdcGwNGirfwIDlQXXwGI,262
|
|
1538
|
-
wisent/examples/scripts/results/test_webqs_evaluation.json,sha256=Bg35qWgfylN3Pf0CKvTSMawPcqLyZ10YYJCaEVqnvs8,1045
|
|
1539
|
-
wisent/examples/scripts/results/test_webqs_pairs.json,sha256=ZTXifP3ZwsbTW4F1nRNvTPB0bsJzacXiYqgOCgyYMuI,293
|
|
1540
|
-
wisent/examples/scripts/results/test_wikitext103_evaluation.json,sha256=MhNmXu3J_K-g-faNt1w2wLsEcfPZkmPScXVcc6h3EwI,3720
|
|
1541
|
-
wisent/examples/scripts/results/test_wikitext103_pairs.json,sha256=Lt1hRlaLTqi6S2_YMMhfVjGFTzhzmbeLwE1-UdEAcSo,1565
|
|
1542
|
-
wisent/examples/scripts/results/test_wikitext_evaluation.json,sha256=dzK8PjAo75A56GEtzOrfqpICxd1YIF-lR6L0Kh3ocBo,3717
|
|
1543
|
-
wisent/examples/scripts/results/test_wikitext_pairs.json,sha256=cq8HOwPiu4i5Qjn7WQkUkHTd6Xx-sVzZFz-n_qSvxW0,1565
|
|
1544
|
-
wisent/examples/scripts/results/test_winogender_evaluation.json,sha256=OPiDUAklkfkiw-U9uNeZG69hN3u5Wgs22JcuzAQyK80,1652
|
|
1545
|
-
wisent/examples/scripts/results/test_winogender_pairs.json,sha256=Wr4mgPnv98ZQJNLw7caQyqakL1BSaCB1Dj6an3mEkN4,485
|
|
1546
|
-
wisent/examples/scripts/results/test_winogrande_evaluation.json,sha256=TC2jspGQjHTYLR5kb4ZIr6u3MYssG2E5YhFxDdrjwVg,886
|
|
1547
|
-
wisent/examples/scripts/results/test_winogrande_pairs.json,sha256=pLNpvtDn9398l4JqzwlxdJAFTp1PpYRQSi5WP1oOBcc,233
|
|
1548
|
-
wisent/examples/scripts/results/test_wmdp_evaluation.json,sha256=i21siUjmeY7AbnaM5S1Y7EYuhC8e8uGFuGyDVbexN_s,1106
|
|
1549
|
-
wisent/examples/scripts/results/test_wmdp_pairs.json,sha256=NxZfI9iD6CV4jS3LV7AhoogEZpqnSwTCxfG4p0VPYJA,401
|
|
1550
|
-
wisent/examples/scripts/results/test_wmt-ro-en-t5-prompt_evaluation.json,sha256=bbnszaIIIiCcP6NQ9g28rhDTWTVl0kjZot7_o5QmODg,1168
|
|
1551
|
-
wisent/examples/scripts/results/test_wmt-ro-en-t5-prompt_pairs.json,sha256=iED7CMQMDdWDOlxsh07PyE4YWFqmO-3SoZ8ExzVdXKI,328
|
|
1552
|
-
wisent/examples/scripts/results/test_wmt14_en_fr_evaluation.json,sha256=FMQdeqh5akNJ5sOJ6YxgE1uB_OGhiWBwLlJYq_oy1I4,1147
|
|
1553
|
-
wisent/examples/scripts/results/test_wmt14_en_fr_pairs.json,sha256=ypwRrogw8zm_M10OWOZgggcGCaskcbEYN9-B5SaOMX0,298
|
|
1554
|
-
wisent/examples/scripts/results/test_wmt16_en_de_evaluation.json,sha256=oT86Ix1U9DuULsDgbGrSGrgn63X-Vr4KVr_SxsLRops,941
|
|
1555
|
-
wisent/examples/scripts/results/test_wmt16_en_de_pairs.json,sha256=lmYdCNDTGztU0gCIsVgKZ0yErjdLH-xsqIIkKaycJHg,197
|
|
1556
|
-
wisent/examples/scripts/results/test_wmt16_ro_en_evaluation.json,sha256=9ClcOUtO0vfHn_Zd29tqNUVEFxbRpSyfbXA1sQNmGYY,1131
|
|
1557
|
-
wisent/examples/scripts/results/test_wmt16_ro_en_pairs.json,sha256=hO0i_AfnErQ8ChKyWgiCws0dfY-E07txotfOaJY5ZVs,301
|
|
1558
|
-
wisent/examples/scripts/results/test_wsc273_evaluation.json,sha256=RV9FqeePrCsVYedlAnXksfGEppFtlBzL_P_YIuP_SMg,962
|
|
1559
|
-
wisent/examples/scripts/results/test_wsc273_pairs.json,sha256=yK8EMyi5fR_lx8wb2SdW7Co88tBD8ORJIdeJd4CpPkU,274
|
|
1560
|
-
wisent/examples/scripts/results/test_xcopa_evaluation.json,sha256=40LnQrNzZUabyvWXVyc4JSXDAY6TGeade_rg9cJwZ_o,1893
|
|
1561
|
-
wisent/examples/scripts/results/test_xcopa_pairs.json,sha256=RmrzF37PWhnw5sdzh-yKxBHCjgliNKw2CJ4-JKgYgpo,490
|
|
1562
|
-
wisent/examples/scripts/results/test_xnli_eu_evaluation.json,sha256=_PmCiZDR2xcImFgffTeK6mdHtQrIhq_3xTUcej-mKrg,906
|
|
1563
|
-
wisent/examples/scripts/results/test_xnli_eu_pairs.json,sha256=OnNCubMX4U5Haz3HgXRTEOgnkhkRqWnhlBL3TQJjmFk,302
|
|
1564
|
-
wisent/examples/scripts/results/test_xnli_evaluation.json,sha256=g_ojPO_A6CqpEWey4NVXZ5e13VcverS4jUURAaKZk_U,1843
|
|
1565
|
-
wisent/examples/scripts/results/test_xnli_pairs.json,sha256=lHgJF38o3VUeM9ApvV-5v-j2MobCP8mnFYtEdq7Vpi0,1171
|
|
1566
|
-
wisent/examples/scripts/results/test_xquad_evaluation.json,sha256=FWIrqhB6E9zIHyg0M9UprDedcYg0rNpVsFmpAzYzmsA,2171
|
|
1567
|
-
wisent/examples/scripts/results/test_xquad_pairs.json,sha256=syPySOQjRWsaHEfiWhrLEDOjvV-dCNjcp3uyKqIU86Q,2070
|
|
1568
|
-
wisent/examples/scripts/results/test_xstorycloze_evaluation.json,sha256=3LyG1hQyhyiWLqtgwBT4ZknTZaXililXxtSEwcopx-M,4641
|
|
1569
|
-
wisent/examples/scripts/results/test_xstorycloze_pairs.json,sha256=TOSmSQpSQNB1dklWDENQQkIQ-QtVsg7VFqn0P7AcVnI,2952
|
|
1570
|
-
wisent/examples/scripts/results/test_xsum_evaluation.json,sha256=ahpGvrimsFt1zCkY6iimuBPTSx0OW-0lbRUP5v-OkI8,1419
|
|
1571
|
-
wisent/examples/scripts/results/test_xsum_pairs.json,sha256=goOLYN9jYo-JYIigxdLEsWqgc2EsODU-YeDDWvCv6aE,840
|
|
1572
|
-
wisent/examples/scripts/results/test_xwinograd_evaluation.json,sha256=JyroLtcJj5oeChul7WdadkZsvOAVT18zuEIl3rNFqy0,2210
|
|
1573
|
-
wisent/examples/scripts/results/test_xwinograd_pairs.json,sha256=SDObE7ToPGGKjDrB20WVnCT8BCclvvFk_133Fdv2Img,835
|
|
1574
|
-
wisent/examples/scripts/results/test_yahoo_answers_topics_evaluation.json,sha256=g86lFm2e0ALaJruyKOabK0mkYJHTc1GiYpbpxGuVJqk,923
|
|
1575
|
-
wisent/examples/scripts/results/test_yahoo_answers_topics_pairs.json,sha256=g88bnzqG_95nONXy11ZnNQA-2x_m_R9FbwTtIUMgBgI,846
|
|
1576
|
-
wisent/examples/scripts/results/test_AraDiCE_boolq_egy/test_AraDiCE_boolq_egy_evaluation.json,sha256=8Fif1e-Z5Yj_MXcrLTvrdRv_1_TDGf4F-CcD9P6vc6I,1114
|
|
1577
|
-
wisent/examples/scripts/results/test_AraDiCE_boolq_egy/test_AraDiCE_boolq_egy_pairs.json,sha256=ACvi5qvSFg8N3zmaZ0lp3KFAVO0eIo8mulILuUDA09Q,402
|
|
1578
|
-
wisent/examples/scripts/results/test_aradice/test_aradice_evaluation.json,sha256=DLwvsG6RZmsSFdwvr9rcR7W3jPx5m0aa9vSl6UDF74Y,2195
|
|
1579
|
-
wisent/examples/scripts/results/test_aradice/test_aradice_pairs.json,sha256=R6Gd163_VDKHL933ktNjT630al_JtWzczLWgCWAikGQ,998
|
|
1580
|
-
wisent/examples/scripts/results/test_aradice3/test_aradice_evaluation.json,sha256=pr8FAerYR2UPI6nqbnHVPZmkCGArVHTOE79EcaNdXKY,1948
|
|
1581
|
-
wisent/examples/scripts/results/test_aradice3/test_aradice_pairs.json,sha256=7bV0mBa4IuyOOU0AOLa5GaDVSIm-v6hrMN5SKUpBqA0,751
|
|
1582
|
-
wisent/examples/scripts/results/test_basque/test_basque-glue_pairs.json,sha256=eiN94jLrpFyOEQPSJeu8CXttaLJFCGnnmixiOGRcxEk,570
|
|
1583
|
-
wisent/examples/scripts/results/test_basque2/test_basque-glue_evaluation.json,sha256=Np2XXbtbzl0d9aAcS7rrc6U3yMUE8S4SakKaxFCqQKY,1797
|
|
1584
|
-
wisent/examples/scripts/results/test_basque2/test_basque-glue_pairs.json,sha256=eiN94jLrpFyOEQPSJeu8CXttaLJFCGnnmixiOGRcxEk,570
|
|
1585
|
-
wisent/examples/scripts/results/test_basque_glue/test_basque-glue_evaluation.json,sha256=pMnny7J-O7FWKUZfY7z4fV4BSR2j03TuNpb7B53YEKk,1701
|
|
1586
|
-
wisent/examples/scripts/results/test_basque_glue/test_basque-glue_pairs.json,sha256=Iwt6Kmg3fiWhQXOkOlXtfKksYwsXvQWKV4S_NiEkleM,613
|
|
1587
|
-
wisent/examples/scripts/results/test_boolq/test_boolq_evaluation.json,sha256=b4iXD4lHIrUZjntmXJSXQ-ONFpsdQ_nh7zLSiev-HlA,864
|
|
1588
|
-
wisent/examples/scripts/results/test_boolq/test_boolq_pairs.json,sha256=jK_jGZrMSaJVwiBYYmG9FxYaQhpn4-J9HH5lflr0lZ4,1554
|
|
1589
|
-
wisent/examples/scripts/results/test_ceval/test_ceval_evaluation.json,sha256=wcjDYFj5B8R7UcHxLMLFQR-7w97eIk0nRVl3lf1tPuc,2283
|
|
1590
|
-
wisent/examples/scripts/results/test_ceval/test_ceval_pairs.json,sha256=dk4jGjqCE_HZLAWz6lIivYWRAt6rz0cao2GhhElzGVg,872
|
|
1591
|
-
wisent/examples/scripts/results/test_ceval_accountant/test_ceval-valid_accountant_evaluation.json,sha256=NwZBvgrCpm2ML57l_S2ezkBuD28Hbaq9-BKDCN8GT3A,2339
|
|
1592
|
-
wisent/examples/scripts/results/test_ceval_accountant/test_ceval-valid_accountant_pairs.json,sha256=c0fWeirDrdsrsN2LTUftkcjlMSqhFZig1aZlbokQWSg,938
|
|
1593
|
-
wisent/examples/scripts/results/test_ceval_valid/test_ceval_valid_evaluation.json,sha256=Mn-o6UK1MWuH3EDi1XsSlnuy0wOXMRWk7AUS_NYiE0E,2289
|
|
1594
|
-
wisent/examples/scripts/results/test_ceval_valid/test_ceval_valid_pairs.json,sha256=dk4jGjqCE_HZLAWz6lIivYWRAt6rz0cao2GhhElzGVg,872
|
|
1595
|
-
wisent/examples/scripts/results/test_darija_bench/test_darija_bench_evaluation.json,sha256=mE-UlpD4_bpnlQt-rYW-4S4hS_HXOKpjup-f4pj20hw,2599
|
|
1596
|
-
wisent/examples/scripts/results/test_darija_bench/test_darija_bench_pairs.json,sha256=td8oZ9RFS5qeVx3gNdf6bgo3yjWGd6Tkz7jOa-8zByg,1711
|
|
1597
|
-
wisent/examples/scripts/results/test_eus_exams/test_eus_exams_evaluation.json,sha256=aMWHOmI1qOEPnUadmadu28pYLb4u-_Kxj2OHfHgXs4w,4109
|
|
1598
|
-
wisent/examples/scripts/results/test_eus_exams/test_eus_exams_pairs.json,sha256=Bn3Xm1qJseSwhdAT8j3F4vu3u3K6e3smdMimdorX_JM,2025
|
|
1599
|
-
wisent/examples/scripts/results/test_evalita_llm/test_evalita_llm_evaluation.json,sha256=mukAfoY6hd2R5GiobTbjJavTvMP3tnMbXjIUgahYBHg,1905
|
|
1600
|
-
wisent/examples/scripts/results/test_evalita_llm/test_evalita_llm_pairs.json,sha256=HjC70ItXgdB5iE0LyEILkNb7JHsOrFsb3AGNhZc44zs,1785
|
|
1601
|
-
wisent/examples/scripts/results/test_evalita_mp/test_evalita-mp_te_prompt-1_evaluation.json,sha256=MOI3IDN3T5nThGnfryDslZ1ojyRFyPV6IAnbNkhskHM,889
|
|
1602
|
-
wisent/examples/scripts/results/test_evalita_mp/test_evalita-mp_te_prompt-1_pairs.json,sha256=aTLk2rUAIVnFYSqHhbj2WmLM144_i7u5sgooc3GPd7Y,300
|
|
1603
|
-
wisent/examples/scripts/results/test_evalita_mp2/test_evalita_mp_evaluation.json,sha256=6R1jAtX9sNhfYe9nVQvx4IvGLD4br8klbS_cXMdUNbs,1904
|
|
1604
|
-
wisent/examples/scripts/results/test_evalita_mp2/test_evalita_mp_pairs.json,sha256=HjC70ItXgdB5iE0LyEILkNb7JHsOrFsb3AGNhZc44zs,1785
|
|
1605
|
-
wisent/examples/scripts/results/test_evalita_sp2/test_evalita-sp_sum_task_fp-small_p1_evaluation.json,sha256=7pUXf4PqJLPFOEezImpguOlyQhvTn-WdPEzte3RSmXo,2869
|
|
1606
|
-
wisent/examples/scripts/results/test_evalita_sp2/test_evalita-sp_sum_task_fp-small_p1_pairs.json,sha256=yZ6BL9RAtKIpS0MiWcmiIcq-V3FBuDdkfB-TiU1xhto,3268
|
|
1607
|
-
wisent/examples/scripts/results/test_fld/test_fld_evaluation.json,sha256=S1F5EGJdHSkXIHZxz0YGqWmi_YgK_VJL2UpGHenu_fI,838
|
|
1608
|
-
wisent/examples/scripts/results/test_fld/test_fld_pairs.json,sha256=1L5jg_v5WHopxNJYpEplZXRowQ4hH3bKT3G2TMnW-CQ,1629
|
|
1609
|
-
wisent/examples/scripts/results/test_fld_fixed/test_fld_evaluation.json,sha256=aiEXO4lqEdjtTzY4hFbFTH2CPZXeDPfKfme87WacMhE,842
|
|
1610
|
-
wisent/examples/scripts/results/test_fld_fixed/test_fld_pairs.json,sha256=1L5jg_v5WHopxNJYpEplZXRowQ4hH3bKT3G2TMnW-CQ,1629
|
|
1611
|
-
wisent/examples/scripts/results/test_instruct_humaneval/test_instruct_humaneval_evaluation.json,sha256=ouYU9tVa0qtqLmMj3Z8PdXqh5S4zbFIg8rEekb7cuMU,4640
|
|
1612
|
-
wisent/examples/scripts/results/test_instruct_humaneval/test_instruct_humaneval_pairs.json,sha256=8nPVGlUHfsFdcoRV2Zq30zH9-9dXvrOXXHOJ7yMbvHc,1766
|
|
1613
|
-
wisent/examples/scripts/results/test_inverse_scaling_mc/test_inverse_scaling_mc_evaluation.json,sha256=a9w23kEXr9rzK1T9J_ka9uzjGZlXR5xtocclSs_gNkA,1590
|
|
1614
|
-
wisent/examples/scripts/results/test_inverse_scaling_mc/test_inverse_scaling_mc_pairs.json,sha256=TnxvMiVzO9Df42EZ1VivM1UtwoLtpisMTDR9SNJ5cpQ,1964
|
|
1615
|
-
wisent/examples/scripts/results/test_iwslt2017_ar_en/test_iwslt2017-ar-en_evaluation.json,sha256=lWTEYCVVtqSYGZGEGXZvejR_f2kqfwpOKap0DtCjdds,2307
|
|
1616
|
-
wisent/examples/scripts/results/test_iwslt2017_ar_en/test_iwslt2017-ar-en_pairs.json,sha256=BUu5vtNr-oHb201ONyrDANXSQLNB5XJ6bQ310cyaAJo,1414
|
|
1617
|
-
wisent/examples/scripts/results/test_iwslt2017_en_ar/test_iwslt2017-en-ar_evaluation.json,sha256=qk1QpcJgKhBukSbIjZdy6Xup6XM5YVpSCoIcD8EQRBA,2307
|
|
1618
|
-
wisent/examples/scripts/results/test_iwslt2017_en_ar/test_iwslt2017-en-ar_pairs.json,sha256=qQahZyr7GnOpbfy8RoAf2xAFszGzKzqE_2ZphoBL6Pc,1414
|
|
1619
|
-
wisent/examples/scripts/results/test_iwslt2017_group/test_iwslt2017_evaluation.json,sha256=qyt01KdxO5AfMYIAR1-Cv0l-Ts2u3NEB49t8WOsllt8,2301
|
|
1620
|
-
wisent/examples/scripts/results/test_iwslt2017_group/test_iwslt2017_pairs.json,sha256=Lb8LJ6ykOx6iXOcgcwfSRL4DANGNRg9IMOUfDunM9-0,1414
|
|
1621
|
-
wisent/examples/scripts/results/test_jsonschema_bench/test_jsonschema_bench_evaluation.json,sha256=Vnp1Ha2PyH-VA3IasJtKQ4w9AJKSZldqcV9voMAP980,893
|
|
1622
|
-
wisent/examples/scripts/results/test_jsonschema_bench/test_jsonschema_bench_pairs.json,sha256=rTNcw8zRB8sino6WuO6P2lhKEiRG2VHXSh-a2mhJMdc,19480
|
|
1623
|
-
wisent/examples/scripts/results/test_jsonschema_bench_final/test_jsonschema_bench_evaluation.json,sha256=Vnp1Ha2PyH-VA3IasJtKQ4w9AJKSZldqcV9voMAP980,893
|
|
1624
|
-
wisent/examples/scripts/results/test_jsonschema_bench_final/test_jsonschema_bench_pairs.json,sha256=rTNcw8zRB8sino6WuO6P2lhKEiRG2VHXSh-a2mhJMdc,19480
|
|
1625
|
-
wisent/examples/scripts/results/test_kbl_fixed/test_kbl_evaluation.json,sha256=8kGpFhxjO8x_HRSvAg6-WbTez2E8A51ES0i1b0MOCCM,1980
|
|
1626
|
-
wisent/examples/scripts/results/test_kbl_fixed/test_kbl_pairs.json,sha256=LV-Ua4yLlHsewRWlSYsZwTQsd9Gph9iJlDyrgPTTGdo,1803
|
|
1627
|
-
wisent/examples/scripts/results/test_kormedmcqa/test_kormedmcqa_evaluation.json,sha256=j85PbuvVbOUZCiROCx5s6xGeaDEqGvJmY-zFzC-To-Y,1221
|
|
1628
|
-
wisent/examples/scripts/results/test_kormedmcqa/test_kormedmcqa_pairs.json,sha256=1zItWyoLhYMnSx5dEUSm62Wl47PTgM7IFA0vabZ7yNU,1133
|
|
1629
|
-
wisent/examples/scripts/results/test_kormedmcqa_dentist/test_kormedmcqa_dentist_evaluation.json,sha256=k_oerHtwo5BP0n4tmvk9FY-OqkYPHp-Qrs0K33IAn9I,1135
|
|
1630
|
-
wisent/examples/scripts/results/test_kormedmcqa_dentist/test_kormedmcqa_dentist_pairs.json,sha256=hcU7f-g0h20OCCvcVADoQ7Ri0i6gLl4zPRG4QvLSL9E,837
|
|
1631
|
-
wisent/examples/scripts/results/test_lambada_final/test_lambada_openai_mt_stablelm_en_evaluation.json,sha256=y3Cm3YbjBv_RIXT2FTgaEEADBu9stGdGUgWMpkQ0SXk,903
|
|
1632
|
-
wisent/examples/scripts/results/test_lambada_final/test_lambada_openai_mt_stablelm_en_pairs.json,sha256=flzZN9GO7iUf6V22Mfqtyuktrdd3rK5ReKRNFwNIA4Q,452
|
|
1633
|
-
wisent/examples/scripts/results/test_lambada_multilingual/test_lambada_multilingual_evaluation.json,sha256=2007-h4hL1i6TQwvc5Afu8XZYOZlJN7unUEmJSqXph8,1644
|
|
1634
|
-
wisent/examples/scripts/results/test_lambada_multilingual/test_lambada_multilingual_pairs.json,sha256=vcJdBqSpnZ8kEzehkctGhi_LNsM66X3G1C_44hRJaiU,916
|
|
1635
|
-
wisent/examples/scripts/results/test_lambada_stablelm_en_fixed/test_lambada_openai_mt_stablelm_en_evaluation.json,sha256=TxQIkEKMuXBfr8CFIxDw-bOE3_AfQN6DA96oPs3lfcs,901
|
|
1636
|
-
wisent/examples/scripts/results/test_lambada_stablelm_en_fixed/test_lambada_openai_mt_stablelm_en_pairs.json,sha256=LyMRob8O1u3P3Z_5scO0_vCPIWN7YFyCJqF022Z5GRs,451
|
|
1637
|
-
wisent/examples/scripts/results/test_lambada_stablelm_fixed/test_lambada_openai_mt_stablelm_en_evaluation.json,sha256=bqWXs_-P5t3N_iHZ_8fuLkD28qjypiwDF_CApN26-Zo,903
|
|
1638
|
-
wisent/examples/scripts/results/test_lambada_stablelm_fixed/test_lambada_openai_mt_stablelm_en_pairs.json,sha256=1z3YrPxsSBnpotKl-xbzG3M7Ot4d2hCXVR4FkC-zSUI,452
|
|
1639
|
-
wisent/examples/scripts/results/test_libra/test_libra_evaluation.json,sha256=aVk-MyKvwga9sxUUgnG6DOSaA2xlO2vBAlG6jxgZv_Y,2485
|
|
1640
|
-
wisent/examples/scripts/results/test_libra/test_libra_pairs.json,sha256=v-b8smewd_4we1vsxOkyIn0Ol_oCi5xPv_5conndrgk,880379
|
|
1641
|
-
wisent/examples/scripts/results/test_mastermind/test_mastermind_evaluation.json,sha256=f69woRnb2_yIiKm6JNTpM17z3YkisTqiYgwTgvv8Fzc,1846
|
|
1642
|
-
wisent/examples/scripts/results/test_mastermind/test_mastermind_pairs.json,sha256=nZiJ_cPmiPfl799XB7t5vejrct1fZYCG_dWvHiGbKS0,1778
|
|
1643
|
-
wisent/examples/scripts/results/test_mastermind_24_easy/test_mastermind_24_easy_evaluation.json,sha256=E29v402NEemeza5RfRX-2Vpqykc4eBgKstGpF3wWN0E,935
|
|
1644
|
-
wisent/examples/scripts/results/test_mastermind_24_easy/test_mastermind_24_easy_pairs.json,sha256=x7HZA2lND47FIAVS6XuqfenqPYpv0Vi5z2e293V9jiM,531
|
|
1645
|
-
wisent/examples/scripts/results/test_med_concepts_qa/test_med_concepts_qa_evaluation.json,sha256=ouFMxeZaFneONKOFiCabnHUhi6GK5nqN0v0BLYwj_W4,1577
|
|
1646
|
-
wisent/examples/scripts/results/test_med_concepts_qa/test_med_concepts_qa_pairs.json,sha256=QRn1FPe4dRcoE1E1DzIlg7hCqnVdeBZiXSeteJW44Kk,926
|
|
1647
|
-
wisent/examples/scripts/results/test_med_concepts_qa_atc_easy/test_med_concepts_qa_atc_easy_evaluation.json,sha256=Ozg2aC9NwtF173Tc9TWKXcJAv0EiN2QaxFNDXweTgQs,877
|
|
1648
|
-
wisent/examples/scripts/results/test_med_concepts_qa_atc_easy/test_med_concepts_qa_atc_easy_pairs.json,sha256=RtJxjGHpn-gCGedHZZ5sM2bagfSFyGVF4Vf2z9dhedw,333
|
|
1649
|
-
wisent/examples/scripts/results/test_meddialog_raw_perplexity/test_meddialog_raw_perplexity_evaluation.json,sha256=Ffg25sLagyLYRyefmps_P8-stOfF-FttPiCx84qQaT8,3401
|
|
1650
|
-
wisent/examples/scripts/results/test_meddialog_raw_perplexity/test_meddialog_raw_perplexity_pairs.json,sha256=XneZGQh21Uy9Z0w3W7SHik7Wt7Tt1LzlXzXGAZdkpGQ,1124
|
|
1651
|
-
wisent/examples/scripts/results/test_passkey/test_passkey_evaluation.json,sha256=qKB-mMP9W933gVTJk55hPYxyfDUZFbuYR6SzF2hhVGc,1303
|
|
1652
|
-
wisent/examples/scripts/results/test_passkey/test_passkey_pairs.json,sha256=9lC5EuXXTw_wcsfViJC7xnmojlUBkBDy4U6NMY35Wm8,38658
|
|
1653
|
-
wisent/examples/scripts/results/test_paws_en/test_paws_en_evaluation.json,sha256=zF4GHcRrj7SA3iDc546R0aNlrJXN7_iUKO1lpFndnqk,868
|
|
1654
|
-
wisent/examples/scripts/results/test_paws_en/test_paws_en_pairs.json,sha256=3AMSPsHmYHKiO8hQVAfkcWICtsa3Sq731P6jYXO8YaU,369
|
|
1655
|
-
wisent/examples/scripts/results/test_pile_10k/test_pile_10k_evaluation.json,sha256=iif8Qd0STfl684SafDCF81InL6-FuaF6T63Kh96JjKw,3581
|
|
1656
|
-
wisent/examples/scripts/results/test_pile_10k/test_pile_10k_pairs.json,sha256=4HmOQNqCczfI6OEZeld1HU3HydzT06qD_68QIXJNiPM,1544
|
|
1657
|
-
wisent/examples/scripts/results/test_prompt_robustness_agieval_aqua_rat/test_prompt_robustness_agieval_aqua_rat_evaluation.json,sha256=v_6MzluhERLu25Tc7Lml6kXsvddV6MCLVBm49VBcR2s,975
|
|
1658
|
-
wisent/examples/scripts/results/test_prompt_robustness_agieval_aqua_rat/test_prompt_robustness_agieval_aqua_rat_pairs.json,sha256=cdRa2UXD_Zgta_OSSpHr36knjDOxf7sgTAcZzDK6WI0,570
|
|
1659
|
-
wisent/examples/scripts/results/test_siqa/test_siqa_evaluation.json,sha256=mlGNX3VgWyXk4tBBcB3c7oQ87LYppF4ohlSRDN5pkw4,959
|
|
1660
|
-
wisent/examples/scripts/results/test_siqa/test_siqa_pairs.json,sha256=8xrVmzRdfITwngaXf5J78WJKq_WEPPiRQLpYES0k2HE,294
|
|
1048
|
+
wisent/examples/scripts/results/test_AraDiCE_ArabicMMLU_lev_evaluation.json,sha256=fcQJbCj5AxAT0mHqSXH6M8stbp54KpWyKJw92qaPq8E,14062
|
|
1049
|
+
wisent/examples/scripts/results/test_AraDiCE_ArabicMMLU_lev_pairs.json,sha256=inaWlBB2zpzRyO7-YB1VYH0AGsduByBJ3_kwN4yTac4,6024
|
|
1050
|
+
wisent/examples/scripts/results/test_aexams_IslamicStudies_evaluation.json,sha256=zXXxnIR6Qb7y-Qh0WE-mrS7Oq2cZ082dUlEx6KG86bs,21734
|
|
1051
|
+
wisent/examples/scripts/results/test_aexams_IslamicStudies_pairs.json,sha256=XtRDKooN-Ht9Vqf8RRQPVdOyGmh1ZAODoxmQhLHNto8,8668
|
|
1052
|
+
wisent/examples/scripts/results/test_afrimgsm_pairs.json,sha256=qNbvIDdJ7Dss-T5bmSCxuUZ-e7UpjPStq7MbTjE-Sqc,6400
|
|
1053
|
+
wisent/examples/scripts/results/test_afrimmlu_evaluation.json,sha256=skwDyoaU4zTpk_Qg-HFAcSKR3R2OEERRi20xFKy0CmM,12575
|
|
1054
|
+
wisent/examples/scripts/results/test_afrimmlu_pairs.json,sha256=uOQ6MK9iXNt4c4h5S3-RI1KdBCV38T2FMPBWhqb4FEc,4851
|
|
1661
1055
|
wisent/parameters/__init__.py,sha256=dwyW8F6LSMPM-H4zQX6gn7x5qPs78oNAMYRiRPJ8UCk,36
|
|
1662
1056
|
wisent/parameters/lm_eval/all_lm_eval_task_families.json,sha256=MAFcazf3UoDplgaeWdkcKpAOzFRHyc5yLoXLqOwyFvc,2555
|
|
1663
|
-
wisent/parameters/lm_eval/broken_in_lm_eval.json,sha256=
|
|
1057
|
+
wisent/parameters/lm_eval/broken_in_lm_eval.json,sha256=v1sON6hTeKxORXVNrW_WJsIyFWhdIkOWwEXX2V5u2XE,3223
|
|
1058
|
+
wisent/parameters/lm_eval/category_directions.json,sha256=AfgWHCrVEvsjqvFeWDocY4hh3jlYVqkfhrrztWmKWTI,3555
|
|
1664
1059
|
wisent/parameters/lm_eval/evaluations_not_lm_eval_tasks.json,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
1665
1060
|
wisent/parameters/lm_eval/evaluator_check.json,sha256=XrfAOzyw3SYSIfqOo2Q_U-nXpM13ck4m-aRtL6Za9cg,131833
|
|
1666
1061
|
wisent/parameters/lm_eval/final_verification.json,sha256=clscpavGxNXbX2Xn-idHKXGO0_fhMyDalV5bYZtbYiw,740459
|
|
@@ -1671,18 +1066,25 @@ wisent/parameters/lm_eval/no_readmes.json,sha256=T1PNoYwrqgwDVLtfmj7L5e0Sq02OEbq
|
|
|
1671
1066
|
wisent/parameters/lm_eval/not_lm_eval_tasks.json,sha256=zcdUnstl_OA52DO5Sf8ZAPkNcu9B-bfuyTXxPm8MEr8,1964
|
|
1672
1067
|
wisent/parameters/lm_eval/read_tasks.json,sha256=MLOSbTPLXhMcPVw5QJosIIlUiRTFeQmbFZ16wFcMMKk,3401
|
|
1673
1068
|
wisent/parameters/lm_eval/readme_files.json,sha256=1VtyYzREk50c1VjBz5p2JhUcydE0-Kv0wXmIR9C8X3U,3401
|
|
1674
|
-
wisent/parameters/lm_eval/
|
|
1069
|
+
wisent/parameters/lm_eval/repair_plan.json,sha256=7fHvz9rYoeJvuuciXJekZq6ok-rI9ndVybbficmukbc,11131
|
|
1070
|
+
wisent/parameters/lm_eval/track_progress_not_lm_eval_tasks.json,sha256=6dujwX_RNY1MZFbWMb1MtXYK0CdN1QTC6ppPWpxO_64,3472
|
|
1071
|
+
wisent/parameters/lm_eval/weak_contrastive_pairs.json,sha256=ruwV_qTXWKvWKq6zlufYinzeQ1bz2yZJ6eOk_tAprGU,1202
|
|
1072
|
+
wisent/parameters/lm_eval/working_benchmarks.json,sha256=K1Wk2PU9BnmkVFoAwNJc3RcUODaSb2id6aGNjTSzTS0,3240
|
|
1073
|
+
wisent/parameters/lm_eval/working_benchmarks_categorized.json,sha256=F78AlZhPOWW9Si7Qhq28Yz7OZC1jo0c0oAmeZhVydto,4041
|
|
1675
1074
|
wisent/parameters/tasks/missing_task_families.json,sha256=h6g_2CYNQIW5SqRdcymDe4miWkGkVoD3yR0eOFZH4aw,65107
|
|
1676
1075
|
wisent/parameters/tasks/remaining_tasks_to_implement.json,sha256=8_YDVQ439DdvC3daNW7v8y0Zth1eUxum6QzdnKDp6a8,3432
|
|
1677
1076
|
wisent/parameters/tasks/risks.json,sha256=8U1LAY6Zrv68naYMzVlOrGgTBNL0l-9nC7moa-ljSHI,136
|
|
1678
1077
|
wisent/parameters/tasks/skills.json,sha256=63KirwoeFTabMsQ3B7IdNyQLyl8857J0gJF02tTNPQo,215
|
|
1679
1078
|
wisent/parameters/tasks/tasks.json,sha256=7HvSgYjO5dQfHfIwLB3D0h0lVQqpf2tKnU6U36j-r6Y,1140923
|
|
1680
|
-
wisent/scripts/run_quality_metrics_sweep.sh,sha256=
|
|
1079
|
+
wisent/scripts/run_quality_metrics_sweep.sh,sha256=Lj8euHTGBO3QMdNhpW5zFXWPd4bPPYLJRZmZPhQvhiM,10493
|
|
1681
1080
|
wisent/tests/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
1081
|
+
wisent/tests/test_aggregation_geometry.py,sha256=hh8aJ6VyuN_3xA0x9YaoPhu_lMVYKupUxpVyFtEF_18,9277
|
|
1682
1082
|
wisent/tests/test_all_cli_commands.py,sha256=7KqSZ8FsJEwXbgp0w_cfVtv9jgd-9P52fH3nx3jGF9k,23432
|
|
1083
|
+
wisent/tests/test_detector_accuracy.py,sha256=9puG4bcjmeHkMsMO62g49Jq5YjfqLA4r9rzsDYXQRU8,6464
|
|
1683
1084
|
wisent/tests/test_geometry_comprehensive.py,sha256=lUyBfZYudMMaX2-nV2QhtQcchbBaz8bLi6fqmMRQOig,13693
|
|
1085
|
+
wisent/tests/test_geometry_exhaustive.py,sha256=yQnUIjNTW8DaC_bwU_rfHThOutLoMGxTHxsbkbqCZNQ,49679
|
|
1684
1086
|
wisent/tests/test_titan_geometry.py,sha256=lKWsFSCGEHFHD-CW_lz0vfATb6iFij0lrrLosBQJmkc,9710
|
|
1685
|
-
wisent/tests/visualize_geometry.py,sha256=
|
|
1087
|
+
wisent/tests/visualize_geometry.py,sha256=7l_QOoN7Rftmwzu6tn2M6Fug6uniKRSBguwCFeSnTzg,13841
|
|
1686
1088
|
wisent/tests/examples/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
1687
1089
|
wisent/tests/examples/cli/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
1688
1090
|
wisent/tests/examples/cli/activations/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
@@ -1712,9 +1114,9 @@ wisent/tests/nosense/__init__.py,sha256=sH3x4jRPzFM3YmQkdrwJoz-BdOQ1Bh6F95G5HWyI
|
|
|
1712
1114
|
wisent/tests/nosense/base_nosense.py,sha256=a18dBv1378nHly7OCIuk-bCcLnubss3XXDC1ex0zCK8,2633
|
|
1713
1115
|
wisent/tests/nosense/math500_nosense.py,sha256=My0dHsr4OFOiTxb_VDKmGzpoMyzAtqXlHhA0oPfaG7s,2389
|
|
1714
1116
|
wisent/tests/nosense/test_robustness.py,sha256=eeKji-_ls6tx7tuXqUO4BXxFRK-giJVihENAJVOvzSs,12546
|
|
1715
|
-
wisent-0.7.
|
|
1716
|
-
wisent-0.7.
|
|
1717
|
-
wisent-0.7.
|
|
1718
|
-
wisent-0.7.
|
|
1719
|
-
wisent-0.7.
|
|
1720
|
-
wisent-0.7.
|
|
1117
|
+
wisent-0.7.901.dist-info/licenses/LICENSE,sha256=wy0iaw8b2tyqZAfKHib3lP3PJ9o88FDCg92oUHh3sDQ,1073
|
|
1118
|
+
wisent-0.7.901.dist-info/METADATA,sha256=gA_lnwxajFyuc_Dr9wFJ7v9cLeQc27KELDeDiDX4ugo,2125
|
|
1119
|
+
wisent-0.7.901.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
1120
|
+
wisent-0.7.901.dist-info/entry_points.txt,sha256=BM76j3xjtIcVZGk24iDf5w18s6SuqeOpaiAxfZhpnY8,49
|
|
1121
|
+
wisent-0.7.901.dist-info/top_level.txt,sha256=2Ts9Iyldnb3auIN2HBBaHPknRy7nSRDm2f6RGzYgr8A,7
|
|
1122
|
+
wisent-0.7.901.dist-info/RECORD,,
|