ai2-olmo-eval 0.7.1__tar.gz → 0.7.2__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/PKG-INFO +1 -1
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/ai2_olmo_eval.egg-info/PKG-INFO +1 -1
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/ai2_olmo_eval.egg-info/SOURCES.txt +12 -0
- ai2_olmo_eval-0.7.2/src/olmo_eval/oe_eval_tasks/basic_skills_arithmetic/rc_5shot/config.json +23 -0
- ai2_olmo_eval-0.7.2/src/olmo_eval/oe_eval_tasks/basic_skills_arithmetic/rc_5shot/requests.jsonl.gz +0 -0
- ai2_olmo_eval-0.7.2/src/olmo_eval/oe_eval_tasks/basic_skills_coding/rc_5shot/config.json +23 -0
- ai2_olmo_eval-0.7.2/src/olmo_eval/oe_eval_tasks/basic_skills_coding/rc_5shot/requests.jsonl.gz +0 -0
- ai2_olmo_eval-0.7.2/src/olmo_eval/oe_eval_tasks/basic_skills_common_knowledge/rc_5shot/config.json +23 -0
- ai2_olmo_eval-0.7.2/src/olmo_eval/oe_eval_tasks/basic_skills_common_knowledge/rc_5shot/requests.jsonl.gz +0 -0
- ai2_olmo_eval-0.7.2/src/olmo_eval/oe_eval_tasks/basic_skills_logical_reasoning/rc_5shot/config.json +23 -0
- ai2_olmo_eval-0.7.2/src/olmo_eval/oe_eval_tasks/basic_skills_logical_reasoning/rc_5shot/requests.jsonl.gz +0 -0
- ai2_olmo_eval-0.7.2/src/olmo_eval/oe_eval_tasks/basic_skills_pattern/rc_5shot/config.json +23 -0
- ai2_olmo_eval-0.7.2/src/olmo_eval/oe_eval_tasks/basic_skills_pattern/rc_5shot/requests.jsonl.gz +0 -0
- ai2_olmo_eval-0.7.2/src/olmo_eval/oe_eval_tasks/basic_skills_string_operations/rc_5shot/config.json +23 -0
- ai2_olmo_eval-0.7.2/src/olmo_eval/oe_eval_tasks/basic_skills_string_operations/rc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/tasks.py +40 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/version.py +1 -1
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/LICENSE +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/README.md +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/pyproject.toml +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/setup.cfg +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/ai2_olmo_eval.egg-info/dependency_links.txt +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/ai2_olmo_eval.egg-info/requires.txt +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/ai2_olmo_eval.egg-info/top_level.txt +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/__init__.py +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/ai2_arc/ARC-Challenge/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/ai2_arc/ARC-Challenge/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/ai2_arc/ARC-Challenge/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/ai2_arc/ARC-Easy/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/ai2_arc/ARC-Easy/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/ai2_arc/ARC-Easy/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/allenai/basic_arithmetic/none/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/allenai/basic_arithmetic/none/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/allenai/basic_arithmetic/none/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/boolq/none/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/boolq/none/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/boolq/none/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/glue/mrpc/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/glue/mrpc/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/glue/mrpc/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/glue/rte/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/glue/rte/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/glue/rte/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/glue/sst2/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/glue/sst2/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/glue/sst2/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/abstract_algebra/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/abstract_algebra/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/abstract_algebra/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/abstract_algebra/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/abstract_algebra/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/abstract_algebra/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/abstract_algebra/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/abstract_algebra/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/abstract_algebra/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/anatomy/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/anatomy/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/anatomy/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/anatomy/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/anatomy/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/anatomy/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/anatomy/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/anatomy/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/anatomy/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/astronomy/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/astronomy/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/astronomy/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/astronomy/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/astronomy/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/astronomy/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/astronomy/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/astronomy/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/astronomy/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/business_ethics/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/business_ethics/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/business_ethics/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/business_ethics/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/business_ethics/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/business_ethics/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/business_ethics/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/business_ethics/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/business_ethics/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/clinical_knowledge/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/clinical_knowledge/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/clinical_knowledge/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/clinical_knowledge/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/clinical_knowledge/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/clinical_knowledge/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/clinical_knowledge/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/clinical_knowledge/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/clinical_knowledge/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_biology/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_biology/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_biology/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_biology/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_biology/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_biology/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_biology/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_biology/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_biology/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_chemistry/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_chemistry/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_chemistry/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_chemistry/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_chemistry/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_chemistry/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_chemistry/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_chemistry/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_chemistry/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_computer_science/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_computer_science/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_computer_science/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_computer_science/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_computer_science/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_computer_science/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_computer_science/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_computer_science/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_computer_science/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_mathematics/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_mathematics/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_mathematics/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_mathematics/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_mathematics/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_mathematics/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_mathematics/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_mathematics/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_mathematics/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_medicine/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_medicine/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_medicine/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_medicine/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_medicine/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_medicine/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_medicine/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_medicine/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_medicine/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_physics/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_physics/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_physics/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_physics/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_physics/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_physics/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_physics/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_physics/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/college_physics/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/computer_security/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/computer_security/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/computer_security/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/computer_security/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/computer_security/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/computer_security/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/computer_security/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/computer_security/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/computer_security/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/conceptual_physics/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/conceptual_physics/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/conceptual_physics/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/conceptual_physics/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/conceptual_physics/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/conceptual_physics/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/conceptual_physics/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/conceptual_physics/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/conceptual_physics/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/econometrics/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/econometrics/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/econometrics/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/econometrics/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/econometrics/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/econometrics/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/econometrics/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/econometrics/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/econometrics/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/electrical_engineering/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/electrical_engineering/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/electrical_engineering/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/electrical_engineering/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/electrical_engineering/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/electrical_engineering/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/electrical_engineering/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/electrical_engineering/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/electrical_engineering/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/elementary_mathematics/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/elementary_mathematics/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/elementary_mathematics/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/elementary_mathematics/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/elementary_mathematics/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/elementary_mathematics/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/elementary_mathematics/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/elementary_mathematics/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/elementary_mathematics/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/formal_logic/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/formal_logic/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/formal_logic/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/formal_logic/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/formal_logic/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/formal_logic/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/formal_logic/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/formal_logic/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/formal_logic/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/global_facts/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/global_facts/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/global_facts/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/global_facts/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/global_facts/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/global_facts/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/global_facts/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/global_facts/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/global_facts/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_biology/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_biology/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_biology/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_biology/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_biology/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_biology/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_biology/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_biology/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_biology/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_chemistry/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_chemistry/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_chemistry/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_chemistry/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_chemistry/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_chemistry/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_chemistry/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_chemistry/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_chemistry/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_computer_science/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_computer_science/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_computer_science/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_computer_science/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_computer_science/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_computer_science/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_computer_science/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_computer_science/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_computer_science/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_european_history/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_european_history/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_european_history/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_european_history/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_european_history/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_european_history/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_european_history/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_european_history/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_european_history/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_geography/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_geography/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_geography/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_geography/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_geography/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_geography/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_geography/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_geography/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_geography/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_government_and_politics/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_government_and_politics/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_government_and_politics/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_government_and_politics/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_government_and_politics/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_government_and_politics/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_government_and_politics/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_government_and_politics/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_government_and_politics/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_macroeconomics/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_macroeconomics/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_macroeconomics/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_macroeconomics/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_macroeconomics/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_macroeconomics/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_macroeconomics/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_macroeconomics/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_macroeconomics/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_mathematics/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_mathematics/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_mathematics/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_mathematics/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_mathematics/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_mathematics/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_mathematics/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_mathematics/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_mathematics/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_microeconomics/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_microeconomics/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_microeconomics/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_microeconomics/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_microeconomics/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_microeconomics/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_microeconomics/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_microeconomics/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_microeconomics/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_physics/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_physics/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_physics/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_physics/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_physics/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_physics/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_physics/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_physics/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_physics/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_psychology/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_psychology/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_psychology/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_psychology/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_psychology/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_psychology/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_psychology/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_psychology/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_psychology/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_statistics/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_statistics/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_statistics/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_statistics/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_statistics/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_statistics/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_statistics/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_statistics/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_statistics/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_us_history/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_us_history/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_us_history/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_us_history/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_us_history/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_us_history/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_us_history/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_us_history/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_us_history/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_world_history/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_world_history/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_world_history/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_world_history/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_world_history/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_world_history/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_world_history/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_world_history/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/high_school_world_history/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/human_aging/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/human_aging/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/human_aging/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/human_aging/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/human_aging/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/human_aging/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/human_aging/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/human_aging/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/human_aging/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/human_sexuality/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/human_sexuality/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/human_sexuality/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/human_sexuality/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/human_sexuality/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/human_sexuality/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/human_sexuality/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/human_sexuality/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/human_sexuality/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/international_law/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/international_law/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/international_law/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/international_law/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/international_law/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/international_law/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/international_law/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/international_law/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/international_law/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/jurisprudence/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/jurisprudence/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/jurisprudence/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/jurisprudence/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/jurisprudence/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/jurisprudence/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/jurisprudence/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/jurisprudence/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/jurisprudence/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/logical_fallacies/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/logical_fallacies/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/logical_fallacies/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/logical_fallacies/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/logical_fallacies/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/logical_fallacies/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/logical_fallacies/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/logical_fallacies/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/logical_fallacies/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/machine_learning/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/machine_learning/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/machine_learning/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/machine_learning/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/machine_learning/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/machine_learning/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/machine_learning/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/machine_learning/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/machine_learning/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/management/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/management/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/management/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/management/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/management/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/management/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/management/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/management/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/management/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/marketing/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/marketing/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/marketing/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/marketing/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/marketing/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/marketing/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/marketing/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/marketing/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/marketing/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/medical_genetics/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/medical_genetics/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/medical_genetics/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/medical_genetics/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/medical_genetics/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/medical_genetics/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/medical_genetics/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/medical_genetics/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/medical_genetics/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/miscellaneous/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/miscellaneous/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/miscellaneous/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/miscellaneous/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/miscellaneous/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/miscellaneous/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/miscellaneous/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/miscellaneous/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/miscellaneous/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/moral_disputes/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/moral_disputes/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/moral_disputes/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/moral_disputes/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/moral_disputes/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/moral_disputes/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/moral_disputes/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/moral_disputes/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/moral_disputes/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/moral_scenarios/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/moral_scenarios/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/moral_scenarios/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/moral_scenarios/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/moral_scenarios/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/moral_scenarios/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/moral_scenarios/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/moral_scenarios/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/moral_scenarios/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/nutrition/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/nutrition/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/nutrition/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/nutrition/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/nutrition/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/nutrition/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/nutrition/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/nutrition/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/nutrition/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/philosophy/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/philosophy/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/philosophy/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/philosophy/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/philosophy/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/philosophy/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/philosophy/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/philosophy/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/philosophy/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/prehistory/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/prehistory/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/prehistory/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/prehistory/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/prehistory/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/prehistory/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/prehistory/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/prehistory/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/prehistory/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_accounting/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_accounting/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_accounting/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_accounting/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_accounting/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_accounting/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_accounting/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_accounting/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_accounting/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_law/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_law/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_law/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_law/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_law/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_law/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_law/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_law/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_law/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_medicine/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_medicine/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_medicine/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_medicine/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_medicine/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_medicine/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_medicine/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_medicine/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_medicine/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_psychology/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_psychology/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_psychology/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_psychology/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_psychology/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_psychology/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_psychology/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_psychology/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/professional_psychology/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/public_relations/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/public_relations/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/public_relations/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/public_relations/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/public_relations/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/public_relations/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/public_relations/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/public_relations/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/public_relations/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/security_studies/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/security_studies/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/security_studies/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/security_studies/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/security_studies/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/security_studies/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/security_studies/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/security_studies/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/security_studies/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/sociology/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/sociology/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/sociology/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/sociology/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/sociology/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/sociology/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/sociology/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/sociology/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/sociology/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/us_foreign_policy/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/us_foreign_policy/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/us_foreign_policy/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/us_foreign_policy/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/us_foreign_policy/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/us_foreign_policy/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/us_foreign_policy/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/us_foreign_policy/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/us_foreign_policy/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/virology/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/virology/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/virology/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/virology/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/virology/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/virology/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/virology/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/virology/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/virology/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/world_religions/dev/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/world_religions/dev/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/world_religions/dev/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/world_religions/test/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/world_religions/test/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/world_religions/test/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/world_religions/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/world_religions/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hails/mmlu_no_train/world_religions/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hellaswag/none/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hellaswag/none/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/hellaswag/none/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/nq_open/none/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/nq_open/none/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/nq_open/none/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/openbookqa/main/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/openbookqa/main/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/openbookqa/main/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/piqa/plain_text/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/piqa/plain_text/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/piqa/plain_text/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/sciq/none/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/sciq/none/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/sciq/none/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/social_i_qa/none/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/social_i_qa/none/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/social_i_qa/none/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/super_glue/cb/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/super_glue/cb/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/super_glue/cb/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/super_glue/copa/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/super_glue/copa/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/super_glue/copa/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/tau/commonsense_qa/none/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/tau/commonsense_qa/none/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/tau/commonsense_qa/none/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/trivia_qa/rc.wikipedia.nocontext/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/trivia_qa/rc.wikipedia.nocontext/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/trivia_qa/rc.wikipedia.nocontext/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/winogrande/winogrande_xl/validation/data-00000-of-00001.arrow +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/winogrande/winogrande_xl/validation/dataset_info.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/winogrande/winogrande_xl/validation/state.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/metrics.py +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_challenge/mc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_challenge/mc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_challenge/rc_0shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_challenge/rc_0shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_challenge/rc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_challenge/rc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_challenge/test_mc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_challenge/test_mc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_challenge/test_rc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_challenge/test_rc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_challenge/val_mc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_challenge/val_mc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_challenge/val_rc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_challenge/val_rc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_easy/mc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_easy/mc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_easy/rc_0shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_easy/rc_0shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_easy/rc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_easy/rc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_easy/test_mc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_easy/test_mc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_easy/test_rc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_easy/test_rc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_easy/val_mc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_easy/val_mc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_easy/val_rc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/arc_easy/val_rc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/boolq/mc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/boolq/mc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/boolq/rc_0shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/boolq/rc_0shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/boolq/rc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/boolq/rc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/boolq/val_mc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/boolq/val_mc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/boolq/val_rc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/boolq/val_rc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/codex_humaneval/gold_bpb_0shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/codex_humaneval/gold_bpb_0shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/codex_mbpp/gold_bpb_0shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/codex_mbpp/gold_bpb_0shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/copa/rc_0shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/copa/rc_0shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/copycolors/10way/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/copycolors/10way/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/copycolors/xl_10way/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/copycolors/xl_10way/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/csqa/mc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/csqa/mc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/csqa/rc_0shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/csqa/rc_0shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/csqa/rc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/csqa/rc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/csqa/val_mc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/csqa/val_mc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/csqa/val_rc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/csqa/val_rc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/gsm8k/gold_bpb_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/gsm8k/gold_bpb_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/hellaswag/mc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/hellaswag/mc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/hellaswag/rc_0shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/hellaswag/rc_0shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/hellaswag/rc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/hellaswag/rc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/hellaswag/val_mc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/hellaswag/val_mc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/hellaswag/val_rc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/hellaswag/val_rc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/minerva_math_algebra/gold_bpb_0shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/minerva_math_algebra/gold_bpb_0shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/minerva_math_counting_and_probability/gold_bpb_0shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/minerva_math_counting_and_probability/gold_bpb_0shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/minerva_math_geometry/gold_bpb_0shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/minerva_math_geometry/gold_bpb_0shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/minerva_math_intermediate_algebra/gold_bpb_0shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/minerva_math_intermediate_algebra/gold_bpb_0shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/minerva_math_number_theory/gold_bpb_0shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/minerva_math_number_theory/gold_bpb_0shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/minerva_math_prealgebra/gold_bpb_0shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/minerva_math_prealgebra/gold_bpb_0shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/minerva_math_precalculus/gold_bpb_0shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/minerva_math_precalculus/gold_bpb_0shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/openbookqa/mc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/openbookqa/mc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/openbookqa/rc_0shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/openbookqa/rc_0shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/openbookqa/rc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/openbookqa/rc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/openbookqa/test_mc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/openbookqa/test_mc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/openbookqa/test_rc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/openbookqa/test_rc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/openbookqa/val_mc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/openbookqa/val_mc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/openbookqa/val_rc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/openbookqa/val_rc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/piqa/mc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/piqa/mc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/piqa/rc_0shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/piqa/rc_0shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/piqa/rc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/piqa/rc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/piqa/val_mc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/piqa/val_mc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/piqa/val_rc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/piqa/val_rc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/sciq/rc_0shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/sciq/rc_0shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/socialiqa/mc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/socialiqa/mc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/socialiqa/rc_0shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/socialiqa/rc_0shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/socialiqa/rc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/socialiqa/rc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/socialiqa/val_mc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/socialiqa/val_mc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/socialiqa/val_rc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/socialiqa/val_rc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/winogrande/mc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/winogrande/mc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/winogrande/rc_0shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/winogrande/rc_0shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/winogrande/rc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/winogrande/rc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/winogrande/val_mc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/winogrande/val_mc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/winogrande/val_rc_5shot/config.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/oe_eval_tasks/winogrande/val_rc_5shot/requests.jsonl.gz +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/tokenizer.py +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/tokenizers/allenai_eleuther-ai-gpt-neox-20b-pii-special.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/tokenizers/allenai_gpt-neox-olmo-dolma-v1_5.json +0 -0
- {ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/util.py +0 -0
|
@@ -607,6 +607,18 @@ src/olmo_eval/oe_eval_tasks/arc_easy/val_mc_5shot/config.json
|
|
|
607
607
|
src/olmo_eval/oe_eval_tasks/arc_easy/val_mc_5shot/requests.jsonl.gz
|
|
608
608
|
src/olmo_eval/oe_eval_tasks/arc_easy/val_rc_5shot/config.json
|
|
609
609
|
src/olmo_eval/oe_eval_tasks/arc_easy/val_rc_5shot/requests.jsonl.gz
|
|
610
|
+
src/olmo_eval/oe_eval_tasks/basic_skills_arithmetic/rc_5shot/config.json
|
|
611
|
+
src/olmo_eval/oe_eval_tasks/basic_skills_arithmetic/rc_5shot/requests.jsonl.gz
|
|
612
|
+
src/olmo_eval/oe_eval_tasks/basic_skills_coding/rc_5shot/config.json
|
|
613
|
+
src/olmo_eval/oe_eval_tasks/basic_skills_coding/rc_5shot/requests.jsonl.gz
|
|
614
|
+
src/olmo_eval/oe_eval_tasks/basic_skills_common_knowledge/rc_5shot/config.json
|
|
615
|
+
src/olmo_eval/oe_eval_tasks/basic_skills_common_knowledge/rc_5shot/requests.jsonl.gz
|
|
616
|
+
src/olmo_eval/oe_eval_tasks/basic_skills_logical_reasoning/rc_5shot/config.json
|
|
617
|
+
src/olmo_eval/oe_eval_tasks/basic_skills_logical_reasoning/rc_5shot/requests.jsonl.gz
|
|
618
|
+
src/olmo_eval/oe_eval_tasks/basic_skills_pattern/rc_5shot/config.json
|
|
619
|
+
src/olmo_eval/oe_eval_tasks/basic_skills_pattern/rc_5shot/requests.jsonl.gz
|
|
620
|
+
src/olmo_eval/oe_eval_tasks/basic_skills_string_operations/rc_5shot/config.json
|
|
621
|
+
src/olmo_eval/oe_eval_tasks/basic_skills_string_operations/rc_5shot/requests.jsonl.gz
|
|
610
622
|
src/olmo_eval/oe_eval_tasks/boolq/mc_5shot/config.json
|
|
611
623
|
src/olmo_eval/oe_eval_tasks/boolq/mc_5shot/requests.jsonl.gz
|
|
612
624
|
src/olmo_eval/oe_eval_tasks/boolq/rc_0shot/config.json
|
|
@@ -0,0 +1,23 @@
|
|
|
1
|
+
{
|
|
2
|
+
"task_name": "basic_skills_arithmetic",
|
|
3
|
+
"task_hash": "56711b967c78d896ef51ba00aef5cfb0",
|
|
4
|
+
"task_config": {
|
|
5
|
+
"dataset_path": "basic_skills_arithmetic",
|
|
6
|
+
"primary_metric": "acc_per_token",
|
|
7
|
+
"split": "validation",
|
|
8
|
+
"num_shots": 5,
|
|
9
|
+
"metadata": {
|
|
10
|
+
"regimes": [
|
|
11
|
+
"OLMES-v0.1"
|
|
12
|
+
],
|
|
13
|
+
"alias": "basic_skills_arithmetic:rc::olmes"
|
|
14
|
+
},
|
|
15
|
+
"generation_kwargs": {},
|
|
16
|
+
"context_kwargs": {},
|
|
17
|
+
"dataset_name": "arithmetic",
|
|
18
|
+
"task_name": "basic_skills_arithmetic",
|
|
19
|
+
"version": 0,
|
|
20
|
+
"task_core": "basic_skills_arithmetic"
|
|
21
|
+
},
|
|
22
|
+
"current_date": "2025-05-12 00:06:28 UTC"
|
|
23
|
+
}
|
ai2_olmo_eval-0.7.2/src/olmo_eval/oe_eval_tasks/basic_skills_arithmetic/rc_5shot/requests.jsonl.gz
ADDED
|
Binary file
|
|
@@ -0,0 +1,23 @@
|
|
|
1
|
+
{
|
|
2
|
+
"task_name": "basic_skills_coding",
|
|
3
|
+
"task_hash": "d748d1d8ba506d3d234eed529ef62c3e",
|
|
4
|
+
"task_config": {
|
|
5
|
+
"dataset_path": "basic_skills_coding",
|
|
6
|
+
"primary_metric": "acc_per_token",
|
|
7
|
+
"split": "validation",
|
|
8
|
+
"num_shots": 5,
|
|
9
|
+
"metadata": {
|
|
10
|
+
"regimes": [
|
|
11
|
+
"OLMES-v0.1"
|
|
12
|
+
],
|
|
13
|
+
"alias": "basic_skills_coding:rc::olmes"
|
|
14
|
+
},
|
|
15
|
+
"generation_kwargs": {},
|
|
16
|
+
"context_kwargs": {},
|
|
17
|
+
"dataset_name": "coding",
|
|
18
|
+
"task_name": "basic_skills_coding",
|
|
19
|
+
"version": 0,
|
|
20
|
+
"task_core": "basic_skills_coding"
|
|
21
|
+
},
|
|
22
|
+
"current_date": "2025-05-12 00:06:28 UTC"
|
|
23
|
+
}
|
ai2_olmo_eval-0.7.2/src/olmo_eval/oe_eval_tasks/basic_skills_coding/rc_5shot/requests.jsonl.gz
ADDED
|
Binary file
|
ai2_olmo_eval-0.7.2/src/olmo_eval/oe_eval_tasks/basic_skills_common_knowledge/rc_5shot/config.json
ADDED
|
@@ -0,0 +1,23 @@
|
|
|
1
|
+
{
|
|
2
|
+
"task_name": "basic_skills_common_knowledge",
|
|
3
|
+
"task_hash": "51e88e759602f9085a8c779da375d833",
|
|
4
|
+
"task_config": {
|
|
5
|
+
"dataset_path": "basic_skills_common_knowledge",
|
|
6
|
+
"primary_metric": "acc_per_token",
|
|
7
|
+
"split": "validation",
|
|
8
|
+
"num_shots": 5,
|
|
9
|
+
"metadata": {
|
|
10
|
+
"regimes": [
|
|
11
|
+
"OLMES-v0.1"
|
|
12
|
+
],
|
|
13
|
+
"alias": "basic_skills_common_knowledge:rc::olmes"
|
|
14
|
+
},
|
|
15
|
+
"generation_kwargs": {},
|
|
16
|
+
"context_kwargs": {},
|
|
17
|
+
"dataset_name": "common_knowledge",
|
|
18
|
+
"task_name": "basic_skills_common_knowledge",
|
|
19
|
+
"version": 0,
|
|
20
|
+
"task_core": "basic_skills_common_knowledge"
|
|
21
|
+
},
|
|
22
|
+
"current_date": "2025-05-12 00:06:28 UTC"
|
|
23
|
+
}
|
|
Binary file
|
ai2_olmo_eval-0.7.2/src/olmo_eval/oe_eval_tasks/basic_skills_logical_reasoning/rc_5shot/config.json
ADDED
|
@@ -0,0 +1,23 @@
|
|
|
1
|
+
{
|
|
2
|
+
"task_name": "basic_skills_logical_reasoning",
|
|
3
|
+
"task_hash": "a3d406a2f4224604b7e6bbf68050691d",
|
|
4
|
+
"task_config": {
|
|
5
|
+
"dataset_path": "basic_skills_logical_reasoning",
|
|
6
|
+
"primary_metric": "acc_per_token",
|
|
7
|
+
"split": "validation",
|
|
8
|
+
"num_shots": 5,
|
|
9
|
+
"metadata": {
|
|
10
|
+
"regimes": [
|
|
11
|
+
"OLMES-v0.1"
|
|
12
|
+
],
|
|
13
|
+
"alias": "basic_skills_logical_reasoning:rc::olmes"
|
|
14
|
+
},
|
|
15
|
+
"generation_kwargs": {},
|
|
16
|
+
"context_kwargs": {},
|
|
17
|
+
"dataset_name": "logical_reasoning",
|
|
18
|
+
"task_name": "basic_skills_logical_reasoning",
|
|
19
|
+
"version": 0,
|
|
20
|
+
"task_core": "basic_skills_logical_reasoning"
|
|
21
|
+
},
|
|
22
|
+
"current_date": "2025-05-12 00:06:28 UTC"
|
|
23
|
+
}
|
|
Binary file
|
|
@@ -0,0 +1,23 @@
|
|
|
1
|
+
{
|
|
2
|
+
"task_name": "basic_skills_pattern",
|
|
3
|
+
"task_hash": "67983750bfb70a3b5cc34dcd67ee3c6a",
|
|
4
|
+
"task_config": {
|
|
5
|
+
"dataset_path": "basic_skills_pattern",
|
|
6
|
+
"primary_metric": "acc_per_token",
|
|
7
|
+
"split": "validation",
|
|
8
|
+
"num_shots": 5,
|
|
9
|
+
"metadata": {
|
|
10
|
+
"regimes": [
|
|
11
|
+
"OLMES-v0.1"
|
|
12
|
+
],
|
|
13
|
+
"alias": "basic_skills_pattern:rc::olmes"
|
|
14
|
+
},
|
|
15
|
+
"generation_kwargs": {},
|
|
16
|
+
"context_kwargs": {},
|
|
17
|
+
"dataset_name": "pattern",
|
|
18
|
+
"task_name": "basic_skills_pattern",
|
|
19
|
+
"version": 0,
|
|
20
|
+
"task_core": "basic_skills_pattern"
|
|
21
|
+
},
|
|
22
|
+
"current_date": "2025-05-12 00:06:28 UTC"
|
|
23
|
+
}
|
ai2_olmo_eval-0.7.2/src/olmo_eval/oe_eval_tasks/basic_skills_pattern/rc_5shot/requests.jsonl.gz
ADDED
|
Binary file
|
ai2_olmo_eval-0.7.2/src/olmo_eval/oe_eval_tasks/basic_skills_string_operations/rc_5shot/config.json
ADDED
|
@@ -0,0 +1,23 @@
|
|
|
1
|
+
{
|
|
2
|
+
"task_name": "basic_skills_string_operations",
|
|
3
|
+
"task_hash": "8e5fdc7697f1bc7b0c9487a6fa682e45",
|
|
4
|
+
"task_config": {
|
|
5
|
+
"dataset_path": "basic_skills_string_operations",
|
|
6
|
+
"primary_metric": "acc_per_token",
|
|
7
|
+
"split": "validation",
|
|
8
|
+
"num_shots": 5,
|
|
9
|
+
"metadata": {
|
|
10
|
+
"regimes": [
|
|
11
|
+
"OLMES-v0.1"
|
|
12
|
+
],
|
|
13
|
+
"alias": "basic_skills_string_operations:rc::olmes"
|
|
14
|
+
},
|
|
15
|
+
"generation_kwargs": {},
|
|
16
|
+
"context_kwargs": {},
|
|
17
|
+
"dataset_name": "string_operations",
|
|
18
|
+
"task_name": "basic_skills_string_operations",
|
|
19
|
+
"version": 0,
|
|
20
|
+
"task_core": "basic_skills_string_operations"
|
|
21
|
+
},
|
|
22
|
+
"current_date": "2025-05-12 00:06:28 UTC"
|
|
23
|
+
}
|
|
Binary file
|
|
@@ -1704,6 +1704,46 @@ LABEL_TO_TASK_MAP_ORIG = {
|
|
|
1704
1704
|
OEEvalTask,
|
|
1705
1705
|
{"dataset_path": "arc_easy", "dataset_name": "rc_5shot", "metric_type": "acc"},
|
|
1706
1706
|
),
|
|
1707
|
+
"basic_skills_arithmetic_rc_5shot": (
|
|
1708
|
+
OEEvalTask,
|
|
1709
|
+
{
|
|
1710
|
+
"dataset_path": "basic_skills_arithmetic",
|
|
1711
|
+
"dataset_name": "rc_5shot",
|
|
1712
|
+
"metric_type": "acc",
|
|
1713
|
+
},
|
|
1714
|
+
),
|
|
1715
|
+
"basic_skills_coding_rc_5shot": (
|
|
1716
|
+
OEEvalTask,
|
|
1717
|
+
{"dataset_path": "basic_skills_coding", "dataset_name": "rc_5shot", "metric_type": "acc"},
|
|
1718
|
+
),
|
|
1719
|
+
"basic_skills_common_knowledge_rc_5shot": (
|
|
1720
|
+
OEEvalTask,
|
|
1721
|
+
{
|
|
1722
|
+
"dataset_path": "basic_skills_common_knowledge",
|
|
1723
|
+
"dataset_name": "rc_5shot",
|
|
1724
|
+
"metric_type": "acc",
|
|
1725
|
+
},
|
|
1726
|
+
),
|
|
1727
|
+
"basic_skills_logical_reasoning_rc_5shot": (
|
|
1728
|
+
OEEvalTask,
|
|
1729
|
+
{
|
|
1730
|
+
"dataset_path": "basic_skills_logical_reasoning",
|
|
1731
|
+
"dataset_name": "rc_5shot",
|
|
1732
|
+
"metric_type": "acc",
|
|
1733
|
+
},
|
|
1734
|
+
),
|
|
1735
|
+
"basic_skills_pattern_rc_5shot": (
|
|
1736
|
+
OEEvalTask,
|
|
1737
|
+
{"dataset_path": "basic_skills_pattern", "dataset_name": "rc_5shot", "metric_type": "acc"},
|
|
1738
|
+
),
|
|
1739
|
+
"basic_skills_string_operations_rc_5shot": (
|
|
1740
|
+
OEEvalTask,
|
|
1741
|
+
{
|
|
1742
|
+
"dataset_path": "basic_skills_string_operations",
|
|
1743
|
+
"dataset_name": "rc_5shot",
|
|
1744
|
+
"metric_type": "acc",
|
|
1745
|
+
},
|
|
1746
|
+
),
|
|
1707
1747
|
"boolq_mc_5shot": (
|
|
1708
1748
|
OEEvalTask,
|
|
1709
1749
|
{"dataset_path": "boolq", "dataset_name": "mc_5shot", "metric_type": "acc"},
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{ai2_olmo_eval-0.7.1 → ai2_olmo_eval-0.7.2}/src/olmo_eval/hf_datasets/glue/rte/validation/state.json
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|