evalscope 0.7.0__py3-none-any.whl → 0.7.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of evalscope might be problematic. Click here for more details.

@@ -6,7 +6,8 @@ from opencompass.tasks import OpenICLInferTask
6
6
 
7
7
 
8
8
  with read_base():
9
- from opencompass.configs.summarizers.medium import summarizer
9
+ # from opencompass.configs.summarizers.medium import summarizer
10
+ # from opencompass.configs.summarizers.PMMEval import summarizer
10
11
  from evalscope.backend.opencompass.tasks.eval_datasets import datasets
11
12
 
12
13
  # 1. Get datasets
@@ -51,6 +51,7 @@ with read_base():
51
51
  from opencompass.configs.datasets.triviaqa.triviaqa_gen_2121ce import triviaqa_datasets
52
52
  from opencompass.configs.datasets.cmb.cmb_gen_dfb5c4 import cmb_datasets
53
53
  from opencompass.configs.datasets.cmmlu.cmmlu_gen_c13365 import cmmlu_datasets
54
+ from opencompass.configs.datasets.PMMEval.pmmeval_gen import PMMEval_datasets
54
55
 
55
56
  # Note: to be supported
56
57
  # from opencompass.configs.datasets.flores.flores_gen_806ede import flores_datasets
@@ -151,6 +151,6 @@ class OpenaiPlugin(ApiPluginBase):
151
151
  elif input_tokens is None and output_tokens is None: # no usage info get.
152
152
  input_tokens = 0
153
153
  output_tokens = 0
154
- logger.warning('No usage info get.')
154
+ logger.warning('No usage information found. Please specify `--tokenizer-path` to generate usage details.')
155
155
 
156
156
  return input_tokens, output_tokens
evalscope/version.py CHANGED
@@ -1,4 +1,4 @@
1
1
  # Copyright (c) Alibaba, Inc. and its affiliates.
2
2
 
3
- __version__ = "0.7.0"
4
- __release_datetime__ = "2024-11-28 15:00:00"
3
+ __version__ = '0.7.2'
4
+ __release_datetime__ = '2024-12-04 12:00:00'
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: evalscope
3
- Version: 0.7.0
3
+ Version: 0.7.2
4
4
  Summary: EvalScope: Lightweight LLMs Evaluation Framework
5
5
  Home-page: https://github.com/modelscope/evalscope
6
6
  Author: ModelScope team
@@ -29,7 +29,7 @@ Requires-Dist: nltk>=3.9
29
29
  Requires-Dist: openai
30
30
  Requires-Dist: pandas
31
31
  Requires-Dist: plotly
32
- Requires-Dist: pyarrow<=17.0.0
32
+ Requires-Dist: pyarrow
33
33
  Requires-Dist: pympler
34
34
  Requires-Dist: pyyaml
35
35
  Requires-Dist: regex
@@ -62,7 +62,7 @@ Requires-Dist: nltk>=3.9; extra == "all"
62
62
  Requires-Dist: openai; extra == "all"
63
63
  Requires-Dist: pandas; extra == "all"
64
64
  Requires-Dist: plotly; extra == "all"
65
- Requires-Dist: pyarrow<=17.0.0; extra == "all"
65
+ Requires-Dist: pyarrow; extra == "all"
66
66
  Requires-Dist: pympler; extra == "all"
67
67
  Requires-Dist: pyyaml; extra == "all"
68
68
  Requires-Dist: regex; extra == "all"
@@ -81,7 +81,7 @@ Requires-Dist: torch; extra == "all"
81
81
  Requires-Dist: tqdm; extra == "all"
82
82
  Requires-Dist: transformers>=4.33; extra == "all"
83
83
  Requires-Dist: transformers-stream-generator; extra == "all"
84
- Requires-Dist: ms-opencompass>=0.1.3; extra == "all"
84
+ Requires-Dist: ms-opencompass>=0.1.4; extra == "all"
85
85
  Requires-Dist: ms-vlmeval>=0.0.9; extra == "all"
86
86
  Requires-Dist: mteb==1.19.4; extra == "all"
87
87
  Requires-Dist: ragas==0.2.5; extra == "all"
@@ -119,7 +119,7 @@ Requires-Dist: tqdm; extra == "inner"
119
119
  Requires-Dist: transformers<4.43,>=4.33; extra == "inner"
120
120
  Requires-Dist: transformers-stream-generator; extra == "inner"
121
121
  Provides-Extra: opencompass
122
- Requires-Dist: ms-opencompass>=0.1.3; extra == "opencompass"
122
+ Requires-Dist: ms-opencompass>=0.1.4; extra == "opencompass"
123
123
  Provides-Extra: perf
124
124
  Requires-Dist: aiohttp; extra == "perf"
125
125
  Requires-Dist: fastapi; extra == "perf"
@@ -6,15 +6,15 @@ evalscope/run.py,sha256=uAXtaxIBcR94jyfHGFAecuzn0y71oLgu-d9VOohCJAw,18738
6
6
  evalscope/run_arena.py,sha256=BCWCAiX0BQ9pLMIq08svEcd-IoFr75gFShpV88robIY,8963
7
7
  evalscope/run_ms.py,sha256=UtJoGnah64SXigTawJQWTi_TEGjr7Td0rjCTaO-htL8,6028
8
8
  evalscope/summarizer.py,sha256=rIyML8HpjQxIpXg8KvQ0CzOS6xMS-JHZh6kUZzkaRsk,6640
9
- evalscope/version.py,sha256=KtYzabHQSFovvIs99J7glrRj7yrdxYKzKpbzzM2lORk,118
9
+ evalscope/version.py,sha256=H1a8g__rL44KWkB8_7MGtmAlZo0QAG-Yz8ElN-SGMdA,118
10
10
  evalscope/backend/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
11
11
  evalscope/backend/base.py,sha256=5BLrDNNwxsGp35zorD-kphmN15tlBbkuuqwkz8jWZq0,876
12
12
  evalscope/backend/opencompass/__init__.py,sha256=UP_TW5KBq6V_Nvqkeb7PGvGGX3rVYussT43npwCwDgE,135
13
13
  evalscope/backend/opencompass/api_meta_template.py,sha256=sBW0XbVDOKeJ7mVUDLhmcG4e0yClw3eluazdp_8wtgQ,1753
14
14
  evalscope/backend/opencompass/backend_manager.py,sha256=_eg82FLAVxQ6t5e1OqlyuxZcngqD8rxvI5EijLUh_zI,10294
15
15
  evalscope/backend/opencompass/tasks/__init__.py,sha256=I_ANdxdcIHpkIzIXc1yKOlWwzb4oY0FwTPq1kYtgzQw,50
16
- evalscope/backend/opencompass/tasks/eval_api.py,sha256=12lrgDpMzZ1XBRboq5TEOovDPCMDwwGCJoRT78Ox_yo,1108
17
- evalscope/backend/opencompass/tasks/eval_datasets.py,sha256=3V67A2LSj_XaiGd9fqdKpxpzyNrfynCH3UnhaBtAaqc,5326
16
+ evalscope/backend/opencompass/tasks/eval_api.py,sha256=NRIbDqhM_5JD0zBGinhptxrSmTjTelO_RaiaAht7ee0,1179
17
+ evalscope/backend/opencompass/tasks/eval_datasets.py,sha256=nWrPfItIYgPLJUXyu9vZmOmUUjku0BEFCV94Ss12pVU,5408
18
18
  evalscope/backend/rag_eval/__init__.py,sha256=8om6TVnTMmyTEQt1jBuUQA4UfIzyps-_-ih90H_Qjio,284
19
19
  evalscope/backend/rag_eval/backend_manager.py,sha256=jmO-UMu6_iOXMnl4--PrMWCsnIYEhsbiX017rtURqm0,2997
20
20
  evalscope/backend/rag_eval/clip_benchmark/__init__.py,sha256=gDXCiRUTSeGQHxd5SjQsnphMqHJ2si2jywRiHvujEOg,150
@@ -188,7 +188,7 @@ evalscope/perf/plugin/api/__init__.py,sha256=Ckzbq4CkSMVQTedQcDHCYlRd6FTwQAElt2m
188
188
  evalscope/perf/plugin/api/base.py,sha256=B_H04qKx7eRTn155rnDrbTYur7PK1mvxfQKYcqYbndU,2118
189
189
  evalscope/perf/plugin/api/custom_api.py,sha256=NQ2LDKsFQfExVRx2prcmfORCBzxxibfhpVHhB-lxAO4,3776
190
190
  evalscope/perf/plugin/api/dashscope_api.py,sha256=0p9f6ujppS_H6w7wsIbRVNnCkHXtRemIai5Bhdogla4,3826
191
- evalscope/perf/plugin/api/openai_api.py,sha256=I9yM4ouY1-xlBz4bYQ_62FZHKX4F3YCsg5GCqLU_9xA,6938
191
+ evalscope/perf/plugin/api/openai_api.py,sha256=dYUzRwQ9xLoJUTtZHfoI1_3pV9VevdK7EV_yfngDidA,7008
192
192
  evalscope/perf/plugin/datasets/__init__.py,sha256=9mz2TnVHhxbEKAS9pLbKMQuIoShNlZpGiRo9e2RQLUs,490
193
193
  evalscope/perf/plugin/datasets/base.py,sha256=1U_efZuU2ZdWV9UVAqFu1fx9_0PST_sJnaSIqbNvTF4,1787
194
194
  evalscope/perf/plugin/datasets/custom.py,sha256=_GSC5yR90_BjcRjdJqrJT2vHQAzskz5XxYOxngUM2Pg,815
@@ -278,9 +278,9 @@ tests/swift/test_run_swift_vlm_eval.py,sha256=p2i2ZRj-vG1YsQGsemvQLHcyhjy1EmUChy
278
278
  tests/swift/test_run_swift_vlm_jugde_eval.py,sha256=c31jwQle_97ru5Dep91qsAqYjR1HDm1O9YZihRr0u0s,6018
279
279
  tests/vlm/__init__.py,sha256=I_ANdxdcIHpkIzIXc1yKOlWwzb4oY0FwTPq1kYtgzQw,50
280
280
  tests/vlm/test_vlmeval.py,sha256=21xi0nu4ghDB6_X-Pol7pTfK7aYkAYOp82TQ-MSQv-I,1757
281
- evalscope-0.7.0.dist-info/LICENSE,sha256=K_2M03pN0PxVMyx9IQUKsHGhhDMkw5ryQ02rlMvzj3I,11416
282
- evalscope-0.7.0.dist-info/METADATA,sha256=W-NWOZwX9X-VN_LDI16aW6TxcOLJ3Um9dvms8bs28Bw,23796
283
- evalscope-0.7.0.dist-info/WHEEL,sha256=tZoeGjtWxWRfdplE7E3d45VPlLNQnvbKiYnx7gwAy8A,92
284
- evalscope-0.7.0.dist-info/entry_points.txt,sha256=Qr4oTgGhg_K-iUtKwVH6lWUhFHDUiH9trIqydHGTEug,56
285
- evalscope-0.7.0.dist-info/top_level.txt,sha256=Yv0iprOqZQ4rfUO-AWJp7Ni6m0Twxny1yvZwO-8hUDM,16
286
- evalscope-0.7.0.dist-info/RECORD,,
281
+ evalscope-0.7.2.dist-info/LICENSE,sha256=K_2M03pN0PxVMyx9IQUKsHGhhDMkw5ryQ02rlMvzj3I,11416
282
+ evalscope-0.7.2.dist-info/METADATA,sha256=k4bfDc1QrLXGBfztQbobpQDp1ML1sUjqZrKylotW-Ck,23780
283
+ evalscope-0.7.2.dist-info/WHEEL,sha256=tZoeGjtWxWRfdplE7E3d45VPlLNQnvbKiYnx7gwAy8A,92
284
+ evalscope-0.7.2.dist-info/entry_points.txt,sha256=Qr4oTgGhg_K-iUtKwVH6lWUhFHDUiH9trIqydHGTEug,56
285
+ evalscope-0.7.2.dist-info/top_level.txt,sha256=Yv0iprOqZQ4rfUO-AWJp7Ni6m0Twxny1yvZwO-8hUDM,16
286
+ evalscope-0.7.2.dist-info/RECORD,,