nemo-evaluator-launcher 0.1.21__py3-none-any.whl → 0.1.23__py3-none-any.whl

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.
@@ -14,6 +14,7 @@
14
14
  # limitations under the License.
15
15
  #
16
16
  import base64
17
+ import copy
17
18
  import datetime
18
19
  from dataclasses import dataclass
19
20
  from typing import Optional
@@ -170,7 +171,9 @@ def get_eval_factory_command(
170
171
  + "&& $cmd run_eval --run_config config_ef.yaml"
171
172
  )
172
173
 
173
- overrides = merged_nemo_evaluator_config.get("overrides", {})
174
+ # NOTE: see note and test about deprecating that.
175
+ overrides = copy.deepcopy(dict(cfg.evaluation.get("overrides", {})))
176
+ overrides.update(dict(user_task_config.get("overrides", {})))
174
177
  # NOTE(dfridman): Temporary fix to make sure that the overrides arg is not split into multiple lines.
175
178
  # Consider passing a JSON object on Eval Factory side
176
179
  overrides = {
@@ -16,7 +16,7 @@
16
16
  # Below is the _next_ version that will be published, not the currently published one.
17
17
  MAJOR = 0
18
18
  MINOR = 1
19
- PATCH = 21
19
+ PATCH = 23
20
20
  PRE_RELEASE = ""
21
21
 
22
22
  # Use the following formatting: (major, minor, patch, pre-release)
@@ -226,7 +226,7 @@ required_env_vars = []
226
226
  [bigcode-evaluation-harness.tasks.completions.humaneval]
227
227
  required_env_vars = []
228
228
 
229
- [bigcode-evaluation-harness.tasks.completions.humaneval_instruct]
229
+ [bigcode-evaluation-harness.tasks.chat.humaneval_instruct]
230
230
 
231
231
 
232
232
  ###############################################################################
@@ -304,29 +304,29 @@ required_env_vars = []
304
304
 
305
305
  ###############################################################################
306
306
  # NOTE(wprazuch): to verify if the tasks need any env var setting
307
- [nemo-skills]
307
+ [nemo_skills]
308
308
  container = "nvcr.io/nvidia/eval-factory/nemo_skills:25.09.1"
309
309
 
310
- [nemo-skills.tasks.chat.ns_aime2024]
311
- required_env_vars = []
310
+ [nemo_skills.tasks.chat.ns_aime2024]
311
+ required_env_vars = ["JUDGE_API_KEY"]
312
312
 
313
- [nemo-skills.tasks.chat.ns_aime2025]
313
+ [nemo_skills.tasks.chat.ns_aime2025]
314
314
  required_env_vars = []
315
315
 
316
- [nemo-skills.tasks.chat.ns_bfcl_v3]
316
+ [nemo_skills.tasks.chat.ns_bfcl_v3]
317
317
  required_env_vars = []
318
318
 
319
- [nemo-skills.tasks.chat.ns_gpqa]
320
- required_env_vars = []
319
+ [nemo_skills.tasks.chat.ns_gpqa]
320
+ required_env_vars = ["HF_TOKEN"]
321
321
 
322
- [nemo-skills.tasks.chat.ns_hle]
322
+ [nemo_skills.tasks.chat.ns_hle]
323
323
  required_env_vars = []
324
324
 
325
- [nemo-skills.tasks.chat.ns_mmlu]
326
- required_env_vars = []
325
+ [nemo_skills.tasks.chat.ns_mmlu]
326
+ required_env_vars = ["HF_TOKEN"]
327
327
 
328
- [nemo-skills.tasks.chat.ns_mmlu_pro]
329
- required_env_vars = []
328
+ [nemo_skills.tasks.chat.ns_mmlu_pro]
329
+ required_env_vars = ["HF_TOKEN"]
330
330
 
331
331
  ###############################################################################
332
332
  [safety-harness]
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: nemo-evaluator-launcher
3
- Version: 0.1.21
3
+ Version: 0.1.23
4
4
  Summary: Launcher for the evaluations provided by NeMo Evaluator containers with different runtime backends
5
5
  Author: NVIDIA
6
6
  Author-email: nemo-toolkit@nvidia.com
@@ -478,7 +478,7 @@ Requires-Dist: mlflow>=2.8.0; extra == "mlflow"
478
478
  Provides-Extra: wandb
479
479
  Requires-Dist: wandb>=0.15.0; extra == "wandb"
480
480
  Provides-Extra: gsheets
481
- Requires-Dist: gsheets>=0.1.0; extra == "gsheets"
481
+ Requires-Dist: gspread>=5.0.0; extra == "gsheets"
482
482
  Provides-Extra: exporters
483
483
  Requires-Dist: mlflow; extra == "exporters"
484
484
  Requires-Dist: wandb; extra == "exporters"
@@ -1,5 +1,5 @@
1
1
  nemo_evaluator_launcher/__init__.py,sha256=GT38zGwbvBOSeU52WCRx-n9N49LvLGEV1PItgKC8orA,2320
2
- nemo_evaluator_launcher/package_info.py,sha256=oc2OZPiKTMsAYyASxBeE1qPWFlJvxPh7Ey9ajBjdEOk,1586
2
+ nemo_evaluator_launcher/package_info.py,sha256=BXDKj0jZhJPCGvEBfg-lEvW1XIDijovEWP6SqRlqfdA,1586
3
3
  nemo_evaluator_launcher/api/__init__.py,sha256=U9q_MJK2vRsFaymanhyy0nD1SNAZQZC8oY45RXPX7ac,1024
4
4
  nemo_evaluator_launcher/api/functional.py,sha256=T1HTIeiTXb-APWP7lPPTwFam4vFOApZCScRi6tMp538,27648
5
5
  nemo_evaluator_launcher/api/types.py,sha256=W7ZQ9ZTPR6YxInxxsKE6NxuuQAg4pVYz6SRmFCFxY0A,3635
@@ -16,7 +16,7 @@ nemo_evaluator_launcher/cli/status.py,sha256=ANdu0JYnfKNvd1gXmdu_0FrbPG-g0A_R4le
16
16
  nemo_evaluator_launcher/cli/version.py,sha256=puMwIvkmfD3HESjftdTSP6T3Nc8J4cbz8uXWHJcTemY,2030
17
17
  nemo_evaluator_launcher/common/__init__.py,sha256=6-xb4KpG8-lZbWBI42c_Gax-Sq0kMSW8UG0Vn8dOBlo,744
18
18
  nemo_evaluator_launcher/common/execdb.py,sha256=WPzg5Iu2ojvFpBuYahSt3voP_iEUpoO8NgqMLUBwFxA,9767
19
- nemo_evaluator_launcher/common/helpers.py,sha256=ohfTQoltPFG4lDbKbWR3KgcS7Nhlw2cTiEYml_aPhjA,11283
19
+ nemo_evaluator_launcher/common/helpers.py,sha256=7O0cZYGndVaGYhu0npC0faspuD5NeBr2DfzwyAFvPSY,11422
20
20
  nemo_evaluator_launcher/common/logging_utils.py,sha256=LSMGeCyc_QwA6NyyNMKWgKNArz6HBlULEcZy33nlenQ,12214
21
21
  nemo_evaluator_launcher/common/mapping.py,sha256=tD3jWN7rm9-iJEFlENhYMt7adz8DKs67g3Xd43XIAMM,10731
22
22
  nemo_evaluator_launcher/common/printing_utils.py,sha256=YICPY-KhxjL5QNEFJNvYfnj6_ArkZURDdP1pizqY-yU,2368
@@ -51,10 +51,10 @@ nemo_evaluator_launcher/exporters/mlflow.py,sha256=qFEe9774s31Uybpah7kiz4BfZUDMy
51
51
  nemo_evaluator_launcher/exporters/registry.py,sha256=XsPTv_SBAFjcErO6BJ3OHqs3EvXQpLeyKRJuK9Ql4_M,1299
52
52
  nemo_evaluator_launcher/exporters/utils.py,sha256=XZVgTDmoa20tjEMwez0oUSpYpjt3ILV75D4KWuHtZ80,23119
53
53
  nemo_evaluator_launcher/exporters/wandb.py,sha256=1qRUV_YE1Ury7rH7KH65AabR7gmEQ38kXBh2XrfiEpE,18082
54
- nemo_evaluator_launcher/resources/mapping.toml,sha256=3Dgvx_C9M_TdxQ2nZn-QkNEYY7Y3MUMKhCMbBv8cIP4,12233
55
- nemo_evaluator_launcher-0.1.21.dist-info/licenses/LICENSE,sha256=DyGb0fqHPZAsd_uXHA0DGcOCqsvrNsImuLC0Ts4s1zI,23413
56
- nemo_evaluator_launcher-0.1.21.dist-info/METADATA,sha256=Nww4E5YEWFRG4tTVnrvAjLSXzPYxs27C5EDaL-y9W0U,28725
57
- nemo_evaluator_launcher-0.1.21.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
58
- nemo_evaluator_launcher-0.1.21.dist-info/entry_points.txt,sha256=64z1T5GKSB9PW1fCENQuor6X6eqH1rcfg0NQGfKrEy8,130
59
- nemo_evaluator_launcher-0.1.21.dist-info/top_level.txt,sha256=5PvawNm9TXKqPRjZita1xPOtFiMOipcoRf50FI1iY3s,24
60
- nemo_evaluator_launcher-0.1.21.dist-info/RECORD,,
54
+ nemo_evaluator_launcher/resources/mapping.toml,sha256=7M0LAFHI_EUAEPgpPBP_5HxugM0EUa8mUqg-dW4mKmE,12271
55
+ nemo_evaluator_launcher-0.1.23.dist-info/licenses/LICENSE,sha256=DyGb0fqHPZAsd_uXHA0DGcOCqsvrNsImuLC0Ts4s1zI,23413
56
+ nemo_evaluator_launcher-0.1.23.dist-info/METADATA,sha256=QupygFYxAQzCpOAAnGGVjl5QLvbQLqKNZE2VPmRvwAI,28725
57
+ nemo_evaluator_launcher-0.1.23.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
58
+ nemo_evaluator_launcher-0.1.23.dist-info/entry_points.txt,sha256=64z1T5GKSB9PW1fCENQuor6X6eqH1rcfg0NQGfKrEy8,130
59
+ nemo_evaluator_launcher-0.1.23.dist-info/top_level.txt,sha256=5PvawNm9TXKqPRjZita1xPOtFiMOipcoRf50FI1iY3s,24
60
+ nemo_evaluator_launcher-0.1.23.dist-info/RECORD,,