nemo-evaluator-launcher 0.1.21__tar.gz → 0.1.23__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of nemo-evaluator-launcher might be problematic. Click here for more details.
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/PKG-INFO +2 -2
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/pyproject.toml +1 -1
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/common/helpers.py +4 -1
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/package_info.py +1 -1
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/resources/mapping.toml +13 -13
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher.egg-info/PKG-INFO +2 -2
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher.egg-info/requires.txt +1 -1
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/LICENSE +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/README.md +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/setup.cfg +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/__init__.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/api/__init__.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/api/functional.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/api/types.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/api/utils.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/cli/__init__.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/cli/export.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/cli/info.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/cli/kill.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/cli/ls_runs.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/cli/ls_tasks.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/cli/main.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/cli/run.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/cli/status.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/cli/version.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/common/__init__.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/common/execdb.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/common/logging_utils.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/common/mapping.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/common/printing_utils.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/configs/__init__.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/configs/default.yaml +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/configs/deployment/generic.yaml +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/configs/deployment/nim.yaml +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/configs/deployment/none.yaml +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/configs/deployment/sglang.yaml +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/configs/deployment/trtllm.yaml +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/configs/deployment/vllm.yaml +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/configs/execution/lepton/default.yaml +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/configs/execution/local.yaml +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/configs/execution/slurm/default.yaml +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/executors/__init__.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/executors/base.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/executors/lepton/__init__.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/executors/lepton/deployment_helpers.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/executors/lepton/executor.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/executors/lepton/job_helpers.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/executors/local/__init__.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/executors/local/executor.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/executors/local/run.template.sh +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/executors/registry.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/executors/slurm/__init__.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/executors/slurm/executor.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/exporters/__init__.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/exporters/base.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/exporters/gsheets.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/exporters/local.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/exporters/mlflow.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/exporters/registry.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/exporters/utils.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher/exporters/wandb.py +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher.egg-info/SOURCES.txt +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher.egg-info/dependency_links.txt +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher.egg-info/entry_points.txt +0 -0
- {nemo_evaluator_launcher-0.1.21 → nemo_evaluator_launcher-0.1.23}/src/nemo_evaluator_launcher.egg-info/top_level.txt +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: nemo-evaluator-launcher
|
|
3
|
-
Version: 0.1.21
|
|
3
|
+
Version: 0.1.23
|
|
4
4
|
Summary: Launcher for the evaluations provided by NeMo Evaluator containers with different runtime backends
|
|
5
5
|
Author: NVIDIA
|
|
6
6
|
Author-email: nemo-toolkit@nvidia.com
|
|
@@ -478,7 +478,7 @@ Requires-Dist: mlflow>=2.8.0; extra == "mlflow"
|
|
|
478
478
|
Provides-Extra: wandb
|
|
479
479
|
Requires-Dist: wandb>=0.15.0; extra == "wandb"
|
|
480
480
|
Provides-Extra: gsheets
|
|
481
|
-
Requires-Dist:
|
|
481
|
+
Requires-Dist: gspread>=5.0.0; extra == "gsheets"
|
|
482
482
|
Provides-Extra: exporters
|
|
483
483
|
Requires-Dist: mlflow; extra == "exporters"
|
|
484
484
|
Requires-Dist: wandb; extra == "exporters"
|
|
@@ -40,7 +40,7 @@ repository = "https://github.com/NVIDIA-NeMo/Evaluator/packages/nemo-evaluator-l
|
|
|
40
40
|
[project.optional-dependencies]
|
|
41
41
|
mlflow = ["mlflow>=2.8.0"]
|
|
42
42
|
wandb = ["wandb>=0.15.0"]
|
|
43
|
-
gsheets = ["
|
|
43
|
+
gsheets = ["gspread>=5.0.0"]
|
|
44
44
|
exporters = ["mlflow", "wandb", "gsheets"]
|
|
45
45
|
all = ["mlflow", "wandb", "gsheets"]
|
|
46
46
|
|
|
@@ -14,6 +14,7 @@
|
|
|
14
14
|
# limitations under the License.
|
|
15
15
|
#
|
|
16
16
|
import base64
|
|
17
|
+
import copy
|
|
17
18
|
import datetime
|
|
18
19
|
from dataclasses import dataclass
|
|
19
20
|
from typing import Optional
|
|
@@ -170,7 +171,9 @@ def get_eval_factory_command(
|
|
|
170
171
|
+ "&& $cmd run_eval --run_config config_ef.yaml"
|
|
171
172
|
)
|
|
172
173
|
|
|
173
|
-
|
|
174
|
+
# NOTE: see note and test about deprecating that.
|
|
175
|
+
overrides = copy.deepcopy(dict(cfg.evaluation.get("overrides", {})))
|
|
176
|
+
overrides.update(dict(user_task_config.get("overrides", {})))
|
|
174
177
|
# NOTE(dfridman): Temporary fix to make sure that the overrides arg is not split into multiple lines.
|
|
175
178
|
# Consider passing a JSON object on Eval Factory side
|
|
176
179
|
overrides = {
|
|
@@ -226,7 +226,7 @@ required_env_vars = []
|
|
|
226
226
|
[bigcode-evaluation-harness.tasks.completions.humaneval]
|
|
227
227
|
required_env_vars = []
|
|
228
228
|
|
|
229
|
-
[bigcode-evaluation-harness.tasks.
|
|
229
|
+
[bigcode-evaluation-harness.tasks.chat.humaneval_instruct]
|
|
230
230
|
|
|
231
231
|
|
|
232
232
|
###############################################################################
|
|
@@ -304,29 +304,29 @@ required_env_vars = []
|
|
|
304
304
|
|
|
305
305
|
###############################################################################
|
|
306
306
|
# NOTE(wprazuch): to verify if the tasks need any env var setting
|
|
307
|
-
[
|
|
307
|
+
[nemo_skills]
|
|
308
308
|
container = "nvcr.io/nvidia/eval-factory/nemo_skills:25.09.1"
|
|
309
309
|
|
|
310
|
-
[
|
|
311
|
-
required_env_vars = []
|
|
310
|
+
[nemo_skills.tasks.chat.ns_aime2024]
|
|
311
|
+
required_env_vars = ["JUDGE_API_KEY"]
|
|
312
312
|
|
|
313
|
-
[
|
|
313
|
+
[nemo_skills.tasks.chat.ns_aime2025]
|
|
314
314
|
required_env_vars = []
|
|
315
315
|
|
|
316
|
-
[
|
|
316
|
+
[nemo_skills.tasks.chat.ns_bfcl_v3]
|
|
317
317
|
required_env_vars = []
|
|
318
318
|
|
|
319
|
-
[
|
|
320
|
-
required_env_vars = []
|
|
319
|
+
[nemo_skills.tasks.chat.ns_gpqa]
|
|
320
|
+
required_env_vars = ["HF_TOKEN"]
|
|
321
321
|
|
|
322
|
-
[
|
|
322
|
+
[nemo_skills.tasks.chat.ns_hle]
|
|
323
323
|
required_env_vars = []
|
|
324
324
|
|
|
325
|
-
[
|
|
326
|
-
required_env_vars = []
|
|
325
|
+
[nemo_skills.tasks.chat.ns_mmlu]
|
|
326
|
+
required_env_vars = ["HF_TOKEN"]
|
|
327
327
|
|
|
328
|
-
[
|
|
329
|
-
required_env_vars = []
|
|
328
|
+
[nemo_skills.tasks.chat.ns_mmlu_pro]
|
|
329
|
+
required_env_vars = ["HF_TOKEN"]
|
|
330
330
|
|
|
331
331
|
###############################################################################
|
|
332
332
|
[safety-harness]
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: nemo-evaluator-launcher
|
|
3
|
-
Version: 0.1.21
|
|
3
|
+
Version: 0.1.23
|
|
4
4
|
Summary: Launcher for the evaluations provided by NeMo Evaluator containers with different runtime backends
|
|
5
5
|
Author: NVIDIA
|
|
6
6
|
Author-email: nemo-toolkit@nvidia.com
|
|
@@ -478,7 +478,7 @@ Requires-Dist: mlflow>=2.8.0; extra == "mlflow"
|
|
|
478
478
|
Provides-Extra: wandb
|
|
479
479
|
Requires-Dist: wandb>=0.15.0; extra == "wandb"
|
|
480
480
|
Provides-Extra: gsheets
|
|
481
|
-
Requires-Dist:
|
|
481
|
+
Requires-Dist: gspread>=5.0.0; extra == "gsheets"
|
|
482
482
|
Provides-Extra: exporters
|
|
483
483
|
Requires-Dist: mlflow; extra == "exporters"
|
|
484
484
|
Requires-Dist: wandb; extra == "exporters"
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|