nemo-evaluator-launcher 0.1.16__tar.gz → 0.1.44__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/PKG-INFO +3 -3
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/pyproject.toml +4 -2
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/__init__.py +15 -1
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/api/functional.py +106 -2
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/api/types.py +9 -0
- nemo_evaluator_launcher-0.1.16/src/nemo_evaluator_launcher/cli/debug.py → nemo_evaluator_launcher-0.1.44/src/nemo_evaluator_launcher/cli/info.py +170 -63
- nemo_evaluator_launcher-0.1.44/src/nemo_evaluator_launcher/cli/logs.py +102 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/cli/main.py +22 -10
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/cli/run.py +112 -28
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/cli/status.py +9 -8
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/cli/version.py +26 -23
- nemo_evaluator_launcher-0.1.44/src/nemo_evaluator_launcher/common/helpers.py +374 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/common/logging_utils.py +16 -5
- nemo_evaluator_launcher-0.1.44/src/nemo_evaluator_launcher/common/printing_utils.py +100 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/configs/deployment/sglang.yaml +4 -2
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/configs/deployment/trtllm.yaml +2 -3
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/configs/deployment/vllm.yaml +0 -1
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/configs/execution/slurm/default.yaml +19 -4
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/executors/base.py +31 -1
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/executors/lepton/deployment_helpers.py +36 -1
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/executors/lepton/executor.py +219 -24
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/executors/local/executor.py +403 -33
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/executors/local/run.template.sh +58 -3
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/executors/slurm/executor.py +442 -64
- nemo_evaluator_launcher-0.1.44/src/nemo_evaluator_launcher/executors/slurm/proxy.cfg.template +26 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/exporters/utils.py +32 -46
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/package_info.py +1 -1
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/resources/mapping.toml +57 -16
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher.egg-info/PKG-INFO +3 -3
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher.egg-info/SOURCES.txt +4 -1
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher.egg-info/entry_points.txt +1 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher.egg-info/requires.txt +1 -1
- nemo_evaluator_launcher-0.1.16/src/nemo_evaluator_launcher/common/helpers.py +0 -194
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/LICENSE +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/README.md +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/setup.cfg +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/api/__init__.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/api/utils.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/cli/__init__.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/cli/export.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/cli/kill.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/cli/ls_runs.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/cli/ls_tasks.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/common/__init__.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/common/execdb.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/common/mapping.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/configs/__init__.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/configs/default.yaml +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/configs/deployment/generic.yaml +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/configs/deployment/nim.yaml +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/configs/deployment/none.yaml +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/configs/execution/lepton/default.yaml +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/configs/execution/local.yaml +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/executors/__init__.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/executors/lepton/__init__.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/executors/lepton/job_helpers.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/executors/local/__init__.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/executors/registry.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/executors/slurm/__init__.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/exporters/__init__.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/exporters/base.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/exporters/gsheets.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/exporters/local.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/exporters/mlflow.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/exporters/registry.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/exporters/wandb.py +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher.egg-info/dependency_links.txt +0 -0
- {nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher.egg-info/top_level.txt +0 -0
{nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/PKG-INFO

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: nemo-evaluator-launcher
-Version: 0.1.16
+Version: 0.1.44
 Summary: Launcher for the evaluations provided by NeMo Evaluator containers with different runtime backends
 Author: NVIDIA
 Author-email: nemo-toolkit@nvidia.com

@@ -458,7 +458,7 @@ License:
 OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 SOFTWARE.

-Project-URL: homepage, https://github.com/NVIDIA-NeMo/
+Project-URL: homepage, https://github.com/NVIDIA-NeMo/Evaluator
 Project-URL: repository, https://github.com/NVIDIA-NeMo/Evaluator/packages/nemo-evaluator-launcher
 Keywords: deep learning,evaluations,machine learning,gpu,NLP,pytorch,torch
 Requires-Python: <3.14,>=3.10

@@ -478,7 +478,7 @@ Requires-Dist: mlflow>=2.8.0; extra == "mlflow"
 Provides-Extra: wandb
 Requires-Dist: wandb>=0.15.0; extra == "wandb"
 Provides-Extra: gsheets
-Requires-Dist:
+Requires-Dist: gspread>=5.0.0; extra == "gsheets"
 Provides-Extra: exporters
 Requires-Dist: mlflow; extra == "exporters"
 Requires-Dist: wandb; extra == "exporters"
{nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/pyproject.toml

@@ -33,20 +33,21 @@ keywords = [

 [project.urls]
 # BEGIN(if-changed): check package_info.py
-homepage = "https://github.com/NVIDIA-NeMo/
+homepage = "https://github.com/NVIDIA-NeMo/Evaluator"
 repository = "https://github.com/NVIDIA-NeMo/Evaluator/packages/nemo-evaluator-launcher"
 # END(if-changed)

 [project.optional-dependencies]
 mlflow = ["mlflow>=2.8.0"]
 wandb = ["wandb>=0.15.0"]
-gsheets = ["
+gsheets = ["gspread>=5.0.0"]
 exporters = ["mlflow", "wandb", "gsheets"]
 all = ["mlflow", "wandb", "gsheets"]

 [project.scripts]
 nemo-evaluator-launcher = "nemo_evaluator_launcher.cli.main:main"
 nv-eval = "nemo_evaluator_launcher.cli.main:main"
+nel = "nemo_evaluator_launcher.cli.main:main"

 [dependency-groups]
 dev = [

@@ -75,6 +76,7 @@ where = ["src"]
     "resources/**/*",
     "configs/**/*",
     "executors/**/*.sh",
+    "executors/**/*.template",
 ]

 [tool.setuptools.dynamic]
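The [project.scripts] hunk above registers a third console-script alias, nel, pointing at the same nemo_evaluator_launcher.cli.main:main callable as nemo-evaluator-launcher and nv-eval. A minimal sketch of that equivalence, assuming the usual zero-argument console-script convention (arguments come from sys.argv); the info <invocation_id> arguments are placeholders taken from the CLI docstring further down, not a prescribed usage:

import sys

from nemo_evaluator_launcher.cli.main import main

# Equivalent to running `nel info <invocation_id>` from a shell: all three
# script aliases dispatch to the same entry point, which parses sys.argv itself.
sys.argv = ["nel", "info", "<invocation_id>"]
main()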
{nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/__init__.py

@@ -20,6 +20,7 @@ It automatically initializes logging and conditionally loads internal components
 """

 import importlib
+import warnings

 from nemo_evaluator_launcher.common.logging_utils import logger
 from nemo_evaluator_launcher.package_info import (

@@ -32,9 +33,22 @@ from nemo_evaluator_launcher.package_info import (
     __version__,
 )

-
+# Suppress pydantic warnings from third-party libraries (e.g., wandb) that are not
+# compatible with Pydantic 2.x field metadata on Python 3.13+
+warnings.filterwarnings(
+    "ignore",
+    message=r"The 'repr' attribute.*Field\(\).*",
+    category=Warning,
+)
+warnings.filterwarnings(
+    "ignore",
+    message=r"The 'frozen' attribute.*Field\(\).*",
+    category=Warning,
+)


+logger.info("Version info", pkg=__package_name__, ver=__version__)
+
 try:
     importlib.import_module("nemo_evaluator_launcher_internal")
     logger.debug(
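For context on the two filters added above: warnings.filterwarnings treats message as a regular expression matched against the beginning of the warning text, so only warnings starting with the quoted phrases are silenced. A standalone sketch (the warning strings below are invented for illustration, not taken from wandb or pydantic):

import warnings

# Same filter shape as in the package __init__: `message` is a regex anchored at
# the start of the warning text, and `category=Warning` matches all subclasses.
warnings.filterwarnings(
    "ignore",
    message=r"The 'repr' attribute.*Field\(\).*",
    category=Warning,
)

warnings.warn("The 'repr' attribute passed to Field() is ignored")  # suppressed: matches the pattern
warnings.warn("Some unrelated warning")  # still emitted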
{nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/api/functional.py

@@ -19,7 +19,7 @@ This module provides the main functional entry points for running evaluations, q
 """

 from pathlib import Path
-from typing import Any, List, Optional, Union
+from typing import Any, Dict, Iterator, List, Optional, Tuple, Union

 import yaml
 from omegaconf import DictConfig, OmegaConf

@@ -116,6 +116,7 @@ def get_status(ids_or_prefixes: list[str]) -> list[dict[str, Any]]:
     db = ExecutionDB()
     results: List[dict[str, Any]] = []

+    # TODO(agronskiy): refactor the `.`-checking job in all the functions.
     for id_or_prefix in ids_or_prefixes:
         # If id looks like an invocation_id (no dot), get all jobs for it
         if "." not in id_or_prefix:

@@ -259,6 +260,108 @@ def get_status(ids_or_prefixes: list[str]) -> list[dict[str, Any]]:
     return results


+def stream_logs(
+    ids_or_prefixes: Union[str, list[str]],
+) -> Iterator[Tuple[str, str, str]]:
+    """Stream logs from jobs or invocations by their IDs or invocation IDs.
+
+    Args:
+        ids_or_prefixes: Single ID/prefix or list of job IDs or invocation IDs to stream logs from.
+            Short prefixes are allowed, we would try to match the full ones from
+            prefixes if no collisions are present.
+
+    Yields:
+        Tuple[str, str, str]: Tuples of (job_id, task_name, log_line) for each log line.
+            Empty lines are yielded as empty strings.
+
+    Raises:
+        ValueError: If the executor doesn't support log streaming.
+    """
+    db = ExecutionDB()
+
+    # Normalize to list for consistent processing
+    if isinstance(ids_or_prefixes, str):
+        ids_or_prefixes = [ids_or_prefixes]
+
+    # Collect all jobs from all IDs, grouped by executor
+    executor_to_jobs: Dict[str, Dict[str, JobData]] = {}
+    executor_to_invocations: Dict[str, List[str]] = {}
+
+    # TODO(agronskiy): refactor the `.`-checking job in all the functions.
+    for id_or_prefix in ids_or_prefixes:
+        # Determine if this is a job ID or invocation ID
+        if "." in id_or_prefix:
+            # This is a job ID
+            job_data = db.get_job(id_or_prefix)
+            if job_data is None:
+                continue
+
+            executor = job_data.executor
+            if executor not in executor_to_jobs:
+                executor_to_jobs[executor] = {}
+            executor_to_jobs[executor][id_or_prefix] = job_data
+        else:
+            # This is an invocation ID
+            jobs = db.get_jobs(id_or_prefix)
+            if not jobs:
+                continue
+
+            # Get the executor class from the first job
+            first_job_data = next(iter(jobs.values()))
+            executor = first_job_data.executor
+            if executor not in executor_to_invocations:
+                executor_to_invocations[executor] = []
+            executor_to_invocations[executor].append(id_or_prefix)
+
+    # Stream logs from each executor simultaneously
+    # For each executor, collect all job IDs and stream them together
+    for executor, jobs_dict in executor_to_jobs.items():
+        try:
+            executor_cls = get_executor(executor)
+        except ValueError:
+            continue
+
+        # For local executor with multiple jobs, pass list to stream simultaneously
+        # For other executors or single jobs, pass individual job IDs
+        if executor == "local" and len(jobs_dict) > 1:
+            # Pass all job IDs as a list to stream simultaneously
+            try:
+                yield from executor_cls.stream_logs(
+                    list(jobs_dict.keys()), executor_name=executor
+                )
+            except NotImplementedError:
+                raise ValueError(
+                    f"Log streaming is not yet implemented for executor '{executor}'"
+                )
+        else:
+            # Single job or non-local executor
+            for job_id in jobs_dict.keys():
+                try:
+                    yield from executor_cls.stream_logs(job_id, executor_name=executor)
+                except NotImplementedError:
+                    raise ValueError(
+                        f"Log streaming is not yet implemented for executor '{executor}'"
+                    )
+
+    # Stream logs from invocation IDs
+    for executor, invocation_ids in executor_to_invocations.items():
+        try:
+            executor_cls = get_executor(executor)
+        except ValueError:
+            continue
+
+        # Stream each invocation (each invocation already handles multiple jobs internally)
+        for invocation_id in invocation_ids:
+            try:
+                yield from executor_cls.stream_logs(
+                    invocation_id, executor_name=executor
+                )
+            except NotImplementedError:
+                raise ValueError(
+                    f"Log streaming is not yet implemented for executor '{executor}'"
+                )
+
+
 def list_all_invocations_summary() -> list[dict[str, Any]]:
     """Return a concise per-invocation summary from the exec DB.

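The stream_logs hunk above yields (job_id, task_name, log_line) tuples, which lets a caller interleave log lines from several jobs or invocations in a single loop. A minimal consumption sketch (the invocation ID is a placeholder):

from nemo_evaluator_launcher.api.functional import stream_logs

# Prefix each streamed line with its job and task so output from multiple jobs
# stays readable; empty log lines arrive as empty strings per the docstring.
for job_id, task_name, log_line in stream_logs("<invocation_id>"):
    print(f"[{job_id}/{task_name}] {log_line}")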
@@ -378,6 +481,7 @@ def kill_job_or_invocation(id: str) -> list[dict[str, Any]]:
             "data": {"error": f"Unexpected error: {str(e)}"},
         }

+    # TODO(agronskiy): refactor the `.`-checking job in all the functions.
    # Determine if this is a job ID or invocation ID
    if "." in id:
        # This is a job ID - kill single job

@@ -442,7 +546,7 @@ def export_results(
        if "." in single_id:  # job_id
            # Try reading config from artifacts working dir (auto-export on remote node)
            cfg_file = None
-            for name in ("
+            for name in ("config.yml", "run_config.yml"):
                p = Path(name)
                if p.exists():
                    cfg_file = p
{nemo_evaluator_launcher-0.1.16 → nemo_evaluator_launcher-0.1.44}/src/nemo_evaluator_launcher/api/types.py

@@ -19,9 +19,18 @@ This module defines data structures and helpers for configuration and type safety
 """

 import os
+import warnings
 from dataclasses import dataclass
 from typing import cast

+# ruff: noqa: E402
+# Later when adding optional module to hydra, since the internal package is optional,
+# will generate a hydra warning. We suppress it as distraction and bad UX, before hydra gets invoked.
+warnings.filterwarnings(
+    "ignore",
+    message="provider=hydra.searchpath.*path=nemo_evaluator_launcher_internal.*is not available\\.",
+)
+
 import hydra
 from hydra.core.global_hydra import GlobalHydra
 from omegaconf import DictConfig, OmegaConf
nemo_evaluator_launcher-0.1.16/src/nemo_evaluator_launcher/cli/debug.py → nemo_evaluator_launcher-0.1.44/src/nemo_evaluator_launcher/cli/info.py

@@ -14,16 +14,16 @@
 # limitations under the License.
 #

-"""
+"""Job information helper functionalities for nemo-evaluator-launcher."""

+import sys
 from dataclasses import dataclass
 from datetime import datetime
 from pathlib import Path
-from typing import Any, Dict, List,
+from typing import Any, Dict, List, Tuple

 from simple_parsing import field

-from nemo_evaluator_launcher.cli.export import ExportCmd
 from nemo_evaluator_launcher.cli.version import Cmd as VersionCmd
 from nemo_evaluator_launcher.common.execdb import EXEC_DB_FILE, ExecutionDB, JobData
 from nemo_evaluator_launcher.common.logging_utils import logger

@@ -35,52 +35,60 @@ _EXPORT_HELPER = LocalExporter({})


 @dataclass
-class DebugCmd(ExportCmd):
-    """
+class InfoCmd:
+    """Job information functionalities for nemo-evaluator-launcher.

     Examples:
-        nemo-evaluator-launcher
-        nemo-evaluator-launcher
-        nemo-evaluator-launcher
-        nemo-evaluator-launcher
-        nemo-evaluator-launcher
-        nemo-evaluator-launcher
+        nemo-evaluator-launcher info <inv>                         # Full job info
+        nemo-evaluator-launcher info <inv> --config                # Show stored job config (YAML)
+        nemo-evaluator-launcher info <inv> --artifacts             # Show artifact locations and key files
+        nemo-evaluator-launcher info <inv> --logs                  # Show log locations and key files
+        nemo-evaluator-launcher info <inv> --copy-logs <DIR>       # Copy logs to <DIR>
+        nemo-evaluator-launcher info <inv> --copy-artifacts <DIR>  # Copy artifacts to <DIR>

     Notes:
-        - Supports invocation IDs and job IDs
+        - Supports invocation IDs and job IDs (space-separated)
         - Shows local or remote paths depending on executor (local/slurm/lepton)
+        - Copy operations work for both local and remote jobs (expect longer time for remote jobs)
+        - Copy operations are not supported for Lepton executor (yet).
     """

-
-
+    invocation_ids: List[str] = field(
+        positional=True,
+        help="IDs to show info for (space-separated). Accepts invocation IDs or/and job IDs.",
+    )

-    #
-    config: bool = field(
-
-
+    # info modes
+    config: bool = field(
+        default=False, action="store_true", help="Show job configuration"
+    )
+    artifacts: bool = field(
+        default=False, action="store_true", help="Show artifact locations and key files"
+    )
+    logs: bool = field(
+        default=False, action="store_true", help="Show log locations and key files"
+    )

-    # copy operations
-    copy_logs:
+    # copy operations - work for both local and remote jobs
+    copy_logs: str | None = field(
         default=None,
         alias=["--copy-logs"],
-
-
+        help="Copy logs to a local directory",
+        metavar="DIR",
     )
-    copy_artifacts:
+    copy_artifacts: str | None = field(
         default=None,
         alias=["--copy-artifacts"],
-
-
+        help="Copy artifacts to a local directory",
+        metavar="DIR",
     )

     def execute(self) -> None:
-        # show version
         VersionCmd().execute()
-
-        logger.info("Debug command started", invocation_ids=self.invocation_ids)
+        logger.info("Info command started", invocation_ids=self.invocation_ids)

         if not self.invocation_ids:
-            logger.error("No invocation IDs provided")
+            logger.error("No job or invocation IDs provided.")
             raise ValueError("No job or invocation IDs provided.")

         jobs = self._resolve_jobs()
@@ -96,48 +104,63 @@ class DebugCmd(ExportCmd):
                 "No valid jobs found (jobs may have been deleted or IDs may be incorrect)."
             )
             print(
-                "No valid jobs found (jobs may have been
+                "No valid jobs found (jobs may have been deleted or IDs may be incorrect)."
             )
             return

+        # show ops
         if self.config:
-            logger.info("Showing job configuration", job_count=len(jobs))
             self._show_config_info(jobs)
-
-            logger.info("Showing job logs locations", job_count=len(jobs))
+        if self.logs:
             self._show_logs_info(jobs)
-
-            logger.info("Showing artifacts locations", job_count=len(jobs))
+        if self.artifacts:
             self._show_artifacts_info(jobs)
-
-
-
-
-
-
+
+        # copy ops
+        args = sys.argv[1:]
+        copy_logs_flag = "--copy-logs" in args
+        copy_artifacts_flag = "--copy-artifacts" in args
+
+        if copy_logs_flag:
+            if self.copy_logs is None:
+                raise ValueError("--copy-logs requires a directory path")
+            if not self.copy_logs.strip():
+                raise ValueError("--copy-logs requires a directory path")
             logger.info(
-                "Copying logs to local directory",
+                "Copying logs to local directory",
+                dest_dir=self.copy_logs,
+                job_count=len(jobs),
             )
-            self._copy_logs(jobs,
-
-
-            if
-
-
-            )
+            self._copy_logs(jobs, self.copy_logs)
+
+        if copy_artifacts_flag:
+            if self.copy_artifacts is None:
+                raise ValueError("--copy-artifacts requires a directory path")
+            if not self.copy_artifacts.strip():
+                raise ValueError("--copy-artifacts requires a directory path")
             logger.info(
                 "Copying artifacts to local directory",
-                dest_dir=
+                dest_dir=self.copy_artifacts,
                 job_count=len(jobs),
             )
-            self._copy_artifacts(jobs,
-
+            self._copy_artifacts(jobs, self.copy_artifacts)
+
+        # default view when no flags
+        if not any(
+            [
+                self.config,
+                self.logs,
+                self.artifacts,
+                self.copy_logs,
+                self.copy_artifacts,
+            ]
+        ):
             logger.info(
                 "Job metadata details",
                 invocation_id=jobs[0][1].invocation_id if jobs else None,
                 jobs=len(jobs),
             )
-            self.
+            self._show_invocation_info(jobs)

     def _resolve_jobs(self) -> List[Tuple[str, JobData]]:
         """Resolve jobs from ExecDB using IDs (job IDs and/or invocation IDs)."""
@@ -160,15 +183,15 @@ class DebugCmd(ExportCmd):
             uniq.append((jid, jd))
         return sorted(uniq, key=lambda p: p[0])

-    def
+    def _show_invocation_info(self, jobs: List[Tuple[str, JobData]]) -> None:
         inv = jobs[0][1].invocation_id if jobs else None
-        logger.info("
+        logger.info("Job information", jobs=len(jobs), invocation=inv)
         print(
-            f"
+            f"Job information for {len(jobs)} job(s){f' under invocation {inv}' if inv else ''}:\n"
         )

         for job_id, job_data in jobs:
-            self.
+            self._show_job_info(job_id, job_data)
             print()

         # footer hint: where to find more metadata

@@ -184,10 +207,14 @@ class DebugCmd(ExportCmd):
         print(" - Use --logs to show log locations.")
         print(" - Use --artifacts to show artifact locations.")
         print(" - Use --config to show stored job configuration (YAML).")
-        print(
-
+        print(
+            " - Use --copy-logs [DIR] to copy logs to a local directory (works for local and remote jobs)."
+        )
+        print(
+            " - Use --copy-artifacts [DIR] to copy artifacts to a local directory (works for local and remote jobs)."
+        )

-    def
+    def _show_job_info(self, job_id: str, job_data: JobData) -> None:
         logger.info("Job", job_id=job_id)
         print(f"Job {job_id}")

@@ -208,14 +235,22 @@ class DebugCmd(ExportCmd):
             logger.info("Task", job_id=job_id, name=task_name)
             print(f"├── Task: {task_name}")

+        # Determine executor type for file descriptions
+        cfg_exec_type = ((job_data.config or {}).get("execution") or {}).get("type")
+        exec_type = (job_data.executor or cfg_exec_type or "").lower()
+
         # locations via exporter helper
         paths = _EXPORT_HELPER.get_job_paths(job_data)

-        # Artifacts
+        # Artifacts with file descriptions
+        artifacts_list = _get_artifacts_file_list()
         if paths.get("storage_type") == "remote_ssh":
             artifacts_path = f"{paths['username']}@{paths['hostname']}:{paths['remote_path']}/artifacts"
             logger.info("Artifacts", job_id=job_id, path=artifacts_path, remote=True)
             print(f"├── Artifacts: {artifacts_path} (remote)")
+            print("│ └── Key files:")
+            for filename, desc in artifacts_list:
+                print(f"│ ├── {filename} - {desc}")
         else:
             ap = paths.get("artifacts_dir")
             if ap:

@@ -224,14 +259,21 @@ class DebugCmd(ExportCmd):
                     "Artifacts", job_id=job_id, path=str(ap), exists_indicator=exists
                 )
                 print(f"├── Artifacts: {ap} {exists} (local)")
+                print("│ └── Key files:")
+                for filename, desc in artifacts_list:
+                    print(f"│ ├── {filename} - {desc}")

-        # Logs
+        # Logs with file descriptions
+        logs_list = _get_log_file_list(exec_type)
         if paths.get("storage_type") == "remote_ssh":
             logs_path = (
                 f"{paths['username']}@{paths['hostname']}:{paths['remote_path']}/logs"
             )
             logger.info("Logs", job_id=job_id, path=logs_path, remote=True)
             print(f"├── Logs: {logs_path} (remote)")
+            print("│ └── Key files:")
+            for filename, desc in logs_list:
+                print(f"│ ├── {filename} - {desc}")
         else:
             lp = paths.get("logs_dir")
             if lp:

@@ -240,6 +282,9 @@ class DebugCmd(ExportCmd):
                     "Logs", job_id=job_id, path=str(lp), exists_indicator=exists
                 )
                 print(f"├── Logs: {lp} {exists} (local)")
+                print("│ └── Key files:")
+                for filename, desc in logs_list:
+                    print(f"│ ├── {filename} - {desc}")

         # executor-specific
         d = job_data.data or {}
@@ -264,17 +309,23 @@ class DebugCmd(ExportCmd):
             eu = d.get("endpoint_url")
             if eu:
                 print(f"├── Endpoint URL: {eu}")
-        # local and others: paths already displayed above; no extra fields needed

     def _show_logs_info(self, jobs: List[Tuple[str, JobData]]) -> None:
         logger.info("Log locations")
         print("Log locations:\n")
         for job_id, job_data in jobs:
             paths = _EXPORT_HELPER.get_job_paths(job_data)
+            cfg_exec_type = ((job_data.config or {}).get("execution") or {}).get("type")
+            exec_type = (job_data.executor or cfg_exec_type or "").lower()
+            logs_list = _get_log_file_list(exec_type)
+
             if paths.get("storage_type") == "remote_ssh":
                 logs_path = f"ssh://{paths['username']}@{paths['hostname']}{paths['remote_path']}/logs"
                 logger.info("Logs", job_id=job_id, path=logs_path, remote=True)
                 print(f"{job_id}: {logs_path} (remote)")
+                print(" └── Key files:")
+                for filename, desc in logs_list:
+                    print(f" ├── {filename} - {desc}")
             else:
                 lp = paths.get("logs_dir")
                 if lp:

@@ -283,18 +334,26 @@ class DebugCmd(ExportCmd):
                         "Logs", job_id=job_id, path=str(lp), exists_indicator=exists
                     )
                     print(f"{job_id}: {lp} {exists} (local)")
+                    print(" └── Key files:")
+                    for filename, desc in logs_list:
+                        print(f" ├── {filename} - {desc}")

     def _show_artifacts_info(self, jobs: List[Tuple[str, JobData]]) -> None:
         logger.info("Artifact locations")
         print("Artifact locations:\n")
         for job_id, job_data in jobs:
             paths = _EXPORT_HELPER.get_job_paths(job_data)
+            artifacts_list = _get_artifacts_file_list()
+
             if paths.get("storage_type") == "remote_ssh":
                 artifacts_path = f"ssh://{paths['username']}@{paths['hostname']}{paths['remote_path']}/artifacts"
                 logger.info(
                     "Artifacts", job_id=job_id, path=artifacts_path, remote=True
                 )
                 print(f"{job_id}: {artifacts_path} (remote)")
+                print(" └── Key files:")
+                for filename, desc in artifacts_list:
+                    print(f" ├── {filename} - {desc}")
             else:
                 ap = paths.get("artifacts_dir")
                 if ap:

@@ -306,6 +365,9 @@ class DebugCmd(ExportCmd):
                         exists_indicator=exists,
                     )
                     print(f"{job_id}: {ap} {exists} (local)")
+                    print(" └── Key files:")
+                    for filename, desc in artifacts_list:
+                        print(f" ├── {filename} - {desc}")

     def _show_config_info(self, jobs: List[Tuple[str, JobData]]) -> None:
         for job_id, job_data in jobs:

@@ -383,6 +445,9 @@ class DebugCmd(ExportCmd):
                         print(
                             f"{jid}: Failed - {job_result.get('message', 'Unknown error')}"
                         )
+                # Show full destination path
+                full_dest_path = Path(dest_dir).resolve()
+                print(f"Copied to: {full_dest_path}")
             else:
                 err = result.get("error", "Unknown error")
                 logger.warning("Content copy failed", error=err, dest_dir=dest_dir)
@@ -403,3 +468,45 @@ class DebugCmd(ExportCmd):
         except Exception:
             pass
         return ""
+
+
+# Helper functions for file descriptions (based on actual code and content analysis)
+def _get_artifacts_file_list() -> list[tuple[str, str]]:
+    """Files generated in artifacts/."""
+    return [
+        (
+            "results.yml",
+            "Benchmark scores, task results and resolved run configuration.",
+        ),
+        (
+            "eval_factory_metrics.json",
+            "Response + runtime stats (latency, tokens count, memory)",
+        ),
+        ("metrics.json", "Harness/benchmark metric and configuration"),
+        ("report.html", "Request-Response Pairs samples in HTML format (if enabled)"),
+        ("report.json", "Report data in json format, if enabled"),
+    ]
+
+
+def _get_log_file_list(executor_type: str) -> list[tuple[str, str]]:
+    """Files actually generated in logs/ - executor-specific."""
+    et = (executor_type or "local").lower()
+    if et == "slurm":
+        return [
+            ("client-{SLURM_JOB_ID}.out", "Evaluation container/process output"),
+            (
+                "slurm-{SLURM_JOB_ID}.out",
+                "SLURM scheduler stdout/stderr (batch submission, export steps).",
+            ),
+            (
+                "server-{SLURM_JOB_ID}.out",
+                "Model server logs when a deployment is used.",
+            ),
+        ]
+    # local executor
+    return [
+        (
+            "stdout.log",
+            "Complete evaluation output (timestamps, resolved config, run/export messages).",
+        ),
+    ]