PyPI - synth-ai - Versions diffs - 0.4.1__py3-none-any.whl → 0.4.4__py3-none-any.whl - Mend

synth-ai 0.4.1__py3-none-any.whl → 0.4.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of synth-ai might be problematic. Click here for more details.

Files changed (153) hide show

synth_ai/__init__.py +13 -13
synth_ai/cli/__init__.py +6 -15
synth_ai/cli/commands/eval/__init__.py +6 -15
synth_ai/cli/commands/eval/config.py +338 -0
synth_ai/cli/commands/eval/core.py +236 -1091
synth_ai/cli/commands/eval/runner.py +704 -0
synth_ai/cli/commands/eval/validation.py +44 -117
synth_ai/cli/commands/filter/core.py +7 -7
synth_ai/cli/commands/filter/validation.py +2 -2
synth_ai/cli/commands/smoke/core.py +7 -17
synth_ai/cli/commands/status/__init__.py +1 -64
synth_ai/cli/commands/status/client.py +50 -151
synth_ai/cli/commands/status/config.py +3 -83
synth_ai/cli/commands/status/errors.py +4 -13
synth_ai/cli/commands/status/subcommands/__init__.py +2 -8
synth_ai/cli/commands/status/subcommands/config.py +13 -0
synth_ai/cli/commands/status/subcommands/files.py +18 -63
synth_ai/cli/commands/status/subcommands/jobs.py +28 -311
synth_ai/cli/commands/status/subcommands/models.py +18 -62
synth_ai/cli/commands/status/subcommands/runs.py +16 -63
synth_ai/cli/commands/status/subcommands/session.py +67 -172
synth_ai/cli/commands/status/subcommands/summary.py +24 -32
synth_ai/cli/commands/status/subcommands/utils.py +41 -0
synth_ai/cli/commands/status/utils.py +16 -107
synth_ai/cli/commands/train/__init__.py +18 -20
synth_ai/cli/commands/train/errors.py +3 -3
synth_ai/cli/commands/train/prompt_learning_validation.py +15 -16
synth_ai/cli/commands/train/validation.py +7 -7
synth_ai/cli/commands/train/{judge_schemas.py → verifier_schemas.py} +33 -34
synth_ai/cli/commands/train/verifier_validation.py +235 -0
synth_ai/cli/demo_apps/demo_task_apps/math/config.toml +0 -1
synth_ai/cli/demo_apps/demo_task_apps/math/modal_task_app.py +2 -6
synth_ai/cli/demo_apps/math/config.toml +0 -1
synth_ai/cli/demo_apps/math/modal_task_app.py +2 -6
synth_ai/cli/demo_apps/mipro/task_app.py +25 -47
synth_ai/cli/lib/apps/task_app.py +12 -13
synth_ai/cli/lib/task_app_discovery.py +6 -6
synth_ai/cli/lib/train_cfgs.py +10 -10
synth_ai/cli/task_apps/__init__.py +11 -0
synth_ai/cli/task_apps/commands.py +7 -15
synth_ai/core/env.py +12 -1
synth_ai/core/errors.py +1 -2
synth_ai/core/integrations/cloudflare.py +209 -33
synth_ai/core/tracing_v3/abstractions.py +46 -0
synth_ai/data/__init__.py +3 -30
synth_ai/data/enums.py +1 -20
synth_ai/data/rewards.py +100 -3
synth_ai/products/graph_evolve/__init__.py +1 -2
synth_ai/products/graph_evolve/config.py +16 -16
synth_ai/products/graph_evolve/converters/__init__.py +3 -3
synth_ai/products/graph_evolve/converters/openai_sft.py +7 -7
synth_ai/products/graph_evolve/examples/hotpotqa/config.toml +1 -1
synth_ai/products/graph_gepa/__init__.py +23 -0
synth_ai/products/graph_gepa/converters/__init__.py +19 -0
synth_ai/products/graph_gepa/converters/openai_sft.py +29 -0
synth_ai/sdk/__init__.py +45 -35
synth_ai/sdk/api/eval/__init__.py +33 -0
synth_ai/sdk/api/eval/job.py +732 -0
synth_ai/sdk/api/research_agent/__init__.py +276 -66
synth_ai/sdk/api/train/builders.py +181 -0
synth_ai/sdk/api/train/cli.py +41 -33
synth_ai/sdk/api/train/configs/__init__.py +6 -4
synth_ai/sdk/api/train/configs/prompt_learning.py +127 -33
synth_ai/sdk/api/train/configs/rl.py +264 -16
synth_ai/sdk/api/train/configs/sft.py +165 -1
synth_ai/sdk/api/train/graph_validators.py +12 -12
synth_ai/sdk/api/train/graphgen.py +169 -51
synth_ai/sdk/api/train/graphgen_models.py +95 -45
synth_ai/sdk/api/train/local_api.py +10 -0
synth_ai/sdk/api/train/pollers.py +36 -0
synth_ai/sdk/api/train/prompt_learning.py +390 -60
synth_ai/sdk/api/train/rl.py +41 -5
synth_ai/sdk/api/train/sft.py +2 -0
synth_ai/sdk/api/train/task_app.py +20 -0
synth_ai/sdk/api/train/validators.py +17 -17
synth_ai/sdk/graphs/completions.py +239 -33
synth_ai/sdk/{judging/schemas.py → graphs/verifier_schemas.py} +23 -23
synth_ai/sdk/learning/__init__.py +35 -5
synth_ai/sdk/learning/context_learning_client.py +531 -0
synth_ai/sdk/learning/context_learning_types.py +294 -0
synth_ai/sdk/learning/prompt_learning_client.py +1 -1
synth_ai/sdk/learning/prompt_learning_types.py +2 -1
synth_ai/sdk/learning/rl/__init__.py +0 -4
synth_ai/sdk/learning/rl/contracts.py +0 -4
synth_ai/sdk/localapi/__init__.py +40 -0
synth_ai/sdk/localapi/apps/__init__.py +28 -0
synth_ai/sdk/localapi/client.py +10 -0
synth_ai/sdk/localapi/contracts.py +10 -0
synth_ai/sdk/localapi/helpers.py +519 -0
synth_ai/sdk/localapi/rollouts.py +93 -0
synth_ai/sdk/localapi/server.py +29 -0
synth_ai/sdk/localapi/template.py +49 -0
synth_ai/sdk/streaming/handlers.py +6 -6
synth_ai/sdk/streaming/streamer.py +10 -6
synth_ai/sdk/task/__init__.py +18 -5
synth_ai/sdk/task/apps/__init__.py +37 -1
synth_ai/sdk/task/client.py +9 -1
synth_ai/sdk/task/config.py +6 -11
synth_ai/sdk/task/contracts.py +137 -95
synth_ai/sdk/task/in_process.py +32 -22
synth_ai/sdk/task/in_process_runner.py +9 -4
synth_ai/sdk/task/rubrics/__init__.py +2 -3
synth_ai/sdk/task/rubrics/loaders.py +4 -4
synth_ai/sdk/task/rubrics/strict.py +3 -4
synth_ai/sdk/task/server.py +76 -16
synth_ai/sdk/task/trace_correlation_helpers.py +190 -139
synth_ai/sdk/task/validators.py +34 -49
synth_ai/sdk/training/__init__.py +7 -16
synth_ai/sdk/tunnels/__init__.py +118 -0
synth_ai/sdk/tunnels/cleanup.py +83 -0
synth_ai/sdk/tunnels/ports.py +120 -0
synth_ai/sdk/tunnels/tunneled_api.py +363 -0
{synth_ai-0.4.1.dist-info → synth_ai-0.4.4.dist-info}/METADATA +71 -4
{synth_ai-0.4.1.dist-info → synth_ai-0.4.4.dist-info}/RECORD +118 -128
synth_ai/cli/commands/baseline/__init__.py +0 -12
synth_ai/cli/commands/baseline/core.py +0 -636
synth_ai/cli/commands/baseline/list.py +0 -94
synth_ai/cli/commands/eval/errors.py +0 -81
synth_ai/cli/commands/status/formatters.py +0 -164
synth_ai/cli/commands/status/subcommands/pricing.py +0 -23
synth_ai/cli/commands/status/subcommands/usage.py +0 -203
synth_ai/cli/commands/train/judge_validation.py +0 -305
synth_ai/cli/usage.py +0 -159
synth_ai/data/specs.py +0 -36
synth_ai/sdk/api/research_agent/cli.py +0 -428
synth_ai/sdk/api/research_agent/config.py +0 -357
synth_ai/sdk/api/research_agent/job.py +0 -717
synth_ai/sdk/baseline/__init__.py +0 -25
synth_ai/sdk/baseline/config.py +0 -209
synth_ai/sdk/baseline/discovery.py +0 -216
synth_ai/sdk/baseline/execution.py +0 -154
synth_ai/sdk/judging/__init__.py +0 -15
synth_ai/sdk/judging/base.py +0 -24
synth_ai/sdk/judging/client.py +0 -191
synth_ai/sdk/judging/types.py +0 -42
synth_ai/sdk/research_agent/__init__.py +0 -34
synth_ai/sdk/research_agent/container_builder.py +0 -328
synth_ai/sdk/research_agent/container_spec.py +0 -198
synth_ai/sdk/research_agent/defaults.py +0 -34
synth_ai/sdk/research_agent/results_collector.py +0 -69
synth_ai/sdk/specs/__init__.py +0 -46
synth_ai/sdk/specs/dataclasses.py +0 -149
synth_ai/sdk/specs/loader.py +0 -144
synth_ai/sdk/specs/serializer.py +0 -199
synth_ai/sdk/specs/validation.py +0 -250
synth_ai/sdk/tracing/__init__.py +0 -39
synth_ai/sdk/usage/__init__.py +0 -37
synth_ai/sdk/usage/client.py +0 -171
synth_ai/sdk/usage/models.py +0 -261
{synth_ai-0.4.1.dist-info → synth_ai-0.4.4.dist-info}/WHEEL +0 -0
{synth_ai-0.4.1.dist-info → synth_ai-0.4.4.dist-info}/entry_points.txt +0 -0
{synth_ai-0.4.1.dist-info → synth_ai-0.4.4.dist-info}/licenses/LICENSE +0 -0
{synth_ai-0.4.1.dist-info → synth_ai-0.4.4.dist-info}/top_level.txt +0 -0

synth_ai/sdk/api/train/prompt_learning.py CHANGED Viewed

@@ -1,5 +1,9 @@
 """First-class SDK API for prompt learning (MIPRO and GEPA).
+**Status:** Alpha
+Note: MIPRO is Experimental, GEPA is Alpha.
 This module provides high-level abstractions for running prompt optimization jobs
 both via CLI (`uvx synth-ai train`) and programmatically in Python scripts.
@@ -8,13 +12,17 @@ Example CLI usage:
 Example SDK usage:
     from synth_ai.sdk.api.train.prompt_learning import PromptLearningJob
-    job = PromptLearningJob.from_config("my_config.toml")
+    job = PromptLearningJob.from_dict(config_dict, api_key="sk_live_...")
     job.submit()
-    result = job.poll_until_complete()
-    print(f"Best score: {result['best_score']}")
+    result = job.poll_until_complete(progress=True)  # Built-in progress printing
+    if result.succeeded:
+        print(f"Best score: {result.best_score}")
+    else:
+        print(f"Failed: {result.error}")
-For domain-specific judging, you can use **Verifier Graphs**. See `PromptLearningJudgeConfig`
+For domain-specific verification, you can use **Verifier Graphs**. See `PromptLearningVerifierConfig`
 in `synth_ai.sdk.api.train.configs.prompt_learning` for configuration details.
 """
@@ -22,38 +30,186 @@ from __future__ import annotations
 import asyncio
 import os
-from dataclasses import dataclass
+import time
+from dataclasses import dataclass, field
+from enum import Enum
 from pathlib import Path
-from typing import Any, Callable, Dict, Optional
+from typing import Any, Callable, Dict, List, Optional
 from synth_ai.core.telemetry import log_info
-from .builders import PromptLearningBuildResult, build_prompt_learning_payload
+class JobStatus(str, Enum):
+    """Status of a prompt learning job."""
+    PENDING = "pending"
+    QUEUED = "queued"
+    RUNNING = "running"
+    SUCCEEDED = "succeeded"
+    FAILED = "failed"
+    CANCELLED = "cancelled"
+    @classmethod
+    def from_string(cls, status: str) -> "JobStatus":
+        """Convert string to JobStatus, defaulting to PENDING for unknown values."""
+        try:
+            return cls(status.lower())
+        except ValueError:
+            return cls.PENDING
+    @property
+    def is_terminal(self) -> bool:
+        """Whether this status is terminal (job won't change further)."""
+        return self in (JobStatus.SUCCEEDED, JobStatus.FAILED, JobStatus.CANCELLED)
+    @property
+    def is_success(self) -> bool:
+        """Whether this status indicates success."""
+        return self == JobStatus.SUCCEEDED
+@dataclass
+class PromptLearningResult:
+    """Typed result from a prompt learning job.
+    Provides clean accessors for common fields instead of raw dict access.
+    Example:
+        >>> result = job.poll_until_complete()
+        >>> if result.succeeded:
+        ...     print(f"Best score: {result.best_score}")
+        ...     print(f"Best prompt: {result.best_prompt[:100]}...")
+        >>> else:
+        ...     print(f"Failed: {result.error}")
+    """
+    job_id: str
+    status: JobStatus
+    best_score: Optional[float] = None
+    best_prompt: Optional[str] = None
+    error: Optional[str] = None
+    raw: Dict[str, Any] = field(default_factory=dict)
+    @classmethod
+    def from_response(cls, job_id: str, data: Dict[str, Any]) -> "PromptLearningResult":
+        """Create result from API response dict."""
+        status_str = data.get("status", "pending")
+        status = JobStatus.from_string(status_str)
+        # Extract best score from various field names (backward compat)
+        best_score = (
+            data.get("best_score")
+            or data.get("best_reward")
+            or data.get("best_train_score")
+            or data.get("best_train_reward")
+        )
+        return cls(
+            job_id=job_id,
+            status=status,
+            best_score=best_score,
+            best_prompt=data.get("best_prompt"),
+            error=data.get("error"),
+            raw=data,
+        )
+    @property
+    def succeeded(self) -> bool:
+        """Whether the job succeeded."""
+        return self.status.is_success
+    @property
+    def failed(self) -> bool:
+        """Whether the job failed."""
+        return self.status == JobStatus.FAILED
+    @property
+    def is_terminal(self) -> bool:
+        """Whether the job has reached a terminal state."""
+        return self.status.is_terminal
+from .builders import (
+    PromptLearningBuildResult,
+    build_prompt_learning_payload,
+    build_prompt_learning_payload_from_mapping,
+)
 from .pollers import JobPoller, PollOutcome
-from .task_app import check_task_app_health
-from .utils import ensure_api_base, http_post
+from .local_api import check_local_api_health
+from .utils import ensure_api_base, http_get, http_post
 @dataclass
 class PromptLearningJobConfig:
-    """Configuration for a prompt learning job."""
-    config_path: Path
+    """Configuration for a prompt learning job.
+    This dataclass holds all the configuration needed to submit and run
+    a prompt learning job (MIPRO or GEPA optimization).
+    Supports two modes:
+    1. **File-based**: Provide `config_path` pointing to a TOML file
+    2. **Programmatic**: Provide `config_dict` with the configuration directly
+    Both modes go through the same `PromptLearningConfig` Pydantic validation.
+    Attributes:
+        config_path: Path to the TOML configuration file. Mutually exclusive with config_dict.
+        config_dict: Dictionary with prompt learning configuration. Mutually exclusive with config_path.
+            Should have the same structure as the TOML file (with 'prompt_learning' section).
+        backend_url: Base URL of the Synth API backend (e.g., "https://api.usesynth.ai").
+        api_key: Synth API key for authentication.
+        task_app_api_key: API key for authenticating with the Local API.
+        allow_experimental: If True, allows use of experimental models.
+        overrides: Dictionary of config overrides.
+    Example (file-based):
+        >>> config = PromptLearningJobConfig(
+        ...     config_path=Path("my_config.toml"),
+        ...     backend_url="https://api.usesynth.ai",
+        ...     api_key="sk_live_...",
+        ... )
+    Example (programmatic):
+        >>> config = PromptLearningJobConfig(
+        ...     config_dict={
+        ...         "prompt_learning": {
+        ...             "algorithm": "gepa",
+        ...             "task_app_url": "https://tunnel.example.com",
+        ...             "policy": {"model": "gpt-4o-mini", "provider": "openai"},
+        ...             "gepa": {...},
+        ...         }
+        ...     },
+        ...     backend_url="https://api.usesynth.ai",
+        ...     api_key="sk_live_...",
+        ... )
+    """
     backend_url: str
     api_key: str
+    config_path: Optional[Path] = None
+    config_dict: Optional[Dict[str, Any]] = None
     task_app_api_key: Optional[str] = None
     allow_experimental: Optional[bool] = None
     overrides: Optional[Dict[str, Any]] = None
     def __post_init__(self) -> None:
         """Validate configuration."""
-        if not self.config_path.exists():
+        # Must provide exactly one of config_path or config_dict
+        has_path = self.config_path is not None
+        has_dict = self.config_dict is not None
+        if has_path and has_dict:
+            raise ValueError("Provide either config_path OR config_dict, not both")
+        if not has_path and not has_dict:
+            raise ValueError("Either config_path or config_dict is required")
+        if has_path and not self.config_path.exists():
             raise FileNotFoundError(f"Config file not found: {self.config_path}")
         if not self.backend_url:
             raise ValueError("backend_url is required")
         if not self.api_key:
             raise ValueError("api_key is required")
         # Get task_app_api_key from environment if not provided
         if not self.task_app_api_key:
             self.task_app_api_key = os.environ.get("ENVIRONMENT_API_KEY")
@@ -184,9 +340,100 @@ class PromptLearningJob:
             allow_experimental=allow_experimental,
             overrides=overrides or {},
         )
         return cls(config)
+    @classmethod
+    def from_dict(
+        cls,
+        config_dict: Dict[str, Any],
+        backend_url: Optional[str] = None,
+        api_key: Optional[str] = None,
+        task_app_api_key: Optional[str] = None,
+        allow_experimental: Optional[bool] = None,
+        overrides: Optional[Dict[str, Any]] = None,
+        skip_health_check: bool = False,
+    ) -> PromptLearningJob:
+        """Create a job from a configuration dictionary (programmatic use).
+        This allows creating prompt learning jobs without a TOML file, enabling
+        programmatic use in notebooks, scripts, and applications.
+        The config_dict should have the same structure as a TOML file:
+        ```python
+        {
+            "prompt_learning": {
+                "algorithm": "gepa",
+                "task_app_url": "https://...",
+                "policy": {"model": "gpt-4o-mini", "provider": "openai"},
+                "gepa": {...},
+            }
+        }
+        ```
+        Args:
+            config_dict: Configuration dictionary with 'prompt_learning' section
+            backend_url: Backend API URL (defaults to env or production)
+            api_key: API key (defaults to SYNTH_API_KEY env var)
+            task_app_api_key: Task app API key (defaults to ENVIRONMENT_API_KEY env var)
+            allow_experimental: Allow experimental models
+            overrides: Config overrides
+            skip_health_check: If True, skip task app health check before submission
+        Returns:
+            PromptLearningJob instance
+        Raises:
+            ValueError: If required config is missing or invalid
+        Example:
+            >>> job = PromptLearningJob.from_dict(
+            ...     config_dict={
+            ...         "prompt_learning": {
+            ...             "algorithm": "gepa",
+            ...             "task_app_url": "https://tunnel.example.com",
+            ...             "policy": {"model": "gpt-4o-mini", "provider": "openai"},
+            ...             "gepa": {
+            ...                 "rollout": {"budget": 50, "max_concurrent": 5},
+            ...                 "evaluation": {"train_seeds": [1, 2, 3], "val_seeds": [4, 5]},
+            ...                 "population": {"num_generations": 2, "children_per_generation": 2},
+            ...             },
+            ...         }
+            ...     },
+            ...     api_key="sk_live_...",
+            ... )
+            >>> job_id = job.submit()
+        """
+        import os
+        from synth_ai.core.env import get_backend_from_env
+        # Resolve backend URL
+        if not backend_url:
+            backend_url = os.environ.get("BACKEND_BASE_URL", "").strip()
+            if not backend_url:
+                base, _ = get_backend_from_env()
+                backend_url = f"{base}/api" if not base.endswith("/api") else base
+        # Resolve API key
+        if not api_key:
+            api_key = os.environ.get("SYNTH_API_KEY")
+            if not api_key:
+                raise ValueError(
+                    "api_key is required (provide explicitly or set SYNTH_API_KEY env var)"
+                )
+        config = PromptLearningJobConfig(
+            config_dict=config_dict,
+            backend_url=backend_url,
+            api_key=api_key,
+            task_app_api_key=task_app_api_key,
+            allow_experimental=allow_experimental,
+            overrides=overrides or {},
+        )
+        return cls(config, skip_health_check=skip_health_check)
     @classmethod
     def from_job_id(
         cls,
@@ -223,33 +470,59 @@ class PromptLearningJob:
                     "api_key is required (provide explicitly or set SYNTH_API_KEY env var)"
                 )
-        # Create minimal config (we don't need the config file for resuming)
+        # Create minimal config (we don't need the config for resuming - use empty dict)
+        # The config_dict is never used when resuming since we have the job_id
         config = PromptLearningJobConfig(
-            config_path=Path("/dev/null"),  # Dummy path
+            config_dict={"prompt_learning": {"_resumed": True}},  # Placeholder for resume mode
             backend_url=backend_url,
             api_key=api_key,
         )
         return cls(config, job_id=job_id)
     def _build_payload(self) -> PromptLearningBuildResult:
-        """Build the job payload from config."""
+        """Build the job payload from config.
+        Supports both file-based (config_path) and programmatic (config_dict) modes.
+        Both modes route through the same PromptLearningConfig Pydantic validation.
+        """
         if self._build_result is None:
-            if not self.config.config_path.exists() or self.config.config_path.name == "/dev/null":
-                raise RuntimeError(
-                    "Cannot build payload: config_path is required for new jobs. "
-                    "Use from_job_id() to resume an existing job."
-                )
             overrides = self.config.overrides or {}
             overrides["backend"] = self.config.backend_url
-            self._build_result = build_prompt_learning_payload(
-                config_path=self.config.config_path,
-                task_url=None,  # Force using TOML only
-                overrides=overrides,
-                allow_experimental=self.config.allow_experimental,
-            )
+            # Pass task_app_api_key to builder via overrides
+            if self.config.task_app_api_key:
+                overrides["task_app_api_key"] = self.config.task_app_api_key
+            # Route to appropriate builder based on config mode
+            if self.config.config_dict is not None:
+                # Programmatic mode: use dict-based builder
+                self._build_result = build_prompt_learning_payload_from_mapping(
+                    raw_config=self.config.config_dict,
+                    task_url=None,
+                    overrides=overrides,
+                    allow_experimental=self.config.allow_experimental,
+                    source_label="PromptLearningJob.from_dict",
+                )
+            elif self.config.config_path is not None:
+                # File-based mode: use path-based builder
+                if not self.config.config_path.exists():
+                    raise RuntimeError(
+                        f"Config file not found: {self.config.config_path}. "
+                        "Use from_dict() for programmatic config or from_job_id() to resume."
+                    )
+                self._build_result = build_prompt_learning_payload(
+                    config_path=self.config.config_path,
+                    task_url=None,
+                    overrides=overrides,
+                    allow_experimental=self.config.allow_experimental,
+                )
+            else:
+                raise RuntimeError(
+                    "Cannot build payload: either config_path or config_dict is required. "
+                    "Use from_config() for file-based config, from_dict() for programmatic config, "
+                    "or from_job_id() to resume an existing job."
+                )
         return self._build_result
     def submit(self) -> str:
@@ -262,7 +535,11 @@ class PromptLearningJob:
             RuntimeError: If job submission fails
             ValueError: If task app health check fails
         """
-        ctx: Dict[str, Any] = {"config_path": str(self.config.config_path)}
+        # Log context based on config mode
+        if self.config.config_path is not None:
+            ctx: Dict[str, Any] = {"config_path": str(self.config.config_path)}
+        else:
+            ctx = {"config_mode": "programmatic"}
         log_info("PromptLearningJob.submit invoked", ctx=ctx)
         if self._job_id:
             raise RuntimeError(f"Job already submitted: {self._job_id}")
@@ -271,7 +548,7 @@ class PromptLearningJob:
         # Health check (skip if _skip_health_check is set - useful for tunnels with DNS delay)
         if not self._skip_health_check:
-            health = check_task_app_health(build.task_url, self.config.task_app_api_key or "")
+            health = check_local_api_health(build.task_url, self.config.task_app_api_key or "")
             if not health.ok:
                 raise ValueError(f"Task app health check failed: {health.detail}")
@@ -351,40 +628,92 @@ class PromptLearningJob:
         *,
         timeout: float = 3600.0,
         interval: float = 5.0,
+        progress: bool = False,
         on_status: Optional[Callable[[Dict[str, Any]], None]] = None,
-    ) -> Dict[str, Any]:
+    ) -> PromptLearningResult:
         """Poll job until it reaches a terminal state.
         Args:
             timeout: Maximum seconds to wait
             interval: Seconds between poll attempts
-            on_status: Optional callback called on each status update
+            progress: If True, print status updates during polling (useful for notebooks)
+            on_status: Optional callback called on each status update (for custom progress handling)
         Returns:
-            Final job status dictionary
+            PromptLearningResult with typed status, best_score, etc.
         Raises:
             RuntimeError: If job hasn't been submitted yet
             TimeoutError: If timeout is exceeded
+        Example:
+            >>> result = job.poll_until_complete(progress=True)
+            [00:15] running | score: 0.72
+            [00:30] running | score: 0.78
+            [00:45] succeeded | score: 0.85
+            >>> result.succeeded
+            True
+            >>> result.best_score
+            0.85
         """
         if not self._job_id:
             raise RuntimeError("Job not yet submitted. Call submit() first.")
-        poller = PromptLearningJobPoller(
-            base_url=self.config.backend_url,
-            api_key=self.config.api_key,
-            interval=interval,
-            timeout=timeout,
-        )
-        outcome = poller.poll_job(self._job_id)  # type: ignore[arg-type]  # We check None above
-        payload = dict(outcome.payload) if isinstance(outcome.payload, dict) else {}
-        if on_status:
-            on_status(payload)
-        return payload
+        job_id = self._job_id
+        base_url = ensure_api_base(self.config.backend_url)
+        headers = {
+            "Authorization": f"Bearer {self.config.api_key}",
+            "Content-Type": "application/json",
+        }
+        start_time = time.time()
+        elapsed = 0.0
+        last_data: Dict[str, Any] = {}
+        while elapsed <= timeout:
+            try:
+                # Fetch job status
+                url = f"{base_url}/prompt-learning/online/jobs/{job_id}"
+                resp = http_get(url, headers=headers)
+                data = resp.json() if resp.headers.get("content-type", "").startswith("application/json") else {}
+                last_data = dict(data) if isinstance(data, dict) else {}
+                status = JobStatus.from_string(last_data.get("status", "pending"))
+                best_score = (
+                    last_data.get("best_score")
+                    or last_data.get("best_reward")
+                    or last_data.get("best_train_score")
+                    or last_data.get("best_train_reward")
+                )
+                # Progress output
+                if progress:
+                    mins, secs = divmod(int(elapsed), 60)
+                    score_str = f"score: {best_score:.2f}" if best_score is not None else "score: --"
+                    print(f"[{mins:02d}:{secs:02d}] {status.value} | {score_str}")
+                # Callback for custom handling
+                if on_status:
+                    on_status(last_data)
+                # Check terminal state
+                if status.is_terminal:
+                    return PromptLearningResult.from_response(job_id, last_data)
+            except Exception as exc:
+                if progress:
+                    print(f"[poll] error: {exc}")
+                log_info("poll request failed", ctx={"error": str(exc), "job_id": job_id})
+            time.sleep(interval)
+            elapsed = time.time() - start_time
+        # Timeout reached
+        if progress:
+            print(f"[poll] timeout after {timeout:.0f}s")
+        # Return with whatever data we have, status will indicate not complete
+        return PromptLearningResult.from_response(job_id, last_data)
     def get_results(self) -> Dict[str, Any]:
         """Get job results (prompts, scores, etc.).
@@ -463,8 +792,9 @@ class PromptLearningJob:
 __all__ = [
+    "JobStatus",
     "PromptLearningJob",
     "PromptLearningJobConfig",
     "PromptLearningJobPoller",
+    "PromptLearningResult",
 ]

synth_ai/sdk/api/train/rl.py CHANGED Viewed

@@ -1,5 +1,7 @@
 """First-class SDK API for reinforcement learning (RL/GSPO).
+**Status:** Experimental
 This module provides high-level abstractions for running RL training jobs
 both via CLI (`uvx synth-ai train --type rl`) and programmatically in Python scripts.
@@ -32,14 +34,49 @@ from synth_ai.core.telemetry import log_info
 from .builders import RLBuildResult, build_rl_payload
 from .pollers import RLJobPoller
-from .task_app import check_task_app_health
+from .local_api import check_local_api_health
 from .utils import ensure_api_base, http_post
 @dataclass
 class RLJobConfig:
-    """Configuration for an RL training job."""
+    """Configuration for an RL training job.
+    This dataclass holds all the configuration needed to submit and run
+    a reinforcement learning training job (GSPO, GRPO, PPO, etc.).
+    Attributes:
+        config_path: Path to the TOML configuration file that defines the
+            RL training task, including model settings, training hyperparameters,
+            reward configuration, and Local API URL.
+        backend_url: Base URL of the Synth API backend (e.g.,
+            "https://api.usesynth.ai"). Can also be set via BACKEND_BASE_URL
+            environment variable.
+        api_key: Synth API key for authentication. Can also be set via
+            SYNTH_API_KEY environment variable.
+        task_app_url: URL of the Local API that serves rollout environments.
+            Can be set via TASK_APP_URL env var if not provided.
+            (Alias: also known as "task app URL" in older documentation)
+        task_app_api_key: API key for authenticating with the Local API.
+            Defaults to ENVIRONMENT_API_KEY env var if not provided.
+            (Alias: also known as "task app API key" in older documentation)
+        allow_experimental: If True, allows use of experimental models and
+            features. Defaults to None (uses config file setting).
+        overrides: Dictionary of config overrides that take precedence over
+            values in the TOML file. Useful for programmatic customization.
+        idempotency_key: Optional key for idempotent job submission. If provided,
+            submitting the same key twice will return the existing job instead
+            of creating a new one.
+    Example:
+        >>> config = RLJobConfig(
+        ...     config_path=Path("rl_config.toml"),
+        ...     backend_url="https://api.usesynth.ai",
+        ...     api_key="sk_live_...",
+        ...     task_app_url="https://my-task-app.example.com",
+        ... )
+    """
     config_path: Path
     backend_url: str
     api_key: str
@@ -282,7 +319,7 @@ class RLJob:
         # Health check (skip if _skip_health_check is set - useful for tunnels with DNS delay)
         if not self._skip_health_check:
             task_app_key = self.config.task_app_api_key or ""
-            health = check_task_app_health(build.task_url, task_app_key)
+            health = check_local_api_health(build.task_url, task_app_key)
             if not health.ok:
                 raise ValueError(f"Task app health check failed: {health.detail}")
@@ -439,4 +476,3 @@ __all__ = [
     "RLJob",
     "RLJobConfig",
 ]

synth_ai/sdk/api/train/sft.py CHANGED Viewed

@@ -1,5 +1,7 @@
 """First-class SDK API for SFT (Supervised Fine-Tuning).
+**Status:** Experimental
 This module provides high-level abstractions for running SFT jobs
 both via CLI (`uvx synth-ai train`) and programmatically in Python scripts.

synth_ai/sdk/api/train/task_app.py CHANGED Viewed

@@ -21,6 +21,11 @@ class TaskAppHealth:
     detail: str | None = None
+@dataclass(slots=True)
+class LocalAPIHealth(TaskAppHealth):
+    """Alias for TaskAppHealth with LocalAPI naming."""
 def _resolve_hostname_with_explicit_resolvers(hostname: str) -> str:
     """
     Resolve hostname using explicit resolvers (1.1.1.1, 8.8.8.8) first,
@@ -245,6 +250,19 @@ def check_task_app_health(base_url: str, api_key: str, *, timeout: float = 10.0,
     )
+def check_local_api_health(
+    base_url: str, api_key: str, *, timeout: float = 10.0, max_retries: int = 5
+) -> LocalAPIHealth:
+    """Alias for check_task_app_health with LocalAPI naming."""
+    health = check_task_app_health(base_url, api_key, timeout=timeout, max_retries=max_retries)
+    return LocalAPIHealth(
+        ok=health.ok,
+        health_status=health.health_status,
+        task_info_status=health.task_info_status,
+        detail=health.detail,
+    )
 @dataclass(slots=True)
 class ModalSecret:
     name: str
@@ -323,9 +341,11 @@ __all__ = [
     "ModalApp",
     "ModalSecret",
     "check_task_app_health",
+    "check_local_api_health",
     "format_modal_apps",
     "format_modal_secrets",
     "get_modal_secret_value",
     "list_modal_apps",
     "list_modal_secrets",
+    "LocalAPIHealth",
 ]

synth-ai 0.4.1__py3-none-any.whl → 0.4.4__py3-none-any.whl

Potentially problematic release.

synth-ai 0.4.1__py3-none-any.whl → 0.4.4__py3-none-any.whl