synth-ai 0.4.1__py3-none-any.whl → 0.4.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of synth-ai might be problematic.

Files changed (153)
  1. synth_ai/__init__.py +13 -13
  2. synth_ai/cli/__init__.py +6 -15
  3. synth_ai/cli/commands/eval/__init__.py +6 -15
  4. synth_ai/cli/commands/eval/config.py +338 -0
  5. synth_ai/cli/commands/eval/core.py +236 -1091
  6. synth_ai/cli/commands/eval/runner.py +704 -0
  7. synth_ai/cli/commands/eval/validation.py +44 -117
  8. synth_ai/cli/commands/filter/core.py +7 -7
  9. synth_ai/cli/commands/filter/validation.py +2 -2
  10. synth_ai/cli/commands/smoke/core.py +7 -17
  11. synth_ai/cli/commands/status/__init__.py +1 -64
  12. synth_ai/cli/commands/status/client.py +50 -151
  13. synth_ai/cli/commands/status/config.py +3 -83
  14. synth_ai/cli/commands/status/errors.py +4 -13
  15. synth_ai/cli/commands/status/subcommands/__init__.py +2 -8
  16. synth_ai/cli/commands/status/subcommands/config.py +13 -0
  17. synth_ai/cli/commands/status/subcommands/files.py +18 -63
  18. synth_ai/cli/commands/status/subcommands/jobs.py +28 -311
  19. synth_ai/cli/commands/status/subcommands/models.py +18 -62
  20. synth_ai/cli/commands/status/subcommands/runs.py +16 -63
  21. synth_ai/cli/commands/status/subcommands/session.py +67 -172
  22. synth_ai/cli/commands/status/subcommands/summary.py +24 -32
  23. synth_ai/cli/commands/status/subcommands/utils.py +41 -0
  24. synth_ai/cli/commands/status/utils.py +16 -107
  25. synth_ai/cli/commands/train/__init__.py +18 -20
  26. synth_ai/cli/commands/train/errors.py +3 -3
  27. synth_ai/cli/commands/train/prompt_learning_validation.py +15 -16
  28. synth_ai/cli/commands/train/validation.py +7 -7
  29. synth_ai/cli/commands/train/{judge_schemas.py → verifier_schemas.py} +33 -34
  30. synth_ai/cli/commands/train/verifier_validation.py +235 -0
  31. synth_ai/cli/demo_apps/demo_task_apps/math/config.toml +0 -1
  32. synth_ai/cli/demo_apps/demo_task_apps/math/modal_task_app.py +2 -6
  33. synth_ai/cli/demo_apps/math/config.toml +0 -1
  34. synth_ai/cli/demo_apps/math/modal_task_app.py +2 -6
  35. synth_ai/cli/demo_apps/mipro/task_app.py +25 -47
  36. synth_ai/cli/lib/apps/task_app.py +12 -13
  37. synth_ai/cli/lib/task_app_discovery.py +6 -6
  38. synth_ai/cli/lib/train_cfgs.py +10 -10
  39. synth_ai/cli/task_apps/__init__.py +11 -0
  40. synth_ai/cli/task_apps/commands.py +7 -15
  41. synth_ai/core/env.py +12 -1
  42. synth_ai/core/errors.py +1 -2
  43. synth_ai/core/integrations/cloudflare.py +209 -33
  44. synth_ai/core/tracing_v3/abstractions.py +46 -0
  45. synth_ai/data/__init__.py +3 -30
  46. synth_ai/data/enums.py +1 -20
  47. synth_ai/data/rewards.py +100 -3
  48. synth_ai/products/graph_evolve/__init__.py +1 -2
  49. synth_ai/products/graph_evolve/config.py +16 -16
  50. synth_ai/products/graph_evolve/converters/__init__.py +3 -3
  51. synth_ai/products/graph_evolve/converters/openai_sft.py +7 -7
  52. synth_ai/products/graph_evolve/examples/hotpotqa/config.toml +1 -1
  53. synth_ai/products/graph_gepa/__init__.py +23 -0
  54. synth_ai/products/graph_gepa/converters/__init__.py +19 -0
  55. synth_ai/products/graph_gepa/converters/openai_sft.py +29 -0
  56. synth_ai/sdk/__init__.py +45 -35
  57. synth_ai/sdk/api/eval/__init__.py +33 -0
  58. synth_ai/sdk/api/eval/job.py +732 -0
  59. synth_ai/sdk/api/research_agent/__init__.py +276 -66
  60. synth_ai/sdk/api/train/builders.py +181 -0
  61. synth_ai/sdk/api/train/cli.py +41 -33
  62. synth_ai/sdk/api/train/configs/__init__.py +6 -4
  63. synth_ai/sdk/api/train/configs/prompt_learning.py +127 -33
  64. synth_ai/sdk/api/train/configs/rl.py +264 -16
  65. synth_ai/sdk/api/train/configs/sft.py +165 -1
  66. synth_ai/sdk/api/train/graph_validators.py +12 -12
  67. synth_ai/sdk/api/train/graphgen.py +169 -51
  68. synth_ai/sdk/api/train/graphgen_models.py +95 -45
  69. synth_ai/sdk/api/train/local_api.py +10 -0
  70. synth_ai/sdk/api/train/pollers.py +36 -0
  71. synth_ai/sdk/api/train/prompt_learning.py +390 -60
  72. synth_ai/sdk/api/train/rl.py +41 -5
  73. synth_ai/sdk/api/train/sft.py +2 -0
  74. synth_ai/sdk/api/train/task_app.py +20 -0
  75. synth_ai/sdk/api/train/validators.py +17 -17
  76. synth_ai/sdk/graphs/completions.py +239 -33
  77. synth_ai/sdk/{judging/schemas.py → graphs/verifier_schemas.py} +23 -23
  78. synth_ai/sdk/learning/__init__.py +35 -5
  79. synth_ai/sdk/learning/context_learning_client.py +531 -0
  80. synth_ai/sdk/learning/context_learning_types.py +294 -0
  81. synth_ai/sdk/learning/prompt_learning_client.py +1 -1
  82. synth_ai/sdk/learning/prompt_learning_types.py +2 -1
  83. synth_ai/sdk/learning/rl/__init__.py +0 -4
  84. synth_ai/sdk/learning/rl/contracts.py +0 -4
  85. synth_ai/sdk/localapi/__init__.py +40 -0
  86. synth_ai/sdk/localapi/apps/__init__.py +28 -0
  87. synth_ai/sdk/localapi/client.py +10 -0
  88. synth_ai/sdk/localapi/contracts.py +10 -0
  89. synth_ai/sdk/localapi/helpers.py +519 -0
  90. synth_ai/sdk/localapi/rollouts.py +93 -0
  91. synth_ai/sdk/localapi/server.py +29 -0
  92. synth_ai/sdk/localapi/template.py +49 -0
  93. synth_ai/sdk/streaming/handlers.py +6 -6
  94. synth_ai/sdk/streaming/streamer.py +10 -6
  95. synth_ai/sdk/task/__init__.py +18 -5
  96. synth_ai/sdk/task/apps/__init__.py +37 -1
  97. synth_ai/sdk/task/client.py +9 -1
  98. synth_ai/sdk/task/config.py +6 -11
  99. synth_ai/sdk/task/contracts.py +137 -95
  100. synth_ai/sdk/task/in_process.py +32 -22
  101. synth_ai/sdk/task/in_process_runner.py +9 -4
  102. synth_ai/sdk/task/rubrics/__init__.py +2 -3
  103. synth_ai/sdk/task/rubrics/loaders.py +4 -4
  104. synth_ai/sdk/task/rubrics/strict.py +3 -4
  105. synth_ai/sdk/task/server.py +76 -16
  106. synth_ai/sdk/task/trace_correlation_helpers.py +190 -139
  107. synth_ai/sdk/task/validators.py +34 -49
  108. synth_ai/sdk/training/__init__.py +7 -16
  109. synth_ai/sdk/tunnels/__init__.py +118 -0
  110. synth_ai/sdk/tunnels/cleanup.py +83 -0
  111. synth_ai/sdk/tunnels/ports.py +120 -0
  112. synth_ai/sdk/tunnels/tunneled_api.py +363 -0
  113. {synth_ai-0.4.1.dist-info → synth_ai-0.4.4.dist-info}/METADATA +71 -4
  114. {synth_ai-0.4.1.dist-info → synth_ai-0.4.4.dist-info}/RECORD +118 -128
  115. synth_ai/cli/commands/baseline/__init__.py +0 -12
  116. synth_ai/cli/commands/baseline/core.py +0 -636
  117. synth_ai/cli/commands/baseline/list.py +0 -94
  118. synth_ai/cli/commands/eval/errors.py +0 -81
  119. synth_ai/cli/commands/status/formatters.py +0 -164
  120. synth_ai/cli/commands/status/subcommands/pricing.py +0 -23
  121. synth_ai/cli/commands/status/subcommands/usage.py +0 -203
  122. synth_ai/cli/commands/train/judge_validation.py +0 -305
  123. synth_ai/cli/usage.py +0 -159
  124. synth_ai/data/specs.py +0 -36
  125. synth_ai/sdk/api/research_agent/cli.py +0 -428
  126. synth_ai/sdk/api/research_agent/config.py +0 -357
  127. synth_ai/sdk/api/research_agent/job.py +0 -717
  128. synth_ai/sdk/baseline/__init__.py +0 -25
  129. synth_ai/sdk/baseline/config.py +0 -209
  130. synth_ai/sdk/baseline/discovery.py +0 -216
  131. synth_ai/sdk/baseline/execution.py +0 -154
  132. synth_ai/sdk/judging/__init__.py +0 -15
  133. synth_ai/sdk/judging/base.py +0 -24
  134. synth_ai/sdk/judging/client.py +0 -191
  135. synth_ai/sdk/judging/types.py +0 -42
  136. synth_ai/sdk/research_agent/__init__.py +0 -34
  137. synth_ai/sdk/research_agent/container_builder.py +0 -328
  138. synth_ai/sdk/research_agent/container_spec.py +0 -198
  139. synth_ai/sdk/research_agent/defaults.py +0 -34
  140. synth_ai/sdk/research_agent/results_collector.py +0 -69
  141. synth_ai/sdk/specs/__init__.py +0 -46
  142. synth_ai/sdk/specs/dataclasses.py +0 -149
  143. synth_ai/sdk/specs/loader.py +0 -144
  144. synth_ai/sdk/specs/serializer.py +0 -199
  145. synth_ai/sdk/specs/validation.py +0 -250
  146. synth_ai/sdk/tracing/__init__.py +0 -39
  147. synth_ai/sdk/usage/__init__.py +0 -37
  148. synth_ai/sdk/usage/client.py +0 -171
  149. synth_ai/sdk/usage/models.py +0 -261
  150. {synth_ai-0.4.1.dist-info → synth_ai-0.4.4.dist-info}/WHEEL +0 -0
  151. {synth_ai-0.4.1.dist-info → synth_ai-0.4.4.dist-info}/entry_points.txt +0 -0
  152. {synth_ai-0.4.1.dist-info → synth_ai-0.4.4.dist-info}/licenses/LICENSE +0 -0
  153. {synth_ai-0.4.1.dist-info → synth_ai-0.4.4.dist-info}/top_level.txt +0 -0
synth_ai/sdk/api/train/graphgen_models.py

@@ -1,8 +1,8 @@
-"""GraphGen (Automated Design of Agentic Systems) data models.
+"""GraphGen (Graph Opt) data models.
 
 This module provides Pydantic models for defining GraphGen datasets and job configurations.
 GraphGen is a simplified "Workflows API" for prompt optimization that wraps GEPA with
-auto-generated task apps and built-in judge configurations.
+auto-generated task apps and built-in verifier configurations.
 
 Example:
     from synth_ai.sdk.api.train.graphgen_models import (
@@ -11,6 +11,7 @@ Example:
         GraphGenGoldOutput,
         GraphGenRubric,
         GraphGenJobConfig,
+        GraphGenVerifierConfig,
     )
 
     # Create a dataset
@@ -24,7 +25,7 @@ Example:
             GraphGenGoldOutput(output={"answer": "4"}, task_id="task1"),
             GraphGenGoldOutput(output={"answer": "Paris"}, task_id="task2"),
         ],
-        judge_config=GraphGenJudgeConfig(mode="rubric"),
+        verifier_config=GraphGenVerifierConfig(mode="rubric"),
     )
 """
@@ -201,7 +202,7 @@ class GraphGenGoldOutput(BaseModel):
     """A gold/reference output.
 
     Can be linked to a specific task via task_id, or standalone (for reference examples).
-    Standalone gold outputs (no task_id) are used as reference pool for contrastive judging.
+    Standalone gold outputs (no task_id) are used as reference pool for contrastive verification.
     """
 
     output: Dict[str, Any] = Field(
@@ -217,16 +218,16 @@ class GraphGenGoldOutput(BaseModel):
 
 
 # Improvement 4: Define supported providers as a Literal type
-JudgeProviderType = Literal["groq", "openai", "google", "anthropic"]
+VerifierProviderType = Literal["groq", "openai", "google", "anthropic"]
 
 
-class GraphGenJudgeConfig(BaseModel):
-    """Configuration for the judge used during optimization."""
+class GraphGenVerifierConfig(BaseModel):
+    """Configuration for the verifier used during optimization."""
 
     mode: Literal["rubric", "contrastive", "gold_examples"] = Field(
         default="rubric",
         description=(
-            "Judge mode: "
+            "Verifier mode: "
             "'rubric' = evaluate against criteria, "
             "'contrastive' = compare to gold output, "
             "'gold_examples' = use gold examples as few-shot context"
@@ -234,12 +235,12 @@ class GraphGenJudgeConfig(BaseModel):
     )
     model: str = Field(
         default="llama-3.3-70b-versatile",
-        description="Model to use for judging",
+        description="Model to use for verification",
     )
     # Improvement 4: Changed from str to Literal type for better type safety
-    provider: JudgeProviderType = Field(
+    provider: VerifierProviderType = Field(
         default="groq",
-        description="Provider for judge model (groq, openai, google, anthropic)",
+        description="Provider for verifier model (groq, openai, google, anthropic)",
     )
 
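For 0.4.1 callers, the judge-to-verifier rename above is mechanical. A minimal sketch of the 0.4.4 surface, using only the fields and defaults visible in these hunks (the import path comes from the module docstring):

```python
# Sketch based on the fields shown in the hunks above; not an official recipe.
# 0.4.1 spelling was GraphGenJudgeConfig(mode=..., model=..., provider=...).
from synth_ai.sdk.api.train.graphgen_models import GraphGenVerifierConfig

verifier = GraphGenVerifierConfig(
    mode="contrastive",               # "rubric" (default) | "contrastive" | "gold_examples"
    model="llama-3.3-70b-versatile",  # default shown in the diff
    provider="groq",                  # Literal: "groq" | "openai" | "google" | "anthropic"
)
```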
@@ -247,7 +248,7 @@ class GraphGenTaskSet(BaseModel):
     """The complete GraphGen dataset format.
 
     Contains tasks with arbitrary JSON inputs, gold outputs (optionally linked to tasks),
-    rubrics (task-specific and/or default), and judge configuration.
+    rubrics (task-specific and/or default), and verifier configuration.
 
     Example:
         dataset = GraphGenTaskSet(
@@ -274,9 +275,9 @@ class GraphGenTaskSet(BaseModel):
         default=None,
         description="Default rubric applied to all tasks (merged with task-specific rubrics)",
     )
-    judge_config: GraphGenJudgeConfig = Field(
-        default_factory=GraphGenJudgeConfig,
-        description="Configuration for the judge",
+    verifier_config: GraphGenVerifierConfig = Field(
+        default_factory=GraphGenVerifierConfig,
+        description="Configuration for the verifier",
     )
     # Optional schemas (also accepted at top-level for backward/forward compatibility).
     input_schema: Optional[Dict[str, Any]] = Field(
@@ -417,7 +418,7 @@ class GraphGenTaskSet(BaseModel):
         return None
 
     def get_standalone_gold_outputs(self) -> List[GraphGenGoldOutput]:
-        """Get gold outputs not linked to any task (reference pool for contrastive judge)."""
+        """Get gold outputs not linked to any task (reference pool for contrastive verifier)."""
         return [gold for gold in self.gold_outputs if gold.task_id is None]
 
 
@@ -445,8 +446,8 @@ SUPPORTED_POLICY_MODELS = {
     "claude-3-5-haiku-latest",
 }
 
-# Supported judge models
-SUPPORTED_JUDGE_MODELS = {
+# Supported verifier models
+SUPPORTED_VERIFIER_MODELS = {
     # Groq (fast, cheap)
     "llama-3.3-70b-versatile",
     "llama-3.1-70b-versatile",
@@ -457,8 +458,8 @@ SUPPORTED_JUDGE_MODELS = {
 
 # Default models
 DEFAULT_POLICY_MODEL = "gpt-4o-mini"
-DEFAULT_JUDGE_MODEL = "llama-3.3-70b-versatile"
-DEFAULT_JUDGE_PROVIDER = "groq"
+DEFAULT_VERIFIER_MODEL = "llama-3.3-70b-versatile"
+DEFAULT_VERIFIER_PROVIDER = "groq"
 
 
 class EventInput(BaseModel):
@@ -484,7 +485,7 @@ class SessionTimeStepInput(BaseModel):
 
 
 class SessionTraceInput(BaseModel):
-    """V3-compatible session trace input for judge evaluation."""
+    """V3-compatible session trace input for verifier evaluation."""
 
     model_config = ConfigDict(extra="allow")
 
@@ -505,7 +506,7 @@ class SessionTraceInput(BaseModel):
         return data
 
 
-class GraphGenGraphJudgeRequest(BaseModel):
+class GraphGenGraphVerifierRequest(BaseModel):
     """Request for verifier graph inference."""
 
     model_config = ConfigDict(extra="forbid")
@@ -576,7 +577,7 @@ class OutcomeRewardResponse(BaseModel):
     annotation: Optional[Dict[str, Any]] = Field(default=None, description="Additional annotations (free-form)")
 
 
-class GraphGenGraphJudgeResponse(BaseModel):
+class GraphGenGraphVerifierResponse(BaseModel):
     """Response from verifier graph inference."""
 
     started_at: datetime = Field(..., description="When inference request started (UTC)")
@@ -589,32 +590,81 @@ class GraphGenGraphJudgeResponse(BaseModel):
     event_rewards: List[EventRewardResponse] = Field(default_factory=list, description="Per-event rewards")
     outcome_reward: Optional[OutcomeRewardResponse] = Field(default=None, description="Episode-level outcome reward")
 
-    # Legacy fields (kept for backward compatibility)
-    score: float = Field(..., ge=0.0, le=1.0, description="Evaluation score (0-1)")
-    reasoning: Optional[str] = Field(default=None, description="Explanation for the score")
-    sub_scores: Optional[Dict[str, float]] = Field(default=None, description="Breakdown scores by criteria")
     raw_output: Optional[Dict[str, Any]] = Field(default=None, description="Full raw output from the verifier graph")
 
     usage: List[GraphGenGraphCompletionsModelUsage] = Field(default_factory=list, description="Token usage per model")
 
 
-class GraphGenGraphVerifierRequest(GraphGenGraphJudgeRequest):
-    """Alias for GraphGenGraphJudgeRequest with verifier terminology."""
-
-
-class GraphGenGraphVerifierResponse(GraphGenGraphJudgeResponse):
-    """Alias for GraphGenGraphJudgeResponse with verifier terminology."""
 
 
 class GraphGenJobConfig(BaseModel):
-    """Configuration for an GraphGen optimization job.
+    """Configuration for a GraphGen (Graph Opt) optimization job.
+
+    GraphGen provides a simplified API for training optimized graphs/workflows without
+    managing task apps manually. It supports three graph types:
+    - **policy**: Standard input-to-output graphs for classification, QA, generation
+    - **verifier**: Trace-to-score graphs for verifying/evaluating agent behavior
+    - **rlm**: Recursive Language Model graphs for massive contexts via tool-based search
 
     Example:
+        ```python
+        from synth_ai.sdk.api.train.graphgen_models import GraphGenJobConfig
+
         config = GraphGenJobConfig(
+            graph_type="policy",
             policy_model="gpt-4o-mini",
             rollout_budget=100,
             proposer_effort="medium",
+            problem_spec="Classify customer support messages into categories.",
         )
+        ```
+
+    Attributes:
+        graph_type: Type of graph - "policy", "verifier", or "rlm".
+        policy_model: Model for policy inference (e.g., "gpt-4o-mini", "claude-3-5-sonnet").
+        policy_provider: Provider for policy model (auto-detected if not specified).
+        rollout_budget: Total rollouts (evaluations) for optimization. Range: 10-10000.
+        proposer_effort: Mutation quality/cost level - "medium" or "high".
+            Note: "low" is not allowed (gpt-4.1-mini too weak for graph generation).
+        verifier_model: Override verifier model from dataset.
+        verifier_provider: Override verifier provider from dataset.
+        population_size: GEPA population size. Range: 2-20. Default: 4.
+        num_generations: Number of generations (auto-calculated from budget if not specified).
+        num_parents: Number of parents for selection. Range: 1-10. Default: 2.
+        evaluation_seeds: Specific seeds for evaluation (auto-generated if not specified).
+        problem_spec: Detailed problem specification for the graph proposer.
+            Include domain info like valid output labels, constraints, format requirements.
+        target_llm_calls: Target LLM calls per graph run (1-10). Default: 5.
+        configured_tools: Tool bindings for RLM graphs. Required for graph_type="rlm".
+
+    Returns:
+        After training completes via GraphGenJob, you receive a result dict:
+        ```python
+        {
+            "status": "succeeded",
+            "graphgen_job_id": "graphgen_abc123",
+            "best_score": 0.89,
+            "best_snapshot_id": "snap_xyz789",
+            "dataset_name": "My Classification Tasks",
+            "task_count": 50,
+        }
+        ```
+
+    Events:
+        During training, you'll receive streaming events via GraphGenJob.stream_until_complete():
+        - `graphgen.created` - Job created
+        - `graphgen.running` - Training started
+        - `graphgen.generation.started` - New generation of candidates started
+        - `graphgen.candidate.evaluated` - A candidate graph was evaluated
+        - `graphgen.generation.completed` - Generation finished with metrics
+        - `graphgen.optimization.completed` - Training finished successfully
+        - `graphgen.failed` - Job encountered an error
+
+    See Also:
+        - GraphGenJob: High-level SDK class for running jobs
+        - GraphGenTaskSet: Dataset format for tasks and gold outputs
+        - Training reference: /training/graph-evolve
+        - Quickstart: /quickstart/graph-evolve
     """
 
     # Graph type
@@ -656,14 +706,14 @@ class GraphGenJobConfig(BaseModel):
         ),
     )
 
-    # Judge settings (if not specified in dataset)
-    judge_model: Optional[str] = Field(
+    # Verifier settings (if not specified in dataset)
+    verifier_model: Optional[str] = Field(
         default=None,
-        description="Override judge model from dataset",
+        description="Override verifier model from dataset",
     )
-    judge_provider: Optional[str] = Field(
+    verifier_provider: Optional[str] = Field(
         default=None,
-        description="Override judge provider from dataset",
+        description="Override verifier provider from dataset",
     )
 
     # Advanced settings
@@ -792,7 +842,7 @@ GraphGenRubric = GraphGenRubric
 GraphGenRubricCriterion = GraphGenRubricCriterion
 GraphGenRubricOutcome = GraphGenRubricOutcome
 GraphGenRubricEvents = GraphGenRubricEvents
-GraphGenJudgeConfig = GraphGenJudgeConfig
+GraphGenVerifierConfig = GraphGenVerifierConfig
 GraphGenJobConfig = GraphGenJobConfig
 parse_graphgen_taskset = parse_graphgen_taskset
 load_graphgen_taskset = load_graphgen_taskset
@@ -800,7 +850,7 @@ load_graphgen_taskset = load_graphgen_taskset
 __all__ = [
     # Core types (new)
     "OutputConfig",
-    "JudgeProviderType",
+    "VerifierProviderType",
     # GraphGen names (preferred)
     "GraphGenTaskSet",
     "GraphGenTaskSetMetadata",
@@ -810,14 +860,14 @@ __all__ = [
     "GraphGenRubricCriterion",
     "GraphGenRubricOutcome",
     "GraphGenRubricEvents",
-    "GraphGenJudgeConfig",
+    "GraphGenVerifierConfig",
     "GraphGenJobConfig",
     "parse_graphgen_taskset",
     "load_graphgen_taskset",
     # Constants
     "SUPPORTED_POLICY_MODELS",
-    "SUPPORTED_JUDGE_MODELS",
+    "SUPPORTED_VERIFIER_MODELS",
     "DEFAULT_POLICY_MODEL",
-    "DEFAULT_JUDGE_MODEL",
-    "DEFAULT_JUDGE_PROVIDER",
+    "DEFAULT_VERIFIER_MODEL",
+    "DEFAULT_VERIFIER_PROVIDER",
 ]
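Taken together, the graphgen_models.py hunks are a rename plus a cleanup: the judge-named symbols are gone with no aliases left behind, and GraphGenGraphVerifierResponse drops the legacy score/reasoning/sub_scores fields in favor of event_rewards and outcome_reward. A hedged migration sketch, using only names that appear in these hunks:

```python
# 0.4.1 -> 0.4.4 rename map (all names taken from the hunks above):
#   GraphGenJudgeConfig          -> GraphGenVerifierConfig
#   judge_config=                -> verifier_config=
#   judge_model / judge_provider -> verifier_model / verifier_provider
#   JudgeProviderType            -> VerifierProviderType
#   SUPPORTED_JUDGE_MODELS       -> SUPPORTED_VERIFIER_MODELS
#   DEFAULT_JUDGE_MODEL/PROVIDER -> DEFAULT_VERIFIER_MODEL/PROVIDER
from synth_ai.sdk.api.train.graphgen_models import GraphGenJobConfig

config = GraphGenJobConfig(
    graph_type="policy",
    policy_model="gpt-4o-mini",
    rollout_budget=100,
    proposer_effort="medium",
    verifier_model="llama-3.3-70b-versatile",  # 0.4.1: judge_model
    verifier_provider="groq",                  # 0.4.1: judge_provider
    problem_spec="Classify customer support messages into categories.",
)
```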
synth_ai/sdk/api/train/local_api.py (new file)

@@ -0,0 +1,10 @@
+"""LocalAPI health helpers.
+
+Prefer this module over synth_ai.sdk.api.train.task_app for LocalAPI naming.
+"""
+
+from __future__ import annotations
+
+from synth_ai.sdk.api.train.task_app import LocalAPIHealth, check_local_api_health
+
+__all__ = ["LocalAPIHealth", "check_local_api_health"]
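The new module is a two-name re-export. A usage sketch, assuming this is the ten-line synth_ai/sdk/api/train/local_api.py file from the list above; the signature of check_local_api_health lives in synth_ai.sdk.api.train.task_app and is not part of this diff, so the argument below is illustrative only:

```python
from synth_ai.sdk.api.train.local_api import LocalAPIHealth, check_local_api_health

# Illustrative call; consult synth_ai.sdk.api.train.task_app for the real signature.
health: LocalAPIHealth = check_local_api_health("http://127.0.0.1:8000")
```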
synth_ai/sdk/api/train/pollers.py

@@ -116,9 +116,45 @@ class PromptLearningJobPoller(JobPoller):
         return super().poll(f"/api/prompt-learning/online/jobs/{job_id}")
 
 
+class EvalJobPoller(JobPoller):
+    """Poller for evaluation jobs.
+
+    Polls the backend eval job API to check job status until completion.
+
+    Example:
+        >>> poller = EvalJobPoller(
+        ...     base_url="https://api.usesynth.ai",
+        ...     api_key="sk_live_...",
+        ...     interval=2.0,
+        ...     timeout=1200.0,
+        ... )
+        >>> outcome = poller.poll_job("eval-abc123")
+        >>> if outcome.status == "completed":
+        ...     print(outcome.payload)
+
+    See Also:
+        - `synth_ai.sdk.api.eval.EvalJob`: High-level eval job API
+        - Backend API: GET /api/eval/jobs/{job_id}
+    """
+
+    def poll_job(self, job_id: str) -> PollOutcome:
+        """Poll an eval job by ID.
+
+        Args:
+            job_id: Job ID (e.g., "eval-abc123")
+
+        Returns:
+            PollOutcome with status and payload
+        """
+        ctx: dict[str, Any] = {"job_id": job_id, "job_type": "eval"}
+        log_info("EvalJobPoller.poll_job invoked", ctx=ctx)
+        return super().poll(f"/api/eval/jobs/{job_id}")
+
+
 __all__ = [
     "PollOutcome",
     "RLJobPoller",
     "SFTJobPoller",
     "PromptLearningJobPoller",
+    "EvalJobPoller",
 ]