PyPI - synth-ai - Versions diffs - 0.2.16__py3-none-any.whl → 0.2.19__py3-none-any.whl - Mend

synth-ai 0.2.16-py3-none-any.whl → 0.2.19-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of synth-ai might be problematic. Click here for more details.

Files changed (299) hide show

examples/analyze_semantic_words.sh +2 -2
examples/baseline/banking77_baseline.py +204 -0
examples/baseline/crafter_baseline.py +407 -0
examples/baseline/pokemon_red_baseline.py +326 -0
examples/baseline/simple_baseline.py +56 -0
examples/baseline/warming_up_to_rl_baseline.py +239 -0
examples/blog_posts/gepa/README.md +355 -0
examples/blog_posts/gepa/configs/banking77_gepa_local.toml +95 -0
examples/blog_posts/gepa/configs/banking77_gepa_test.toml +82 -0
examples/blog_posts/gepa/configs/banking77_mipro_local.toml +52 -0
examples/blog_posts/gepa/configs/hotpotqa_gepa_local.toml +59 -0
examples/blog_posts/gepa/configs/hotpotqa_gepa_qwen.toml +36 -0
examples/blog_posts/gepa/configs/hotpotqa_mipro_local.toml +53 -0
examples/blog_posts/gepa/configs/hover_gepa_local.toml +59 -0
examples/blog_posts/gepa/configs/hover_gepa_qwen.toml +36 -0
examples/blog_posts/gepa/configs/hover_mipro_local.toml +53 -0
examples/blog_posts/gepa/configs/ifbench_gepa_local.toml +59 -0
examples/blog_posts/gepa/configs/ifbench_gepa_qwen.toml +36 -0
examples/blog_posts/gepa/configs/ifbench_mipro_local.toml +53 -0
examples/blog_posts/gepa/configs/pupa_gepa_local.toml +60 -0
examples/blog_posts/gepa/configs/pupa_mipro_local.toml +54 -0
examples/blog_posts/gepa/deploy_banking77_task_app.sh +41 -0
examples/blog_posts/gepa/gepa_baseline.py +204 -0
examples/blog_posts/gepa/query_prompts_example.py +97 -0
examples/blog_posts/gepa/run_gepa_banking77.sh +87 -0
examples/blog_posts/gepa/task_apps.py +105 -0
examples/blog_posts/gepa/test_gepa_local.sh +67 -0
examples/blog_posts/gepa/verify_banking77_setup.sh +123 -0
examples/blog_posts/pokemon_vl/README.md +98 -0
examples/blog_posts/pokemon_vl/configs/eval_gpt5nano.toml +26 -0
examples/blog_posts/pokemon_vl/configs/eval_qwen3_vl.toml +27 -0
examples/blog_posts/pokemon_vl/configs/eval_rl_final.toml +24 -0
examples/blog_posts/pokemon_vl/configs/filter_high_reward.toml +10 -0
examples/blog_posts/pokemon_vl/configs/train_rl_from_sft.toml +43 -0
examples/blog_posts/pokemon_vl/configs/train_sft_qwen4b_vl.toml +40 -0
examples/blog_posts/pokemon_vl/extract_images.py +239 -0
examples/blog_posts/pokemon_vl/pokemon_vl_baseline.py +326 -0
examples/blog_posts/pokemon_vl/run_eval_extract_images.py +209 -0
examples/blog_posts/pokemon_vl/run_qwen_eval_extract_images.py +212 -0
examples/blog_posts/pokemon_vl/text_box_analysis.md +106 -0
examples/blog_posts/warming_up_to_rl/ARCHITECTURE.md +195 -0
examples/blog_posts/warming_up_to_rl/FINAL_TEST_RESULTS.md +127 -0
examples/blog_posts/warming_up_to_rl/INFERENCE_SUCCESS.md +132 -0
examples/blog_posts/warming_up_to_rl/README.md +158 -0
examples/blog_posts/warming_up_to_rl/SMOKE_TESTING.md +164 -0
examples/blog_posts/warming_up_to_rl/SMOKE_TEST_COMPLETE.md +253 -0
examples/blog_posts/warming_up_to_rl/configs/eval_baseline_qwen32b_10x20.toml +25 -0
examples/blog_posts/warming_up_to_rl/configs/eval_ft_qwen4b.toml +25 -0
examples/blog_posts/warming_up_to_rl/configs/eval_ft_qwen4b_10x20.toml +26 -0
examples/blog_posts/warming_up_to_rl/configs/eval_groq_qwen32b.toml +25 -0
examples/blog_posts/warming_up_to_rl/configs/eval_openai_gpt_oss_120b.toml +29 -0
examples/blog_posts/warming_up_to_rl/configs/filter_high_reward_dataset.toml +10 -0
examples/blog_posts/warming_up_to_rl/configs/smoke_test.toml +75 -0
examples/blog_posts/warming_up_to_rl/configs/train_rl_from_sft.toml +91 -0
examples/blog_posts/warming_up_to_rl/configs/train_sft_qwen4b.toml +40 -0
examples/blog_posts/warming_up_to_rl/warming_up_to_rl_baseline.py +187 -0
examples/dev/qwen3_32b_qlora_4xh100.toml +5 -0
examples/multi_step/configs/VERILOG_REWARDS.md +4 -0
examples/multi_step/configs/VERILOG_RL_CHECKLIST.md +4 -0
examples/multi_step/configs/crafter_rl_outcome.toml +2 -1
examples/multi_step/configs/crafter_rl_stepwise_hosted_judge.toml +65 -107
examples/multi_step/configs/crafter_rl_stepwise_shaped.toml +2 -1
examples/multi_step/configs/crafter_rl_stepwise_simple.toml +2 -1
examples/multi_step/configs/crafter_rl_stepwise_simple_NEW_FORMAT.toml +105 -0
examples/multi_step/configs/verilog_rl_lora.toml +80 -123
examples/qwen_coder/configs/coder_lora_30b.toml +1 -3
examples/qwen_coder/configs/coder_lora_4b.toml +4 -1
examples/qwen_coder/configs/coder_lora_small.toml +1 -3
examples/qwen_vl/README.md +10 -12
examples/qwen_vl/SETUP_COMPLETE.md +7 -8
examples/qwen_vl/VISION_TESTS_COMPLETE.md +2 -3
examples/qwen_vl/collect_data_via_cli.md +76 -84
examples/qwen_vl/collect_vision_traces.py +4 -4
examples/qwen_vl/configs/crafter_rl_vision_qwen3vl4b.toml +40 -57
examples/qwen_vl/configs/crafter_vlm_sft_example.toml +1 -2
examples/qwen_vl/configs/eval_gpt4o_mini_vision.toml +20 -37
examples/qwen_vl/configs/eval_gpt5nano_vision.toml +21 -40
examples/qwen_vl/configs/eval_qwen3vl_vision.toml +26 -0
examples/qwen_vl/configs/{filter_qwen2vl_sft.toml → filter_qwen3vl_sft.toml} +4 -5
examples/qwen_vl/configs/filter_vision_sft.toml +2 -3
examples/qwen_vl/crafter_qwen_vl_agent.py +5 -5
examples/qwen_vl/run_vision_comparison.sh +6 -7
examples/rl/README.md +5 -5
examples/rl/configs/rl_from_base_qwen.toml +26 -1
examples/rl/configs/rl_from_base_qwen17.toml +6 -2
examples/rl/task_app/README.md +1 -2
examples/rl/task_app/math_single_step.py +2 -2
examples/run_crafter_demo.sh +2 -2
examples/sft/README.md +1 -1
examples/sft/configs/crafter_fft_qwen0p6b.toml +4 -1
examples/sft/configs/crafter_lora_qwen0p6b.toml +4 -1
examples/swe/task_app/README.md +32 -2
examples/swe/task_app/grpo_swe_mini.py +4 -0
examples/swe/task_app/hosted/envs/crafter/react_agent.py +1 -1
examples/swe/task_app/hosted/envs/mini_swe/environment.py +37 -10
examples/swe/task_app/hosted/inference/openai_client.py +4 -38
examples/swe/task_app/hosted/policy_routes.py +17 -0
examples/swe/task_app/hosted/rollout.py +4 -2
examples/swe/task_app/morph_backend.py +178 -0
examples/task_apps/banking77/__init__.py +6 -0
examples/task_apps/banking77/banking77_task_app.py +841 -0
examples/task_apps/banking77/deploy_wrapper.py +46 -0
examples/task_apps/crafter/CREATE_SFT_DATASET.md +4 -0
examples/task_apps/crafter/FILTER_COMMAND_STATUS.md +4 -0
examples/task_apps/crafter/FILTER_COMMAND_SUCCESS.md +4 -0
examples/task_apps/crafter/task_app/README.md +1 -1
examples/task_apps/crafter/task_app/grpo_crafter.py +90 -5
examples/task_apps/crafter/task_app/grpo_crafter_task_app.py +1 -1
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/crafter/policy.py +4 -26
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/crafter/react_agent.py +1 -2
examples/task_apps/crafter/task_app/synth_envs_hosted/hosted_app.py +49 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/inference/openai_client.py +372 -107
examples/task_apps/crafter/task_app/synth_envs_hosted/policy_routes.py +81 -12
examples/task_apps/crafter/task_app/synth_envs_hosted/rollout.py +82 -11
examples/task_apps/crafter/task_app/synth_envs_hosted/utils.py +194 -1
examples/task_apps/enron/task_app/grpo_enron_task_app.py +1 -1
examples/task_apps/gepa_benchmarks/__init__.py +7 -0
examples/task_apps/gepa_benchmarks/common.py +260 -0
examples/task_apps/gepa_benchmarks/hotpotqa_task_app.py +507 -0
examples/task_apps/gepa_benchmarks/hover_task_app.py +436 -0
examples/task_apps/gepa_benchmarks/ifbench_task_app.py +563 -0
examples/task_apps/gepa_benchmarks/pupa_task_app.py +460 -0
examples/task_apps/math/README.md +1 -2
examples/task_apps/pokemon_red/README.md +3 -4
examples/task_apps/pokemon_red/README_IMAGE_ONLY_EVAL.md +4 -0
examples/task_apps/pokemon_red/eval_image_only_gpt4o.toml +6 -5
examples/task_apps/pokemon_red/eval_pokemon_red_policy.py +1 -2
examples/task_apps/pokemon_red/task_app.py +288 -39
examples/task_apps/sokoban/README.md +2 -3
examples/task_apps/verilog/eval_groq_qwen32b.toml +12 -14
examples/task_apps/verilog/task_app/grpo_verilog_task_app.py +1 -1
examples/vlm/configs/crafter_vlm_gpt4o.toml +4 -1
examples/warming_up_to_rl/configs/crafter_fft.toml +4 -1
examples/warming_up_to_rl/configs/crafter_fft_4b.toml +0 -2
examples/warming_up_to_rl/configs/rl_from_base_qwen4b.toml +3 -2
examples/warming_up_to_rl/run_local_rollout_traced.py +1 -1
examples/warming_up_to_rl/task_app/README.md +1 -1
examples/warming_up_to_rl/task_app/grpo_crafter.py +185 -5
examples/warming_up_to_rl/task_app/grpo_crafter_task_app.py +1 -1
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/policy.py +3 -27
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/react_agent.py +1 -1
examples/warming_up_to_rl/task_app/synth_envs_hosted/hosted_app.py +49 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/openai_client.py +156 -45
examples/warming_up_to_rl/task_app/synth_envs_hosted/policy_routes.py +37 -4
examples/warming_up_to_rl/task_app/synth_envs_hosted/rollout.py +33 -3
examples/warming_up_to_rl/task_app/synth_envs_hosted/utils.py +67 -0
examples/workflows/math_rl/configs/rl_from_base_qwen.toml +27 -0
examples/workflows/math_rl/configs/rl_from_base_qwen17.toml +6 -0
synth_ai/api/train/builders.py +99 -4
synth_ai/api/train/cli.py +516 -26
synth_ai/api/train/config_finder.py +13 -2
synth_ai/api/train/configs/__init__.py +23 -2
synth_ai/api/train/configs/prompt_learning.py +442 -0
synth_ai/api/train/configs/rl.py +61 -7
synth_ai/api/train/configs/sft.py +6 -2
synth_ai/api/train/configs/shared.py +59 -2
synth_ai/api/train/task_app.py +1 -1
synth_ai/api/train/validators.py +277 -0
synth_ai/auth/credentials.py +119 -0
synth_ai/baseline/__init__.py +25 -0
synth_ai/baseline/config.py +209 -0
synth_ai/baseline/discovery.py +214 -0
synth_ai/baseline/execution.py +146 -0
synth_ai/cli/__init__.py +94 -18
synth_ai/cli/__main__.py +0 -0
synth_ai/cli/claude.py +70 -0
synth_ai/cli/codex.py +84 -0
synth_ai/cli/commands/__init__.py +18 -0
synth_ai/cli/commands/baseline/__init__.py +12 -0
synth_ai/cli/commands/baseline/core.py +637 -0
synth_ai/cli/commands/baseline/list.py +93 -0
synth_ai/cli/commands/demo/__init__.py +6 -0
synth_ai/cli/commands/demo/core.py +163 -0
synth_ai/cli/commands/eval/__init__.py +19 -0
synth_ai/cli/commands/eval/core.py +1112 -0
synth_ai/cli/commands/eval/errors.py +81 -0
synth_ai/cli/commands/eval/validation.py +133 -0
synth_ai/cli/commands/filter/__init__.py +12 -0
synth_ai/cli/commands/filter/core.py +424 -0
synth_ai/cli/commands/filter/errors.py +55 -0
synth_ai/cli/commands/filter/validation.py +77 -0
synth_ai/cli/commands/help/__init__.py +177 -0
synth_ai/cli/commands/help/core.py +72 -0
synth_ai/cli/commands/smoke/__init__.py +7 -0
synth_ai/cli/commands/smoke/core.py +1436 -0
synth_ai/cli/commands/status/__init__.py +64 -0
synth_ai/cli/commands/status/client.py +192 -0
synth_ai/cli/commands/status/config.py +92 -0
synth_ai/cli/commands/status/errors.py +20 -0
synth_ai/cli/commands/status/formatters.py +164 -0
synth_ai/cli/commands/status/subcommands/__init__.py +9 -0
synth_ai/cli/commands/status/subcommands/files.py +79 -0
synth_ai/cli/commands/status/subcommands/jobs.py +334 -0
synth_ai/cli/commands/status/subcommands/models.py +79 -0
synth_ai/cli/commands/status/subcommands/pricing.py +22 -0
synth_ai/cli/commands/status/subcommands/runs.py +81 -0
synth_ai/cli/commands/status/subcommands/summary.py +47 -0
synth_ai/cli/commands/status/subcommands/usage.py +203 -0
synth_ai/cli/commands/status/utils.py +114 -0
synth_ai/cli/commands/train/__init__.py +53 -0
synth_ai/cli/commands/train/core.py +21 -0
synth_ai/cli/commands/train/errors.py +117 -0
synth_ai/cli/commands/train/judge_schemas.py +200 -0
synth_ai/cli/commands/train/judge_validation.py +305 -0
synth_ai/cli/commands/train/validation.py +386 -0
synth_ai/cli/demo.py +30 -158
synth_ai/cli/deploy/__init__.py +43 -0
synth_ai/cli/deploy.py +162 -0
synth_ai/cli/eval/__init__.py +36 -0
synth_ai/cli/eval/core.py +5 -0
synth_ai/cli/eval/errors.py +31 -0
synth_ai/cli/eval/validation.py +5 -0
synth_ai/cli/filter/__init__.py +28 -0
synth_ai/cli/filter/core.py +5 -0
synth_ai/cli/filter/errors.py +23 -0
synth_ai/cli/filter/validation.py +5 -0
synth_ai/cli/legacy_root_backup.py +14 -8
synth_ai/cli/modal_serve/__init__.py +12 -0
synth_ai/cli/modal_serve/core.py +14 -0
synth_ai/cli/modal_serve/errors.py +8 -0
synth_ai/cli/modal_serve/validation.py +11 -0
synth_ai/cli/opencode.py +107 -0
synth_ai/cli/root.py +9 -5
synth_ai/cli/serve/__init__.py +12 -0
synth_ai/cli/serve/core.py +14 -0
synth_ai/cli/serve/errors.py +8 -0
synth_ai/cli/serve/validation.py +11 -0
synth_ai/cli/setup.py +20 -265
synth_ai/cli/status.py +7 -126
synth_ai/cli/task_app_deploy.py +1 -10
synth_ai/cli/task_app_modal_serve.py +4 -9
synth_ai/cli/task_app_serve.py +4 -11
synth_ai/cli/task_apps.py +51 -1480
synth_ai/cli/train/__init__.py +12 -0
synth_ai/cli/train/core.py +21 -0
synth_ai/cli/train/errors.py +8 -0
synth_ai/cli/train/validation.py +24 -0
synth_ai/cli/train.py +1 -14
synth_ai/demos/crafter/grpo_crafter_task_app.py +1 -1
synth_ai/demos/demo_task_apps/crafter/grpo_crafter_task_app.py +1 -1
synth_ai/environments/examples/crafter_classic/engine_deterministic_patch.py +7 -4
synth_ai/environments/examples/crafter_classic/engine_serialization_patch_v3.py +9 -5
synth_ai/environments/examples/crafter_classic/world_config_patch_simple.py +4 -3
synth_ai/environments/examples/red/engine.py +33 -12
synth_ai/environments/examples/red/engine_helpers/reward_components.py +151 -179
synth_ai/environments/examples/red/environment.py +26 -0
synth_ai/environments/examples/red/trace_hooks_v3.py +168 -0
synth_ai/http.py +12 -0
synth_ai/judge_schemas.py +10 -10
synth_ai/learning/__init__.py +10 -0
synth_ai/learning/prompt_learning_client.py +276 -0
synth_ai/learning/prompt_learning_types.py +184 -0
synth_ai/learning/rl/client.py +3 -1
synth_ai/pricing/__init__.py +2 -0
synth_ai/pricing/model_pricing.py +57 -0
synth_ai/streaming/__init__.py +29 -0
synth_ai/streaming/config.py +94 -0
synth_ai/streaming/handlers.py +518 -0
synth_ai/streaming/streamer.py +320 -0
synth_ai/streaming/types.py +95 -0
synth_ai/task/apps/__init__.py +1 -0
synth_ai/task/config.py +2 -0
synth_ai/task/tracing_utils.py +25 -25
synth_ai/task/validators.py +45 -9
synth_ai/task_app_cfgs.py +21 -0
synth_ai/tracing_v3/config.py +162 -19
synth_ai/tracing_v3/constants.py +1 -1
synth_ai/tracing_v3/db_config.py +24 -38
synth_ai/tracing_v3/migration_helper.py +1 -2
synth_ai/tracing_v3/storage/config.py +47 -13
synth_ai/tracing_v3/storage/factory.py +3 -3
synth_ai/tracing_v3/turso/daemon.py +113 -11
synth_ai/tracing_v3/turso/native_manager.py +92 -16
synth_ai/types.py +8 -0
synth_ai/urls.py +11 -0
synth_ai/utils/__init__.py +30 -1
synth_ai/utils/agents.py +74 -0
synth_ai/utils/bin.py +39 -0
synth_ai/utils/cli.py +149 -5
synth_ai/utils/env.py +40 -33
synth_ai/utils/http.py +4 -1
synth_ai/utils/json.py +72 -0
synth_ai/utils/modal.py +285 -3
synth_ai/utils/paths.py +48 -0
synth_ai/utils/uvicorn.py +113 -0
{synth_ai-0.2.16.dist-info → synth_ai-0.2.19.dist-info}/METADATA +109 -6
{synth_ai-0.2.16.dist-info → synth_ai-0.2.19.dist-info}/RECORD +291 -142
examples/qwen_vl/configs/eval_qwen2vl_vision.toml +0 -44
synth_ai/cli/tui.py +0 -62
synth_ai/tui/__init__.py +0 -5
synth_ai/tui/__main__.py +0 -13
synth_ai/tui/cli/__init__.py +0 -1
synth_ai/tui/cli/query_experiments.py +0 -164
synth_ai/tui/cli/query_experiments_v3.py +0 -164
synth_ai/tui/dashboard.py +0 -911
{synth_ai-0.2.16.dist-info → synth_ai-0.2.19.dist-info}/WHEEL +0 -0
{synth_ai-0.2.16.dist-info → synth_ai-0.2.19.dist-info}/entry_points.txt +0 -0
{synth_ai-0.2.16.dist-info → synth_ai-0.2.19.dist-info}/licenses/LICENSE +0 -0
{synth_ai-0.2.16.dist-info → synth_ai-0.2.19.dist-info}/top_level.txt +0 -0

synth_ai/cli/commands/train/validation.py ADDED Viewed

@@ -0,0 +1,386 @@
+"""TOML validation logic for train commands (SFT and RL)."""
+from collections.abc import MutableMapping
+from pathlib import Path
+from typing import Any
+from pydantic import ValidationError
+from synth_ai.api.train.configs.rl import RLConfig
+from synth_ai.api.train.configs.sft import SFTConfig
+from synth_ai.api.train.utils import load_toml
+from .errors import (
+    InvalidJudgeConfigError,
+    InvalidRLConfigError,
+    InvalidRubricConfigError,
+    InvalidSFTConfigError,
+    MissingAlgorithmError,
+    MissingComputeError,
+    MissingDatasetError,
+    MissingModelError,
+    TomlParseError,
+    UnsupportedAlgorithmError,
+)
+from .judge_validation import extract_and_validate_judge_rubric
+__all__ = [
+    "validate_sft_config",
+    "validate_rl_config",
+    "load_and_validate_sft",
+    "load_and_validate_rl",
+]
+def validate_sft_config(config: MutableMapping[str, Any]) -> dict[str, Any]:
+    """Validate SFT configuration from TOML.
+    Runs explicit presence checks on the raw mapping first (so the user gets a
+    targeted error), then hands the mapping to ``SFTConfig.from_mapping`` for
+    schema validation and returns the result of ``to_dict()``.
+    Args:
+        config: Raw configuration dictionary from TOML
+    Returns:
+        Validated configuration dictionary
+    Raises:
+        InvalidSFTConfigError: If validation fails
+        MissingAlgorithmError: If algorithm section is missing or invalid
+        MissingModelError: If model is not specified
+        MissingDatasetError: If dataset path is not specified
+        MissingComputeError: If compute section is missing required fields
+        UnsupportedAlgorithmError: If algorithm.type or algorithm.method is set
+            to a value other than the ones accepted for SFT
+    """
+    # Check for required top-level sections
+    # (a section that is present but empty is treated the same as missing)
+    if "algorithm" not in config or not config["algorithm"]:
+        raise MissingAlgorithmError(
+            detail="[algorithm] section is required for SFT configs"
+        )
+    if "job" not in config or not config["job"]:
+        raise InvalidSFTConfigError(
+            detail="[job] section is required for SFT configs"
+        )
+    # [job] is known to be present and non-empty at this point; the default
+    # passed to .get() is never used.
+    job = config.get("job", {})
+    if not job.get("model"):
+        raise MissingModelError(
+            detail="[job].model is required (e.g., 'Qwen/Qwen3-4B')"
+        )
+    # Check that at least one dataset source is specified
+    if not (job.get("data") or job.get("data_path")):
+        raise MissingDatasetError(
+            detail="[job].data or [job].data_path must be specified",
+            hint="Provide path to training JSONL file"
+        )
+    # Validate algorithm type, method, and variety
+    algorithm = config.get("algorithm", {})
+    # A missing type (None) is accepted; only an explicit value other than
+    # "offline" is rejected.
+    if algorithm.get("type") not in {"offline", None}:
+        raise UnsupportedAlgorithmError(
+            algorithm_type=algorithm.get("type", "unknown"),
+            expected="offline",
+            hint="SFT requires algorithm.type = 'offline'"
+        )
+    # method is optional: a missing or empty value skips this check entirely.
+    method = algorithm.get("method", "")
+    if method and method not in {"sft", "supervised_finetune"}:
+        raise UnsupportedAlgorithmError(
+            algorithm_type=method,
+            expected="sft or supervised_finetune",
+            hint="SFT requires algorithm.method = 'sft' or 'supervised_finetune'"
+        )
+    # Validate variety is present
+    # (only presence is checked here; the value itself is not compared against
+    # the examples listed in the message)
+    if not algorithm.get("variety"):
+        raise MissingAlgorithmError(
+            detail="[algorithm].variety is required (e.g., 'fft', 'lora', 'qlora')"
+        )
+    # Validate compute section
+    compute = config.get("compute", {})
+    if not compute:
+        raise MissingComputeError(
+            detail="[compute] section is required",
+            hint="Specify gpu_type, gpu_count, and nodes"
+        )
+    if not compute.get("gpu_type"):
+        raise MissingComputeError(
+            detail="[compute].gpu_type is required (e.g., 'H100', 'A100')"
+        )
+    # NOTE: this is a truthiness test, so gpu_count = 0 is reported as missing.
+    if not compute.get("gpu_count"):
+        raise MissingComputeError(
+            detail="[compute].gpu_count is required"
+        )
+    # Validate using Pydantic model
+    try:
+        validated = SFTConfig.from_mapping(config)
+        return validated.to_dict()
+    except ValidationError as exc:
+        # Flatten every Pydantic error into one "location: message" bullet so
+        # the user sees all schema problems in a single exception.
+        errors = []
+        for error in exc.errors():
+            loc = ".".join(str(x) for x in error["loc"])
+            msg = error["msg"]
+            errors.append(f"  • {loc}: {msg}")
+        raise InvalidSFTConfigError(
+            detail="Pydantic validation failed:\n" + "\n".join(errors)
+        ) from exc
+def validate_rl_config(config: MutableMapping[str, Any]) -> dict[str, Any]:
+    """Validate RL configuration from TOML.
+    Runs explicit presence checks on the raw mapping, validates the
+    judge/rubric sections via ``extract_and_validate_judge_rubric``, then hands
+    the mapping to ``RLConfig.from_mapping`` and returns ``to_dict()``.
+    Note: ``config`` is modified in place. When absent, a placeholder
+    ``services`` section and a default
+    ``compute.topology.reference_placement = "none"`` are inserted before the
+    Pydantic validation step.
+    Args:
+        config: Raw configuration dictionary from TOML
+    Returns:
+        Validated configuration dictionary
+    Raises:
+        InvalidRLConfigError: If validation fails
+        MissingAlgorithmError: If algorithm section is missing or invalid
+        MissingModelError: If model is not specified
+        MissingComputeError: If compute section is missing required fields
+        UnsupportedAlgorithmError: If algorithm.type or algorithm.method is set
+            to a value other than the ones accepted for RL
+    """
+    # Check for required top-level sections
+    if "algorithm" not in config or not config["algorithm"]:
+        raise MissingAlgorithmError(
+            detail="[algorithm] section is required for RL configs"
+        )
+    # Check for model OR policy (policy is the new format)
+    # NOTE(review): this tests key presence only. An empty [policy] table
+    # passes here and then skips both branches of the model/policy checks
+    # further down - confirm whether that is intended.
+    if "policy" not in config and "model" not in config:
+        raise MissingModelError(
+            detail="[policy] or [model] section is required for RL configs"
+        )
+    # Validate algorithm type, method, and variety
+    algorithm = config.get("algorithm", {})
+    # A missing type (None) is accepted; only an explicit value other than
+    # "online" is rejected.
+    if algorithm.get("type") not in {"online", None}:
+        raise UnsupportedAlgorithmError(
+            algorithm_type=algorithm.get("type", "unknown"),
+            expected="online",
+            hint="RL requires algorithm.type = 'online'"
+        )
+    # method is optional: a missing or empty value skips this check entirely.
+    # NOTE(review): "ppo" and "gspo" are accepted here, but the error below
+    # tells the user only "policy_gradient" is expected.
+    method = algorithm.get("method", "")
+    if method and method not in {"policy_gradient", "ppo", "gspo"}:
+        raise UnsupportedAlgorithmError(
+            algorithm_type=method,
+            expected="policy_gradient",
+            hint="RL requires algorithm.method = 'policy_gradient'"
+        )
+    # Validate variety is present
+    if not algorithm.get("variety"):
+        raise MissingAlgorithmError(
+            detail="[algorithm].variety is required (e.g., 'gspo', 'ppo')"
+        )
+    # Validate model/policy section
+    model = config.get("model", {})
+    policy = config.get("policy", {})
+    # Use policy if available, otherwise fall back to model
+    # (when a non-empty [policy] exists, [model] is not inspected at all)
+    if policy:
+        if not policy.get("model_name") and not policy.get("source"):
+            raise MissingModelError(
+                detail="[policy].model_name or [policy].source must be specified",
+                hint="Provide base model (e.g., 'Qwen/Qwen3-4B') or source checkpoint"
+            )
+        if not policy.get("trainer_mode"):
+            raise InvalidRLConfigError(
+                detail="[policy].trainer_mode is required (e.g., 'full', 'lora')"
+            )
+        if not policy.get("label"):
+            raise InvalidRLConfigError(
+                detail="[policy].label is required (e.g., 'my-rl-model')",
+                hint="Provide a descriptive label for this model"
+            )
+    elif model:
+        # Legacy layout: same three requirements, with "base" in place of
+        # "model_name".
+        if not model.get("base") and not model.get("source"):
+            raise MissingModelError(
+                detail="[model].base or [model].source must be specified",
+                hint="Provide base model (e.g., 'Qwen/Qwen3-4B') or source checkpoint"
+            )
+        if not model.get("trainer_mode"):
+            raise InvalidRLConfigError(
+                detail="[model].trainer_mode is required (e.g., 'full', 'lora')"
+            )
+        if not model.get("label"):
+            raise InvalidRLConfigError(
+                detail="[model].label is required (e.g., 'my-rl-model')",
+                hint="Provide a descriptive label for this model"
+            )
+    # Validate compute section
+    compute = config.get("compute", {})
+    if not compute:
+        raise MissingComputeError(
+            detail="[compute] section is required",
+            hint="Specify gpu_type and gpu_count"
+        )
+    if not compute.get("gpu_type"):
+        raise MissingComputeError(
+            detail="[compute].gpu_type is required (e.g., 'H100', 'A100')"
+        )
+    # NOTE: this is a truthiness test, so gpu_count = 0 is reported as missing.
+    if not compute.get("gpu_count"):
+        raise MissingComputeError(
+            detail="[compute].gpu_count is required"
+        )
+    # Check for rollout configuration
+    rollout = config.get("rollout", {})
+    if not rollout:
+        raise InvalidRLConfigError(
+            detail="[rollout] section is required for RL configs",
+            hint="Specify env_name, policy_name, max_turns, etc."
+        )
+    if not rollout.get("env_name"):
+        raise InvalidRLConfigError(
+            detail="[rollout].env_name is required (e.g., 'math', 'crafter')"
+        )
+    if not rollout.get("policy_name"):
+        raise InvalidRLConfigError(
+            detail="[rollout].policy_name is required"
+        )
+    # Validate topology section (can be top-level or under compute)
+    # A non-empty top-level [topology] wins; otherwise compute.topology is used.
+    topology = config.get("topology") or compute.get("topology", {})
+    if not topology:
+        raise InvalidRLConfigError(
+            detail="[topology] or [compute.topology] section is required",
+            hint="Specify gpus_for_vllm, gpus_for_training, etc."
+        )
+    # Check for training section and its required fields
+    # ([training] itself is optional; its fields are only enforced when the
+    # section is present and non-empty)
+    training = config.get("training", {})
+    if training:
+        required_training_fields = {
+            "num_epochs": "number of training epochs",
+            "iterations_per_epoch": "iterations per epoch",
+            "max_turns": "maximum turns",
+            "batch_size": "batch size",
+            "group_size": "group size",
+            "learning_rate": "learning rate",
+        }
+        # Key presence is what matters here, so falsy values such as 0 pass.
+        # The first missing field raises; later ones are not reported.
+        for field, description in required_training_fields.items():
+            if field not in training:
+                raise InvalidRLConfigError(
+                    detail=f"[training].{field} is required ({description})",
+                    hint=f"Add {field} to the [training] section"
+                )
+    # Check for evaluation section
+    # (optional, handled the same way as [training] above)
+    evaluation = config.get("evaluation", {})
+    if evaluation:
+        required_eval_fields = {
+            "instances": "number of evaluation instances",
+            "every_n_iters": "evaluation frequency",
+            "seeds": "evaluation seeds",
+        }
+        for field, description in required_eval_fields.items():
+            if field not in evaluation:
+                raise InvalidRLConfigError(
+                    detail=f"[evaluation].{field} is required ({description})",
+                    hint=f"Add {field} to the [evaluation] section"
+                )
+    # Inject services section if not present (will be populated at runtime)
+    # NOTE: from here on the caller's mapping is mutated in place.
+    if "services" not in config:
+        config["services"] = {
+            "task_url": "placeholder",  # Will be resolved at runtime
+        }
+    # Inject reference placement if not present (like builders.py does)
+    # Reference is now under compute.topology.reference_placement
+    # NOTE(review): the topology check above also accepts a top-level
+    # [topology], but the default is always written under compute.topology,
+    # creating that table if needed - confirm this is the intended location
+    # for configs that use the top-level form.
+    if "compute" not in config:
+        config["compute"] = {}
+    if "topology" not in config["compute"]:
+        config["compute"]["topology"] = {}
+    if "reference_placement" not in config["compute"]["topology"]:
+        config["compute"]["topology"]["reference_placement"] = "none"
+    # Validate judge/rubric configuration with formalized Pydantic models
+    # This will emit deprecation warnings for dead fields and validate structure
+    try:
+        # NOTE(review): both return values are assigned but not used again in
+        # this function; the call is made for its validation effect.
+        rubric_config, judge_config = extract_and_validate_judge_rubric(config)
+        # Validation passed - configs are clean and ready for use
+        # The validated Pydantic models can be used by training code if needed
+    except (InvalidJudgeConfigError, InvalidRubricConfigError) as exc:
+        # Re-raise under the RL error type so callers see one error family.
+        raise InvalidRLConfigError(
+            detail=f"Judge/Rubric validation failed: {exc.detail}",
+            hint="Check JUDGE_RUBRIC_CLEANUP_GUIDE.md for migration help."
+        ) from exc
+    # Validate using Pydantic model
+    try:
+        validated = RLConfig.from_mapping(config)
+        return validated.to_dict()
+    except ValidationError as exc:
+        # Flatten every Pydantic error into one "location: message" bullet so
+        # the user sees all schema problems in a single exception.
+        errors = []
+        for error in exc.errors():
+            loc = ".".join(str(x) for x in error["loc"])
+            msg = error["msg"]
+            errors.append(f"  • {loc}: {msg}")
+        raise InvalidRLConfigError(
+            detail="Pydantic validation failed:\n" + "\n".join(errors)
+        ) from exc
+def load_and_validate_sft(config_path: Path) -> dict[str, Any]:
+    """Load and validate an SFT TOML configuration file.
+    Reads the file with ``load_toml`` and passes the result to
+    ``validate_sft_config``.
+    Args:
+        config_path: Path to TOML configuration file
+    Returns:
+        Validated configuration dictionary
+    Raises:
+        TomlParseError: If TOML parsing fails (any exception raised by
+            ``load_toml`` is re-raised as this type)
+        InvalidSFTConfigError: If validation fails
+    Other errors raised by ``validate_sft_config`` propagate unchanged.
+    """
+    try:
+        raw_config = load_toml(config_path)
+    except Exception as exc:
+        # Deliberately broad: every loader failure is reported as a parse
+        # error, with the original exception kept as the cause.
+        # NOTE(review): presumably this also covers a missing or unreadable
+        # file, not only malformed TOML - confirm against load_toml.
+        raise TomlParseError(
+            path=str(config_path),
+            detail=str(exc)
+        ) from exc
+    # Validation runs outside the try block so its errors are not wrapped.
+    return validate_sft_config(raw_config)
+def load_and_validate_rl(config_path: Path) -> dict[str, Any]:
+    """Load and validate an RL TOML configuration file.
+    Reads the file with ``load_toml`` and passes the result to
+    ``validate_rl_config``.
+    Args:
+        config_path: Path to TOML configuration file
+    Returns:
+        Validated configuration dictionary
+    Raises:
+        TomlParseError: If TOML parsing fails (any exception raised by
+            ``load_toml`` is re-raised as this type)
+        InvalidRLConfigError: If validation fails
+    Other errors raised by ``validate_rl_config`` propagate unchanged.
+    """
+    try:
+        raw_config = load_toml(config_path)
+    except Exception as exc:
+        # Deliberately broad: every loader failure is reported as a parse
+        # error, with the original exception kept as the cause.
+        # NOTE(review): presumably this also covers a missing or unreadable
+        # file, not only malformed TOML - confirm against load_toml.
+        raise TomlParseError(
+            path=str(config_path),
+            detail=str(exc)
+        ) from exc
+    # Validation runs outside the try block so its errors are not wrapped.
+    return validate_rl_config(raw_config)

synth_ai/cli/demo.py CHANGED Viewed

@@ -1,165 +1,37 @@
-#!/usr/bin/env python3
-"""
-CLI: interactive launcher for example demos and RL demo helpers.
-- `synth-ai demo` (no subcommand) -> initialize RL demo files into ./synth_demo/
-- `synth-ai demo deploy|configure|run` -> invoke RL demo helpers directly.
-"""
-from __future__ import annotations
-import importlib
-import os
-import subprocess
+import shutil
 from pathlib import Path
-from typing import Any, cast
 import click
-from click.exceptions import Exit
-demo_commands = cast(
-    Any, importlib.import_module("synth_ai.demos.core.cli")
-)
-def _find_demo_scripts(root: Path) -> list[Path]:
-    if not root.exists():
-        return []
-    return sorted([p for p in root.rglob("run_demo.sh") if p.is_file()])
-def _run_demo_command(func, *args, **kwargs) -> None:
-    """Invoke a demo command and exit via Click on non-zero status codes."""
-    try:
-        result = func(*args, **kwargs)
-    except SystemExit as exc:  # pragma: no cover - defensive
-        raise Exit(exc.code or 1) from exc
-    if result is None:
-        return
-    try:
-        code = int(result)
-    except (TypeError, ValueError):
-        return
-    if code != 0:
-        raise Exit(code)
-def register(cli):
-    @cli.group("demo", invoke_without_command=True)
-    @click.option(
-        "--force", is_flag=True, help="Overwrite existing files in CWD when initializing demo"
-    )
-    @click.option("--list", "list_only", is_flag=True, help="List available legacy demos and exit")
-    @click.option("-f", "filter_term", default="", help="Filter legacy demos by substring")
-    @click.pass_context
-    def demo(ctx: click.Context, force: bool, list_only: bool, filter_term: str):
-        """Demo helpers.
-        - Default (no subcommand): initialize RL demo files into ./synth_demo/ (alias of rl_demo init)
-        - Legacy mode: with --list, find and run examples/*/run_demo.sh
-        - New RL demo subcommands: deploy, configure, run
-        """
-        if ctx.invoked_subcommand is not None:
-            return
-        # If explicitly asked to list legacy demos, show interactive picker
-        if list_only:
-            repo_root = Path(os.getcwd())
-            examples_dir = repo_root / "examples"
-            demos = _find_demo_scripts(examples_dir)
-            if filter_term:
-                demos = [p for p in demos if filter_term.lower() in str(p).lower()]
+# Maps each --runtime choice to the name of the demo directory that demo_cmd
+# copies from the package's "demos" folder.
+DEMO_SOURCES: dict[str, str] = {
+    "local": "crafter",
+    "modal": "math"
+}
-            if not demos:
-                click.echo("No run_demo.sh scripts found under examples/.")
-                return
-            click.echo("Available demos:")
-            for idx, p in enumerate(demos, start=1):
-                click.echo(f" {idx}. {p.relative_to(repo_root)}")
-            click.echo("")
-            def _validate_choice(val: str) -> int:
-                try:
-                    i = int(val)
-                except Exception as err:
-                    raise click.BadParameter("Enter a number from the list") from err
-                if i < 1 or i > len(demos):
-                    raise click.BadParameter(f"Choose a number between 1 and {len(demos)}")
-                return i
-            choice = click.prompt("Select a demo to run", value_proc=_validate_choice)
-            script = demos[choice - 1]
-            click.echo("")
-            click.echo(f"🚀 Running {script.relative_to(repo_root)}\n")
-            try:
-                subprocess.run(["bash", str(script)], check=True)
-            except subprocess.CalledProcessError as e:
-                click.echo(f"❌ Demo exited with non-zero status: {e.returncode}")
-            except KeyboardInterrupt:
-                click.echo("\n🛑 Demo interrupted by user")
-            return
-        # Default: initialize RL demo files via new command
-        _run_demo_command(demo_commands.init, force=force)
-    # (prepare command removed; configure now prepares baseline TOML)
-    # Help pyright understand dynamic Click group attributes
-    _dg = cast(Any, demo)
-    @_dg.command("deploy")
-    @click.option("--local", is_flag=True, help="Run local FastAPI instead of Modal deploy")
-    @click.option(
-        "--app",
-        type=click.Path(),
-        default=None,
-        help="Path to Modal app.py for uv run modal deploy",
-    )
-    @click.option("--name", type=str, default="synth-math-demo", help="Modal app name")
-    @click.option(
-        "--script",
-        type=click.Path(),
-        default=None,
-        help="Path to deploy_task_app.sh (optional legacy)",
-    )
-    def demo_deploy(local: bool, app: str | None, name: str, script: str | None):
-        _run_demo_command(
-            demo_commands.deploy,
-            local=local,
-            app=app,
-            name=name,
-            script=script,
-        )
-    @_dg.command("configure")
-    def demo_configure():
-        _run_demo_command(demo_commands.run)
-    @_dg.command("setup")
-    def demo_setup():
-        _run_demo_command(demo_commands.setup)
-    @_dg.command("run")
-    @click.option("--batch-size", type=int, default=None)
-    @click.option("--group-size", type=int, default=None)
-    @click.option("--model", type=str, default=None)
-    @click.option("--timeout", type=int, default=600)
-    def demo_run(batch_size: int | None, group_size: int | None, model: str | None, timeout: int):
-        _run_demo_command(
-            demo_commands.run,
-            batch_size=batch_size,
-            group_size=group_size,
-            model=model,
-            timeout=timeout,
-        )
-    @cli.command("setup")
-    def setup_alias():
-        """Perform SDK handshake and write keys to .env."""
-        _run_demo_command(demo_commands.setup)
+@click.command()
+@click.option(
+    "--runtime",
+    "runtime",
+    type=click.Choice(tuple(DEMO_SOURCES.keys()), case_sensitive=False),
+    default="local",
+    show_default=True,
+    help="Select runtime to load a demo task app to your cwd. Options: local, modal"
+)
+def demo_cmd(runtime: str) -> None:
+      # Copies the demo directory for the selected runtime into the current
+      # working directory; raises click.ClickException if the source is
+      # missing or the destination already exists.
+      # The option is declared case-insensitive, so lower-case the value
+      # before using it as a DEMO_SOURCES key (the keys are lower-case).
+      runtime_key = runtime.lower()
+      demo_name = DEMO_SOURCES[runtime_key]
+      # parents[1] is two directory levels above this file; demos are looked
+      # up in the "demos" folder under that directory.
+      package_root = Path(__file__).resolve().parents[1]
+      src = package_root / "demos" / demo_name
+      if not src.exists():
+          raise click.ClickException(f"Demo source directory not found: {src}")
+      # The copy lands in the cwd under the same directory name as the source.
+      dst = Path.cwd() / src.name
+      # Refuse to touch an existing destination rather than merge or overwrite.
+      if dst.exists():
+          raise click.ClickException(
+              f"Destination already exists: {dst}. Remove it first if you want to re-copy."
+          )
+      shutil.copytree(src, dst)
+      click.echo(f"Copied {demo_name} demo to {dst}")

synth_ai/cli/deploy/__init__.py ADDED Viewed

@@ -0,0 +1,43 @@
+"""Deploy command package - imports from deploy.py module."""
+from __future__ import annotations
+# Import from the deploy.py module file (using importlib to avoid conflicts)
+# This package exists for backwards compatibility
+import importlib
+import importlib.util
+import sys
+from pathlib import Path
+from typing import TYPE_CHECKING
+if TYPE_CHECKING:
+    from click import Command
+try:
+    # Import the deploy.py module directly by file path to avoid package/module conflict
+    # (deploy.py is looked up in the directory that contains this package's directory)
+    deploy_module_path = Path(__file__).parent.parent / "deploy.py"
+    if deploy_module_path.exists():
+        spec = importlib.util.spec_from_file_location("synth_ai.cli.deploy_module", deploy_module_path)
+        if spec and spec.loader:
+            deploy_module = importlib.util.module_from_spec(spec)
+            # Registered in sys.modules under the alias name before the module body runs.
+            sys.modules["synth_ai.cli.deploy_module"] = deploy_module
+            spec.loader.exec_module(deploy_module)
+            # getattr defaults to None, so a deploy.py without deploy_cmd does not raise here.
+            command: Command | None = getattr(deploy_module, "deploy_cmd", None)  # type: ignore[assignment]
+            deploy_cmd: Command | None = command  # type: ignore[assignment]
+        else:
+            raise ImportError("Could not load deploy.py")
+    else:
+        raise ImportError("deploy.py not found")
+    get_command: None = None  # Not used in current implementation
+    __all__: list[str] = [
+        "command",
+        "deploy_cmd",
+    ]
+except Exception:
+    # If deploy.py doesn't exist or fails to import, provide a stub
+    # NOTE: this also catches the ImportError raised above and any Exception raised
+    # while executing deploy.py; the failure is not logged or re-raised.
+    command: Command | None = None  # type: ignore[assignment]
+    deploy_cmd: Command | None = None  # type: ignore[assignment]
+    get_command: None = None
+    __all__: list[str] = []

synth-ai 0.2.16__py3-none-any.whl → 0.2.19__py3-none-any.whl

Potentially problematic release.

synth-ai 0.2.16__py3-none-any.whl → 0.2.19__py3-none-any.whl