PyPI - synth-ai - Versions diffs - 0.2.9.dev7__py3-none-any.whl → 0.2.10__py3-none-any.whl - Mend

synth-ai 0.2.9.dev7-py3-none-any.whl → 0.2.10-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of synth-ai might be problematic. Click here for more details.

Files changed (323)

examples/__init__.py +16 -0
examples/crafter_debug_render.py +8 -11
examples/dev/qwen3_32b_qlora_4xh100.toml +40 -0
examples/multi_step/crafter_rl_lora.md +29 -0
examples/qwen_coder/README.md +102 -0
examples/qwen_coder/_shared.py +113 -0
examples/qwen_coder/configs/coder_lora_30b.toml +61 -0
examples/qwen_coder/configs/coder_lora_4b.toml +57 -0
examples/qwen_coder/configs/coder_lora_small.toml +58 -0
examples/qwen_coder/generate_dataset.py +98 -0
examples/qwen_coder/infer_ft_smoke.py +65 -0
examples/qwen_coder/infer_prod_proxy.py +73 -0
examples/qwen_coder/infer_via_synth.py +87 -0
examples/qwen_coder/scripts/infer_coder.sh +19 -0
examples/qwen_coder/scripts/train_coder_30b.sh +22 -0
examples/qwen_coder/sft_full_17b.py +103 -0
examples/qwen_coder/sft_lora_30b.py +110 -0
examples/qwen_coder/subset_jsonl.py +39 -0
examples/qwen_coder/todos.md +38 -0
examples/qwen_coder/validate_jsonl.py +60 -0
examples/rl/run_eval.py +36 -37
examples/rl/run_rl_and_save.py +5 -5
examples/rl/task_app/math_single_step.py +65 -43
examples/rl/task_app/math_task_app.py +3 -3
examples/sft/README.md +139 -0
examples/sft/configs/crafter_fft_qwen0p6b.toml +44 -0
examples/sft/configs/crafter_lora_qwen0p6b.toml +45 -0
examples/sft/evaluate.py +117 -0
examples/sft/export_dataset.py +117 -0
examples/sft/generate_traces.py +162 -0
examples/swe/__init__.py +12 -0
examples/swe/task_app/README.md +105 -0
examples/swe/task_app/__init__.py +2 -0
examples/swe/task_app/grpo_swe_mini.py +571 -0
examples/swe/task_app/grpo_swe_mini_task_app.py +136 -0
examples/swe/task_app/hosted/README.md +173 -0
examples/swe/task_app/hosted/__init__.py +5 -0
examples/swe/task_app/hosted/branching.py +143 -0
examples/swe/task_app/hosted/environment_routes.py +1289 -0
examples/swe/task_app/hosted/envs/__init__.py +1 -0
examples/swe/task_app/hosted/envs/crafter/__init__.py +6 -0
examples/swe/task_app/hosted/envs/crafter/app.py +1 -0
examples/swe/task_app/hosted/envs/crafter/environment.py +522 -0
examples/swe/task_app/hosted/envs/crafter/policy.py +478 -0
examples/swe/task_app/hosted/envs/crafter/react_agent.py +108 -0
examples/swe/task_app/hosted/envs/crafter/shared.py +305 -0
examples/swe/task_app/hosted/envs/crafter/tools.py +47 -0
examples/swe/task_app/hosted/envs/mini_swe/__init__.py +8 -0
examples/swe/task_app/hosted/envs/mini_swe/environment.py +1164 -0
examples/swe/task_app/hosted/envs/mini_swe/policy.py +355 -0
examples/swe/task_app/hosted/envs/mini_swe/shared.py +83 -0
examples/swe/task_app/hosted/envs/mini_swe/tools.py +96 -0
examples/swe/task_app/hosted/hosted_app.py +204 -0
examples/swe/task_app/hosted/inference/__init__.py +5 -0
examples/swe/task_app/hosted/inference/openai_client.py +618 -0
examples/swe/task_app/hosted/main.py +100 -0
examples/swe/task_app/hosted/policy_routes.py +1079 -0
examples/swe/task_app/hosted/registry.py +195 -0
examples/swe/task_app/hosted/rollout.py +1869 -0
examples/swe/task_app/hosted/storage/__init__.py +5 -0
examples/swe/task_app/hosted/storage/volume.py +211 -0
examples/swe/task_app/hosted/test_agents.py +161 -0
examples/swe/task_app/hosted/test_service.py +137 -0
examples/swe/task_app/hosted/utils.py +62 -0
examples/vlm/PROPOSAL.md +53 -0
examples/vlm/README.md +68 -0
examples/vlm/configs/crafter_vlm_gpt4o.toml +44 -0
examples/vlm/crafter_image_only_agent.py +207 -0
examples/vlm/crafter_openai_vlm_agent.py +277 -0
examples/vlm/filter_image_rows.py +63 -0
examples/vlm/run_crafter_vlm_benchmark.py +316 -0
examples/warming_up_to_rl/analyze_trace_db.py +5 -5
examples/warming_up_to_rl/configs/rl_from_base_qwen4b.toml +11 -1
examples/warming_up_to_rl/export_trace_sft.py +78 -21
examples/warming_up_to_rl/groq_test.py +4 -4
examples/warming_up_to_rl/manage_secrets.py +13 -18
examples/warming_up_to_rl/run_eval.py +42 -44
examples/warming_up_to_rl/run_fft_and_save.py +11 -16
examples/warming_up_to_rl/run_local_rollout.py +1 -3
examples/warming_up_to_rl/run_local_rollout_modal.py +2 -4
examples/warming_up_to_rl/run_local_rollout_parallel.py +1 -4
examples/warming_up_to_rl/run_local_rollout_traced.py +3 -5
examples/warming_up_to_rl/run_rl_and_save.py +5 -6
examples/warming_up_to_rl/run_rollout_remote.py +8 -10
examples/warming_up_to_rl/task_app/README.md +6 -2
examples/warming_up_to_rl/task_app/grpo_crafter.py +234 -35
examples/warming_up_to_rl/task_app/grpo_crafter_task_app.py +2 -3
examples/warming_up_to_rl/task_app/synth_envs_hosted/__init__.py +1 -1
examples/warming_up_to_rl/task_app/synth_envs_hosted/branching.py +9 -11
examples/warming_up_to_rl/task_app/synth_envs_hosted/environment_routes.py +131 -114
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/environment.py +101 -41
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/policy.py +73 -51
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/react_agent.py +14 -6
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/shared.py +16 -16
examples/warming_up_to_rl/task_app/synth_envs_hosted/hosted_app.py +32 -34
examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/openai_client.py +94 -31
examples/warming_up_to_rl/task_app/synth_envs_hosted/main.py +0 -2
examples/warming_up_to_rl/task_app/synth_envs_hosted/policy_routes.py +303 -203
examples/warming_up_to_rl/task_app/synth_envs_hosted/registry.py +21 -23
examples/warming_up_to_rl/task_app/synth_envs_hosted/rollout.py +328 -225
examples/warming_up_to_rl/task_app/synth_envs_hosted/storage/volume.py +13 -13
examples/warming_up_to_rl/task_app/synth_envs_hosted/test_agents.py +1 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/test_service.py +1 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/utils.py +4 -3
synth_ai/api/models/supported.py +376 -0
synth_ai/api/train/builders.py +128 -21
synth_ai/api/train/cli.py +80 -64
synth_ai/api/train/config_finder.py +7 -2
synth_ai/api/train/env_resolver.py +1 -1
synth_ai/api/train/pollers.py +2 -1
synth_ai/api/train/supported_algos.py +139 -0
synth_ai/api/train/task_app.py +1 -2
synth_ai/api/train/utils.py +13 -44
synth_ai/cli/__init__.py +8 -0
synth_ai/cli/_modal_wrapper.py +28 -0
synth_ai/cli/_typer_patch.py +49 -0
synth_ai/cli/balance.py +1 -2
synth_ai/cli/calc.py +1 -1
synth_ai/cli/demo.py +2 -1
synth_ai/cli/recent.py +2 -2
synth_ai/cli/rl_demo.py +2 -1
synth_ai/cli/root.py +11 -13
synth_ai/cli/status.py +2 -2
synth_ai/cli/task_apps.py +529 -179
synth_ai/cli/traces.py +6 -4
synth_ai/cli/watch.py +12 -18
synth_ai/demo_registry.py +1 -1
synth_ai/demos/core/cli.py +36 -43
synth_ai/demos/demo_task_apps/__init__.py +3 -3
synth_ai/demos/demo_task_apps/core.py +17 -25
synth_ai/demos/demo_task_apps/crafter/grpo_crafter_task_app.py +3 -4
synth_ai/demos/demo_task_apps/math/app.py +2 -1
synth_ai/demos/demo_task_apps/math/deploy_modal.py +3 -4
synth_ai/demos/demo_task_apps/math/modal_task_app.py +16 -18
synth_ai/demos/demo_task_apps/math/task_app_entry.py +0 -1
synth_ai/environments/examples/crafter_classic/environment.py +76 -1
synth_ai/environments/reproducibility/tree.py +2 -5
synth_ai/environments/service/app.py +11 -12
synth_ai/environments/service/core_routes.py +4 -7
synth_ai/environments/stateful/engine.py +1 -1
synth_ai/environments/tasks/core.py +1 -0
synth_ai/environments/tasks/filters.py +5 -6
synth_ai/environments/tasks/utils.py +4 -5
synth_ai/handshake.py +9 -9
synth_ai/http.py +1 -1
synth_ai/http_client.py +18 -10
synth_ai/inference/client.py +15 -5
synth_ai/jobs/client.py +78 -83
synth_ai/learning/__init__.py +41 -6
synth_ai/learning/algorithms.py +14 -0
synth_ai/learning/client.py +91 -24
synth_ai/learning/config.py +2 -38
synth_ai/learning/ft_client.py +4 -59
synth_ai/learning/health.py +5 -6
synth_ai/learning/jobs.py +31 -47
synth_ai/{rl → learning/rl}/__init__.py +14 -4
synth_ai/learning/rl/client.py +267 -0
synth_ai/learning/rl/config.py +31 -0
synth_ai/{rl → learning/rl}/contracts.py +5 -8
synth_ai/{rl → learning/rl}/env_keys.py +39 -15
synth_ai/learning/rl/secrets.py +13 -0
synth_ai/learning/rl_client.py +2 -281
synth_ai/learning/sft/__init__.py +29 -0
synth_ai/learning/sft/client.py +68 -0
synth_ai/learning/sft/config.py +270 -0
synth_ai/learning/sft/data.py +295 -0
synth_ai/learning/sse.py +25 -24
synth_ai/learning/validators.py +25 -28
synth_ai/lm/__init__.py +21 -47
synth_ai/task/__init__.py +25 -27
synth_ai/task/apps/__init__.py +7 -8
synth_ai/task/auth.py +8 -8
synth_ai/task/client.py +14 -14
synth_ai/task/contracts.py +36 -35
synth_ai/task/datasets.py +6 -5
synth_ai/task/errors.py +10 -10
synth_ai/task/health.py +17 -9
synth_ai/task/json.py +58 -23
synth_ai/task/proxy.py +13 -9
synth_ai/task/rubrics.py +16 -15
synth_ai/task/server.py +12 -12
synth_ai/task/tracing_utils.py +4 -4
synth_ai/task/vendors.py +5 -6
synth_ai/tracing_v3/__init__.py +2 -0
synth_ai/tracing_v3/abstractions.py +21 -4
synth_ai/tracing_v3/decorators.py +18 -16
synth_ai/tracing_v3/hooks.py +5 -5
synth_ai/tracing_v3/llm_call_record_helpers.py +6 -6
synth_ai/tracing_v3/session_tracer.py +40 -14
synth_ai/tracing_v3/storage/base.py +85 -0
synth_ai/tracing_v3/storage/config.py +21 -8
synth_ai/tracing_v3/storage/factory.py +10 -7
synth_ai/tracing_v3/storage/utils.py +4 -2
synth_ai/tracing_v3/turso/daemon.py +7 -2
synth_ai/tracing_v3/turso/models.py +2 -2
synth_ai/tracing_v3/turso/native_manager.py +1173 -0
synth_ai/tracing_v3/utils.py +4 -4
synth_ai/v0/api/__init__.py +8 -0
synth_ai/v0/api/models/__init__.py +8 -0
synth_ai/v0/api/models/supported.py +8 -0
synth_ai/v0/config/__init__.py +15 -0
synth_ai/v0/config/base_url.py +12 -0
synth_ai/v0/lm/__init__.py +51 -0
synth_ai/{lm → v0/lm}/caching/ephemeral.py +2 -2
synth_ai/{lm → v0/lm}/caching/handler.py +4 -4
synth_ai/{lm → v0/lm}/caching/initialize.py +1 -1
synth_ai/{lm → v0/lm}/caching/persistent.py +1 -1
synth_ai/{lm → v0/lm}/config.py +6 -1
synth_ai/{lm → v0/lm}/core/all.py +9 -9
synth_ai/{lm → v0/lm}/core/main.py +6 -6
synth_ai/{lm → v0/lm}/core/main_v3.py +10 -10
synth_ai/{lm → v0/lm}/core/synth_models.py +2 -14
synth_ai/{lm → v0/lm}/core/vendor_clients.py +2 -2
synth_ai/{lm → v0/lm}/overrides.py +2 -2
synth_ai/{lm → v0/lm}/provider_support/anthropic.py +4 -4
synth_ai/{lm → v0/lm}/provider_support/openai.py +5 -5
synth_ai/{lm → v0/lm}/structured_outputs/handler.py +5 -5
synth_ai/{lm → v0/lm}/structured_outputs/rehabilitate.py +1 -1
synth_ai/{lm → v0/lm}/vendors/core/anthropic_api.py +9 -9
synth_ai/{lm → v0/lm}/vendors/core/gemini_api.py +5 -5
synth_ai/{lm → v0/lm}/vendors/core/mistral_api.py +5 -5
synth_ai/{lm → v0/lm}/vendors/core/openai_api.py +10 -10
synth_ai/{lm → v0/lm}/vendors/openai_standard.py +8 -8
synth_ai/{lm → v0/lm}/vendors/openai_standard_responses.py +2 -2
synth_ai/{lm → v0/lm}/vendors/supported/custom_endpoint.py +3 -3
synth_ai/{lm → v0/lm}/vendors/supported/deepseek.py +2 -2
synth_ai/{lm → v0/lm}/vendors/supported/grok.py +2 -2
synth_ai/{lm → v0/lm}/vendors/supported/groq.py +1 -1
synth_ai/{lm → v0/lm}/vendors/supported/ollama.py +1 -1
synth_ai/{lm → v0/lm}/vendors/supported/openrouter.py +3 -3
synth_ai/{lm → v0/lm}/vendors/supported/together.py +1 -1
synth_ai/{lm → v0/lm}/vendors/synth_client.py +1 -1
synth_ai/v0/tracing_v3/__init__.py +10 -0
synth_ai/v0/tracing_v3/abstractions.py +3 -0
synth_ai/v0/tracing_v3/decorators.py +3 -0
synth_ai/v0/tracing_v3/llm_call_record_helpers.py +3 -0
synth_ai/v0/tracing_v3/session_tracer.py +3 -0
{synth_ai-0.2.9.dev7.dist-info → synth_ai-0.2.10.dist-info}/METADATA +10 -7
{synth_ai-0.2.9.dev7.dist-info → synth_ai-0.2.10.dist-info}/RECORD +269 -233
examples/common_old/backend.py +0 -20
examples/evals_old/README.md +0 -98
examples/evals_old/__init__.py +0 -6
examples/evals_old/compare_models.py +0 -1038
examples/evals_old/example_log.md +0 -145
examples/evals_old/run_demo.sh +0 -126
examples/evals_old/trace_analysis.py +0 -270
examples/finetuning_old/_backup_synth_qwen/config.toml +0 -29
examples/finetuning_old/_backup_synth_qwen/example_log.md +0 -324
examples/finetuning_old/_backup_synth_qwen/filter_traces.py +0 -60
examples/finetuning_old/_backup_synth_qwen/filter_traces_achievements.py +0 -243
examples/finetuning_old/_backup_synth_qwen/purge_v3_traces.py +0 -109
examples/finetuning_old/_backup_synth_qwen/react_agent_lm.py +0 -1924
examples/finetuning_old/_backup_synth_qwen/readme.md +0 -49
examples/finetuning_old/_backup_synth_qwen/run_crafter_qwen4b.py +0 -114
examples/finetuning_old/_backup_synth_qwen/run_demo.sh +0 -195
examples/finetuning_old/_backup_synth_qwen/sft_kickoff.py +0 -119
examples/finetuning_old/synth_qwen_v1/README.md +0 -68
examples/finetuning_old/synth_qwen_v1/filter_traces.py +0 -60
examples/finetuning_old/synth_qwen_v1/filter_traces_achievements.py +0 -243
examples/finetuning_old/synth_qwen_v1/finetune.py +0 -46
examples/finetuning_old/synth_qwen_v1/hello_ft_model.py +0 -71
examples/finetuning_old/synth_qwen_v1/infer.py +0 -36
examples/finetuning_old/synth_qwen_v1/poll.py +0 -46
examples/finetuning_old/synth_qwen_v1/prepare_data.py +0 -35
examples/finetuning_old/synth_qwen_v1/purge_v3_traces.py +0 -109
examples/finetuning_old/synth_qwen_v1/react_agent_lm.py +0 -1933
examples/finetuning_old/synth_qwen_v1/run_crafter_sft_job.py +0 -210
examples/finetuning_old/synth_qwen_v1/run_ft_job.py +0 -237
examples/finetuning_old/synth_qwen_v1/upload_data.py +0 -34
examples/finetuning_old/synth_qwen_v1/util.py +0 -152
examples/rl_old/task_app.py +0 -1131
synth_ai/experimental/synth_oss.py +0 -445
synth_ai/learning/filtering.py +0 -0
synth_ai/learning/offline/dpo.py +0 -0
synth_ai/learning/offline/providers.py +0 -7
synth_ai/learning/offline/sft.py +0 -0
synth_ai/learning/offline/shared.py +0 -0
synth_ai/learning/online/grpo.py +0 -0
synth_ai/learning/online/irft.py +0 -0
synth_ai/learning/prompts/banking77_injection_eval.py +0 -168
synth_ai/learning/prompts/gepa.py +0 -0
synth_ai/learning/prompts/hello_world_in_context_injection_ex.py +0 -211
synth_ai/learning/prompts/mipro.py +0 -289
synth_ai/learning/prompts/random_search.py +0 -249
synth_ai/learning/prompts/run_mipro_banking77.py +0 -172
synth_ai/learning/prompts/run_random_search_banking77.py +0 -329
synth_ai/rl/secrets.py +0 -19
synth_ai/scripts/verify_rewards.py +0 -100
synth_ai/tracing/__init__.py +0 -30
synth_ai/tracing_v1/__init__.py +0 -33
synth_ai/tracing_v3/turso/__init__.py +0 -25
synth_ai/tracing_v3/turso/manager.py +0 -838
synth_ai/zyk/__init__.py +0 -30
/synth_ai/{lm → v0/lm}/caching/__init__.py +0 -0
/synth_ai/{lm → v0/lm}/caching/constants.py +0 -0
/synth_ai/{lm → v0/lm}/caching/dbs.py +0 -0
/synth_ai/{lm → v0/lm}/constants.py +0 -0
/synth_ai/{lm → v0/lm}/core/__init__.py +0 -0
/synth_ai/{lm → v0/lm}/core/exceptions.py +0 -0
/synth_ai/{lm → v0/lm}/cost/__init__.py +0 -0
/synth_ai/{lm → v0/lm}/cost/monitor.py +0 -0
/synth_ai/{lm → v0/lm}/cost/statefulness.py +0 -0
/synth_ai/{lm → v0/lm}/injection.py +0 -0
/synth_ai/{lm → v0/lm}/provider_support/__init__.py +0 -0
/synth_ai/{lm → v0/lm}/provider_support/suppress_logging.py +0 -0
/synth_ai/{lm → v0/lm}/structured_outputs/__init__.py +0 -0
/synth_ai/{lm → v0/lm}/structured_outputs/inject.py +0 -0
/synth_ai/{lm → v0/lm}/tools/__init__.py +0 -0
/synth_ai/{lm → v0/lm}/tools/base.py +0 -0
/synth_ai/{lm → v0/lm}/unified_interface.py +0 -0
/synth_ai/{lm → v0/lm}/vendors/__init__.py +0 -0
/synth_ai/{lm → v0/lm}/vendors/base.py +0 -0
/synth_ai/{lm → v0/lm}/vendors/core/__init__.py +0 -0
/synth_ai/{lm → v0/lm}/vendors/core/synth_dev_api.py +0 -0
/synth_ai/{lm → v0/lm}/vendors/local/__init__.py +0 -0
/synth_ai/{lm → v0/lm}/vendors/local/ollama.py +0 -0
/synth_ai/{lm → v0/lm}/vendors/retries.py +0 -0
/synth_ai/{lm → v0/lm}/vendors/supported/__init__.py +0 -0
/synth_ai/{lm → v0/lm}/warmup.py +0 -0
{synth_ai-0.2.9.dev7.dist-info → synth_ai-0.2.10.dist-info}/WHEEL +0 -0
{synth_ai-0.2.9.dev7.dist-info → synth_ai-0.2.10.dist-info}/entry_points.txt +0 -0
{synth_ai-0.2.9.dev7.dist-info → synth_ai-0.2.10.dist-info}/licenses/LICENSE +0 -0
{synth_ai-0.2.9.dev7.dist-info → synth_ai-0.2.10.dist-info}/top_level.txt +0 -0

synth_ai/api/train/builders.py CHANGED Viewed

@@ -5,8 +5,19 @@ from pathlib import Path
 from typing import Any
 import click
+from synth_ai.api.models.supported import (
+    UnsupportedModelError,
+    ensure_allowed_model,
+    normalize_model_identifier,
+)
+from synth_ai.learning.sft.config import prepare_sft_job_payload
-from .utils import ensure_api_base, load_toml, TrainError
+from .supported_algos import (
+    AlgorithmValidationError,
+    ensure_model_supported_for_algorithm,
+    validate_algorithm_config,
+)
+from .utils import TrainError, ensure_api_base, load_toml
 @dataclass(slots=True)
@@ -29,29 +40,78 @@ def build_rl_payload(
     task_url: str,
     overrides: dict[str, Any],
     idempotency: str | None,
+    allow_experimental: bool | None = None,
 ) -> RLBuildResult:
     data = load_toml(config_path)
+    try:
+        spec = validate_algorithm_config(data.get("algorithm"), expected_family="rl")
+    except AlgorithmValidationError as exc:
+        raise click.ClickException(str(exc)) from exc
     services = data.get("services") if isinstance(data.get("services"), dict) else {}
     model_cfg = data.get("model") if isinstance(data.get("model"), dict) else {}
     final_task_url = (
-        overrides.get("task_url") or task_url or services.get("task_url") or ""
+        overrides.get("task_url")
+        or task_url
+        or (services.get("task_url") if isinstance(services, dict) else None)
+        or ""
     ).strip()
     if not final_task_url:
         raise click.ClickException(
             "Task app URL required (provide --task-url or set services.task_url in TOML)"
         )
-    model_source = (model_cfg.get("source") or "").strip()
-    model_base = (model_cfg.get("base") or "").strip()
+    raw_source = model_cfg.get("source") if isinstance(model_cfg, dict) else ""
+    model_source = str(raw_source or "").strip()
+    raw_base = model_cfg.get("base") if isinstance(model_cfg, dict) else ""
+    model_base = str(raw_base or "").strip()
     override_model = (overrides.get("model") or "").strip()
     if override_model:
         model_source = override_model
         model_base = ""
     if bool(model_source) == bool(model_base):
+        details = (
+            f"Config: {config_path}\n"
+            f"[model].source={model_source!r} | [model].base={model_base!r}"
+        )
+        hint = (
+            "Set exactly one: [model].base for a base model (e.g. 'Qwen/Qwen3-1.7B') "
+            "or [model].source for a fine-tuned model id. Also remove any conflicting "
+            "'[policy].model' entries."
+        )
         raise click.ClickException(
-            "Model section must specify exactly one of [model].source or [model].base"
+            "Invalid model config: exactly one of [model].source or [model].base is required.\n"
+            + details
+            + "\nHint: "
+            + hint
+        )
+    try:
+        if model_source:
+            model_source = normalize_model_identifier(model_source)
+        if model_base:
+            model_base = normalize_model_identifier(model_base, allow_finetuned_prefixes=False)
+    except UnsupportedModelError as exc:
+        raise click.ClickException(str(exc)) from exc
+    base_model_for_training: str | None = None
+    if model_source:
+        base_model_for_training = ensure_allowed_model(
+            model_source,
+            allow_finetuned_prefixes=True,
+            allow_experimental=allow_experimental,
+        )
+    elif model_base:
+        base_model_for_training = ensure_allowed_model(
+            model_base,
+            allow_finetuned_prefixes=False,
+            allow_experimental=allow_experimental,
         )
+    if base_model_for_training:
+        try:
+            ensure_model_supported_for_algorithm(base_model_for_training, spec)
+        except AlgorithmValidationError as exc:
+            raise click.ClickException(str(exc)) from exc
     # Force TOML services.task_url to the effective endpoint to avoid split URLs
     try:
@@ -87,15 +147,24 @@ def build_sft_payload(
     *,
     config_path: Path,
     dataset_override: Path | None,
+    allow_experimental: bool | None,
 ) -> SFTBuildResult:
     data = load_toml(config_path)
+    try:
+        spec = validate_algorithm_config(data.get("algorithm"), expected_family="sft")
+    except AlgorithmValidationError as exc:
+        raise TrainError(str(exc)) from exc
     job_cfg = data.get("job") if isinstance(data.get("job"), dict) else {}
     data_cfg = data.get("data") if isinstance(data.get("data"), dict) else {}
     hp_cfg = data.get("hyperparameters") if isinstance(data.get("hyperparameters"), dict) else {}
     train_cfg = data.get("training") if isinstance(data.get("training"), dict) else {}
     compute_cfg = data.get("compute") if isinstance(data.get("compute"), dict) else {}
-    raw_dataset = dataset_override or job_cfg.get("data") or job_cfg.get("data_path")
+    raw_dataset = (
+        dataset_override
+        or (job_cfg.get("data") if isinstance(job_cfg, dict) else None)
+        or (job_cfg.get("data_path") if isinstance(job_cfg, dict) else None)
+    )
     if not raw_dataset:
         raise TrainError("Dataset not specified; pass --dataset or set [job].data")
     dataset_path = Path(raw_dataset)
@@ -108,7 +177,9 @@ def build_sft_payload(
     validation_path = (
         data_cfg.get("validation_path")
-        if isinstance(data_cfg.get("validation_path"), str)
+        if isinstance(data_cfg, dict)
+        else None
+        if isinstance(data_cfg, dict) and isinstance(data_cfg.get("validation_path"), str)
         else None
     )
     validation_file = None
@@ -122,7 +193,7 @@ def build_sft_payload(
             validation_file = vpath
     hp_block: dict[str, Any] = {
-        "n_epochs": int(hp_cfg.get("n_epochs", 1)),
+        "n_epochs": int(hp_cfg.get("n_epochs", 1) if isinstance(hp_cfg, dict) else 1),
     }
     for key in (
         "batch_size",
@@ -134,27 +205,35 @@ def build_sft_payload(
         "warmup_ratio",
         "train_kind",
     ):
-        if key in hp_cfg:
+        if isinstance(hp_cfg, dict) and key in hp_cfg:
             hp_block[key] = hp_cfg[key]
-    if isinstance(hp_cfg.get("parallelism"), dict):
+    if isinstance(hp_cfg, dict) and isinstance(hp_cfg.get("parallelism"), dict):
         hp_block["parallelism"] = hp_cfg["parallelism"]
     compute_block = {
-        k: compute_cfg[k] for k in ("gpu_type", "gpu_count", "nodes") if k in compute_cfg
+        k: compute_cfg[k]
+        for k in ("gpu_type", "gpu_count", "nodes")
+        if isinstance(compute_cfg, dict) and k in compute_cfg
     }
     effective = {
         "compute": compute_block,
         "data": {
             "topology": data_cfg.get("topology", {})
-            if isinstance(data_cfg.get("topology"), dict)
+            if isinstance(data_cfg, dict) and isinstance(data_cfg.get("topology"), dict)
             else {}
         },
-        "training": {k: v for k, v in train_cfg.items() if k in ("mode", "use_qlora")},
+        "training": {
+            k: v
+            for k, v in (train_cfg.items() if isinstance(train_cfg, dict) else [])
+            if k in ("mode", "use_qlora")
+        },
     }
     validation_cfg = (
-        train_cfg.get("validation") if isinstance(train_cfg.get("validation"), dict) else None
+        train_cfg.get("validation")
+        if isinstance(train_cfg, dict) and isinstance(train_cfg.get("validation"), dict)
+        else None
     )
     if isinstance(validation_cfg, dict):
         hp_block.update(
@@ -170,13 +249,41 @@ def build_sft_payload(
             "enabled": bool(validation_cfg.get("enabled", True))
         }
-    payload = {
-        "model": job_cfg.get("model") or data.get("model"),
-        "training_file_id": None,  # populated after upload
-        "training_type": "sft_offline",
-        "hyperparameters": hp_block,
-        "metadata": {"effective_config": effective},
-    }
+    raw_model = str(
+        job_cfg.get("model") if isinstance(job_cfg, dict) else None or data.get("model") or ""
+    ).strip()
+    if not raw_model:
+        raise TrainError("Model not specified; set [job].model or [model].base in the config")
+    try:
+        base_model = ensure_allowed_model(
+            raw_model,
+            allow_finetuned_prefixes=False,
+            allow_experimental=allow_experimental,
+        )
+    except UnsupportedModelError as exc:
+        raise TrainError(str(exc)) from exc
+    try:
+        ensure_model_supported_for_algorithm(base_model, spec)
+    except AlgorithmValidationError as exc:
+        raise TrainError(str(exc)) from exc
+    try:
+        payload = prepare_sft_job_payload(
+            model=raw_model,
+            training_file=None,
+            hyperparameters=hp_block,
+            metadata={"effective_config": effective},
+            training_type="sft_offline",
+            training_file_field="training_file_id",
+            require_training_file=False,
+            include_training_file_when_none=True,
+            allow_finetuned_prefixes=False,
+        )
+    except UnsupportedModelError as exc:
+        raise TrainError(str(exc)) from exc
+    except ValueError as exc:
+        raise TrainError(str(exc)) from exc
     return SFTBuildResult(payload=payload, train_file=dataset_path, validation_file=validation_file)

synth_ai/api/train/cli.py CHANGED Viewed

@@ -2,21 +2,22 @@ from __future__ import annotations
 import os
 from pathlib import Path
-from typing import Any, Dict
+from typing import Any
 import click
+from synth_ai.config.base_url import get_backend_from_env
-from .builders import RLBuildResult, SFTBuildResult, build_rl_payload, build_sft_payload
+from .builders import build_rl_payload, build_sft_payload
 from .config_finder import discover_configs, prompt_for_config
 from .env_resolver import KeySpec, resolve_env
 from .pollers import RLJobPoller, SFTJobPoller
 from .task_app import check_task_app_health
 from .utils import (
-    TrainError,
     REPO_ROOT,
+    TrainError,
     ensure_api_base,
-    http_post,
     http_get,
+    http_post,
     limit_jsonl_examples,
     mask_value,
     post_multipart,
@@ -24,7 +25,6 @@ from .utils import (
     sleep,
     validate_sft_jsonl,
 )
-from synth_ai.config.base_url import get_backend_from_env
 def _discover_dataset_candidates(config_path: Path, limit: int = 50) -> list[Path]:
@@ -130,8 +130,23 @@ def _default_backend() -> str:
 )
 @click.option("--backend", default=_default_backend, help="Backend base URL")
 @click.option("--model", default=None, help="Override model identifier")
+@click.option(
+    "--allow-experimental",
+    "allow_experimental",
+    is_flag=True,
+    flag_value=True,
+    default=None,
+    help="Allow experimental models (overrides SDK_EXPERIMENTAL env)",
+)
+@click.option(
+    "--no-allow-experimental",
+    "allow_experimental",
+    is_flag=True,
+    flag_value=False,
+    help="Disallow experimental models (overrides SDK_EXPERIMENTAL env)",
+)
 @click.option("--idempotency", default=None, help="Idempotency-Key header for job creation")
-@click.option("--dry-run", is_flag=True, help="Preview payload without submitting")
+@click.option("--dry-run", is_flag=True, hidden=True, help="Deprecated: no-op")
 @click.option("--poll/--no-poll", default=True, help="Poll job status until terminal state")
 @click.option(
     "--poll-timeout", default=3600.0, type=float, help="Maximum seconds to poll before timing out"
@@ -152,6 +167,7 @@ def train_command(
     dataset_path: str | None,
     backend: str,
     model: str | None,
+    allow_experimental: bool | None,
     idempotency: str | None,
     dry_run: bool,
     poll: bool,
@@ -165,7 +181,9 @@ def train_command(
         list(config_paths), requested_type=train_type if train_type != "auto" else None
     )
     selection = prompt_for_config(
-        candidates, requested_type=train_type if train_type != "auto" else None
+        candidates,
+        requested_type=train_type if train_type != "auto" else None,
+        allow_autoselect=bool(config_paths),
     )
     effective_type = train_type if train_type != "auto" else selection.train_type
@@ -243,6 +261,7 @@ def train_command(
             task_url_override=task_url,
             model_override=model,
             idempotency=idempotency,
+            allow_experimental=allow_experimental,
             dry_run=dry_run,
             poll=poll,
             poll_timeout=poll_timeout,
@@ -255,6 +274,7 @@ def train_command(
             backend_base=backend_base,
             synth_key=synth_key,
             dataset_override=dataset_override_path,
+            allow_experimental=allow_experimental,
             dry_run=dry_run,
             poll=poll,
             poll_timeout=poll_timeout,
@@ -303,7 +323,7 @@ def _wait_for_training_file(
                 error_body = resp.json()
             except Exception:
                 error_body = resp.text[:400]
-            click.echo(f"\n[ERROR] Authentication failed when checking training file:")
+            click.echo("\n[ERROR] Authentication failed when checking training file:")
             click.echo(f"  URL: {url}")
             click.echo(f"  Status: {resp.status_code}")
             click.echo(f"  Response: {error_body}")
@@ -339,12 +359,13 @@ def handle_rl(
     task_url_override: str | None,
     model_override: str | None,
     idempotency: str | None,
+    allow_experimental: bool | None,
     dry_run: bool,
     poll: bool,
     poll_timeout: float,
     poll_interval: float,
 ) -> None:
-    overrides: Dict[str, Any] = {
+    overrides: dict[str, Any] = {
         "backend": backend_base,
         "task_url": task_url_override,
         "model": model_override,
@@ -354,6 +375,7 @@ def handle_rl(
         task_url=task_url_override or os.environ.get("TASK_APP_URL", ""),
         overrides=overrides,
         idempotency=idempotency,
+        allow_experimental=allow_experimental,
     )
     # Backend-side verification: try ALL org environment keys against /health and /task_info
@@ -371,7 +393,7 @@ def handle_rl(
         raise click.ClickException(
             f"Task app verification call failed: {type(_ve).__name__}: {_ve}"
         ) from _ve
-    if vresp.status_code >= 400:
+    if vresp.status_code is not None and vresp.status_code >= 400:
         click.echo("Task app verification error:\n" + preview_json(vjs, limit=800))
         raise click.ClickException(f"Verification failed with status {vresp.status_code}")
     if not bool(vjs.get("any_ok")):
@@ -407,9 +429,6 @@ def handle_rl(
     click.echo(f"POST {create_url}")
     click.echo("Payload preview:\n" + preview_json(build.payload, limit=800))
-    if dry_run:
-        click.echo("Dry run enabled; skipping submission")
-        return
     resp = http_post(create_url, headers=headers, json_body=build.payload)
     try:
@@ -439,6 +458,7 @@ def handle_sft(
     backend_base: str,
     synth_key: str,
     dataset_override: Path | None,
+    allow_experimental: bool | None,
     dry_run: bool,
     poll: bool,
     poll_timeout: float,
@@ -449,7 +469,11 @@ def handle_sft(
     while True:
         try:
-            build = build_sft_payload(config_path=cfg_path, dataset_override=dataset_path)
+            build = build_sft_payload(
+                config_path=cfg_path,
+                dataset_override=dataset_path,
+                allow_experimental=allow_experimental,
+            )
             break
         except TrainError as exc:
             click.echo(str(exc))
@@ -472,54 +496,49 @@ def handle_sft(
             validate_sft_jsonl(build.validation_file)
         upload_url = f"{backend_base}/learning/files"
-        click.echo(f"\n=== Uploading Training Data ===")
+        click.echo("\n=== Uploading Training Data ===")
         click.echo(f"Dataset: {build.train_file}")
         click.echo(f"Destination: {upload_url}")
-        if dry_run:
-            click.echo("Dry run: skipping upload")
-            train_file_id = "dry-run-train"
-            val_file_id = None
-        else:
-            resp = post_multipart(
-                upload_url, api_key=synth_key, file_field="file", file_path=build.train_file
+        resp = post_multipart(
+            upload_url, api_key=synth_key, file_field="file", file_path=build.train_file
+        )
+        js = (
+            resp.json()
+            if resp.headers.get("content-type", "").startswith("application/json")
+            else {}
+        )
+        if resp.status_code is not None and resp.status_code >= 400 or "id" not in js:
+            click.echo("\n[ERROR] Training file upload failed:")
+            click.echo(f"  URL: {upload_url}")
+            click.echo(f"  Status: {resp.status_code}")
+            click.echo(f"  Response: {js or resp.text[:400]}")
+            click.echo(f"  File: {build.train_file}")
+            raise click.ClickException(
+                f"Training file upload failed with status {resp.status_code}"
+            )
+        train_file_id = js["id"]
+        click.echo(f"✓ Training file uploaded (id={train_file_id})")
+        val_file_id = None
+        if build.validation_file:
+            click.echo(f"Uploading validation dataset: {build.validation_file}")
+            vresp = post_multipart(
+                upload_url,
+                api_key=synth_key,
+                file_field="file",
+                file_path=build.validation_file,
             )
-            js = (
-                resp.json()
-                if resp.headers.get("content-type", "").startswith("application/json")
+            vjs = (
+                vresp.json()
+                if vresp.headers.get("content-type", "").startswith("application/json")
                 else {}
             )
-            if resp.status_code >= 400 or "id" not in js:
-                click.echo(f"\n[ERROR] Training file upload failed:")
-                click.echo(f"  URL: {upload_url}")
-                click.echo(f"  Status: {resp.status_code}")
-                click.echo(f"  Response: {js or resp.text[:400]}")
-                click.echo(f"  File: {build.train_file}")
-                raise click.ClickException(
-                    f"Training file upload failed with status {resp.status_code}"
-                )
-            train_file_id = js["id"]
-            click.echo(f"✓ Training file uploaded (id={train_file_id})")
-            val_file_id = None
-            if build.validation_file:
-                click.echo(f"Uploading validation dataset: {build.validation_file}")
-                vresp = post_multipart(
-                    upload_url,
-                    api_key=synth_key,
-                    file_field="file",
-                    file_path=build.validation_file,
-                )
-                vjs = (
-                    vresp.json()
-                    if vresp.headers.get("content-type", "").startswith("application/json")
-                    else {}
+            if vresp.status_code is not None and vresp.status_code < 400 and "id" in vjs:
+                val_file_id = vjs["id"]
+                click.echo(f"✓ Validation file uploaded (id={val_file_id})")
+            else:
+                click.echo(
+                    f"[WARN] Validation upload failed ({vresp.status_code}): {vjs or vresp.text[:200]}"
                 )
-                if vresp.status_code < 400 and "id" in vjs:
-                    val_file_id = vjs["id"]
-                    click.echo(f"✓ Validation file uploaded (id={val_file_id})")
-                else:
-                    click.echo(
-                        f"[WARN] Validation upload failed ({vresp.status_code}): {vjs or vresp.text[:200]}"
-                    )
         payload = dict(build.payload)
         payload["training_file_id"] = train_file_id
         if val_file_id:
@@ -527,18 +546,15 @@ def handle_sft(
                 "data", {}
             )["validation_files"] = [val_file_id]
-        click.echo(f"\n=== Checking File Processing Status ===")
+        click.echo("\n=== Checking File Processing Status ===")
         try:
             _wait_for_training_file(backend_base, synth_key, train_file_id)
         except click.ClickException as exc:
             raise click.ClickException(f"Training file {train_file_id} not ready: {exc}") from exc
-        click.echo(f"\n=== Creating Training Job ===")
+        click.echo("\n=== Creating Training Job ===")
         click.echo("Job payload preview:")
         click.echo(preview_json(payload, limit=800))
-        if dry_run:
-            click.echo("Dry run: skipping job submission")
-            return
         create_url = f"{backend_base}/learning/jobs"
         headers = {"Authorization": f"Bearer {synth_key}", "Content-Type": "application/json"}
@@ -550,7 +566,7 @@ def handle_sft(
             else {}
         )
         if resp.status_code not in (200, 201):
-            click.echo(f"\n[ERROR] Job creation failed:")
+            click.echo("\n[ERROR] Job creation failed:")
             click.echo(f"  URL: {create_url}")
             click.echo(f"  Status: {resp.status_code}")
             click.echo(f"  Response: {preview_json(js, limit=600)}")
@@ -560,14 +576,14 @@ def handle_sft(
             raise click.ClickException("Response missing job id")
         click.echo(f"✓ Job created (id={job_id})")
-        click.echo(f"\n=== Starting Training Job ===")
+        click.echo("\n=== Starting Training Job ===")
         start_url = f"{backend_base}/learning/jobs/{job_id}/start"
         click.echo(f"POST {start_url}")
         start_resp = http_post(start_url, headers=headers, json_body={})
         if start_resp.status_code not in (200, 201):
             click.echo(f"[WARN] Job start returned status {start_resp.status_code}")
         else:
-            click.echo(f"✓ Job started")
+            click.echo("✓ Job started")
         if not poll:
             click.echo(f"Started job {job_id} (polling disabled)")

synth_ai/api/train/config_finder.py CHANGED Viewed

@@ -2,9 +2,9 @@ from __future__ import annotations
 import json
 import os
+from collections.abc import Iterable
 from dataclasses import dataclass
 from pathlib import Path
-from typing import Iterable
 import click
@@ -173,7 +173,7 @@ def discover_configs(explicit: list[str], *, requested_type: str | None) -> list
 def prompt_for_config(
-    candidates: list[ConfigCandidate], *, requested_type: str | None
+    candidates: list[ConfigCandidate], *, requested_type: str | None, allow_autoselect: bool = False
 ) -> ConfigCandidate:
     if not candidates:
         raise click.ClickException("No training configs found. Pass --config explicitly.")
@@ -182,6 +182,11 @@ def prompt_for_config(
     last_config = _load_last_config()
     default_idx = 1
+    if allow_autoselect and len(candidates) == 1:
+        chosen = candidates[0]
+        _save_last_config(chosen.path)
+        return chosen
     if last_config:
         for idx, cand in enumerate(candidates):
             if cand.path.resolve() == last_config:

synth_ai/api/train/env_resolver.py CHANGED Viewed

@@ -1,9 +1,9 @@
 from __future__ import annotations
 import os
+from collections.abc import Callable, Iterable, MutableMapping
 from dataclasses import dataclass
 from pathlib import Path
-from typing import Callable, Iterable, MutableMapping
 import click

synth_ai/api/train/pollers.py CHANGED Viewed

@@ -1,8 +1,9 @@
 from __future__ import annotations
+from collections.abc import Mapping
 from dataclasses import dataclass
 from datetime import datetime
-from typing import Any, Mapping
+from typing import Any
 import click

synth-ai 0.2.9.dev7__py3-none-any.whl → 0.2.10__py3-none-any.whl

Potentially problematic release.

synth-ai 0.2.9.dev7__py3-none-any.whl → 0.2.10__py3-none-any.whl