synth-ai 0.2.9.dev7__py3-none-any.whl → 0.2.9.dev8__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of synth-ai might be problematic; see the registry's advisory page for more details.
- examples/__init__.py +16 -0
- examples/crafter_debug_render.py +8 -11
- examples/qwen_coder/README.md +102 -0
- examples/qwen_coder/_shared.py +113 -0
- examples/qwen_coder/configs/coder_lora_30b.toml +61 -0
- examples/qwen_coder/configs/coder_lora_4b.toml +57 -0
- examples/qwen_coder/configs/coder_lora_small.toml +58 -0
- examples/qwen_coder/generate_dataset.py +98 -0
- examples/qwen_coder/infer_ft_smoke.py +64 -0
- examples/qwen_coder/infer_prod_proxy.py +73 -0
- examples/qwen_coder/infer_via_synth.py +87 -0
- examples/qwen_coder/scripts/infer_coder.sh +18 -0
- examples/qwen_coder/scripts/train_coder_30b.sh +21 -0
- examples/qwen_coder/sft_full_17b.py +103 -0
- examples/qwen_coder/sft_lora_30b.py +110 -0
- examples/qwen_coder/subset_jsonl.py +38 -0
- examples/qwen_coder/validate_jsonl.py +59 -0
- examples/rl/run_eval.py +36 -37
- examples/rl/run_rl_and_save.py +5 -5
- examples/rl/task_app/math_single_step.py +65 -43
- examples/rl/task_app/math_task_app.py +3 -3
- examples/sft/README.md +139 -0
- examples/sft/configs/crafter_fft_qwen0p6b.toml +44 -0
- examples/sft/configs/crafter_lora_qwen0p6b.toml +45 -0
- examples/sft/evaluate.py +117 -0
- examples/sft/export_dataset.py +117 -0
- examples/sft/generate_traces.py +162 -0
- examples/swe/__init__.py +12 -0
- examples/swe/task_app/README.md +105 -0
- examples/swe/task_app/__init__.py +2 -0
- examples/swe/task_app/grpo_swe_mini.py +571 -0
- examples/swe/task_app/grpo_swe_mini_task_app.py +136 -0
- examples/swe/task_app/hosted/README.md +173 -0
- examples/swe/task_app/hosted/__init__.py +5 -0
- examples/swe/task_app/hosted/branching.py +143 -0
- examples/swe/task_app/hosted/environment_routes.py +1289 -0
- examples/swe/task_app/hosted/envs/__init__.py +1 -0
- examples/swe/task_app/hosted/envs/crafter/__init__.py +6 -0
- examples/swe/task_app/hosted/envs/crafter/app.py +1 -0
- examples/swe/task_app/hosted/envs/crafter/environment.py +522 -0
- examples/swe/task_app/hosted/envs/crafter/policy.py +478 -0
- examples/swe/task_app/hosted/envs/crafter/react_agent.py +108 -0
- examples/swe/task_app/hosted/envs/crafter/shared.py +305 -0
- examples/swe/task_app/hosted/envs/crafter/tools.py +47 -0
- examples/swe/task_app/hosted/envs/mini_swe/__init__.py +8 -0
- examples/swe/task_app/hosted/envs/mini_swe/environment.py +1164 -0
- examples/swe/task_app/hosted/envs/mini_swe/policy.py +355 -0
- examples/swe/task_app/hosted/envs/mini_swe/shared.py +83 -0
- examples/swe/task_app/hosted/envs/mini_swe/tools.py +96 -0
- examples/swe/task_app/hosted/hosted_app.py +204 -0
- examples/swe/task_app/hosted/inference/__init__.py +5 -0
- examples/swe/task_app/hosted/inference/openai_client.py +618 -0
- examples/swe/task_app/hosted/main.py +100 -0
- examples/swe/task_app/hosted/policy_routes.py +1079 -0
- examples/swe/task_app/hosted/registry.py +195 -0
- examples/swe/task_app/hosted/rollout.py +1869 -0
- examples/swe/task_app/hosted/storage/__init__.py +5 -0
- examples/swe/task_app/hosted/storage/volume.py +211 -0
- examples/swe/task_app/hosted/test_agents.py +161 -0
- examples/swe/task_app/hosted/test_service.py +137 -0
- examples/swe/task_app/hosted/utils.py +62 -0
- examples/vlm/README.md +68 -0
- examples/vlm/configs/crafter_vlm_gpt4o.toml +44 -0
- examples/vlm/crafter_image_only_agent.py +207 -0
- examples/vlm/crafter_openai_vlm_agent.py +277 -0
- examples/vlm/filter_image_rows.py +63 -0
- examples/vlm/run_crafter_vlm_benchmark.py +316 -0
- examples/warming_up_to_rl/analyze_trace_db.py +5 -5
- examples/warming_up_to_rl/configs/rl_from_base_qwen4b.toml +11 -1
- examples/warming_up_to_rl/export_trace_sft.py +78 -21
- examples/warming_up_to_rl/groq_test.py +4 -4
- examples/warming_up_to_rl/manage_secrets.py +13 -18
- examples/warming_up_to_rl/run_eval.py +42 -44
- examples/warming_up_to_rl/run_fft_and_save.py +11 -16
- examples/warming_up_to_rl/run_local_rollout.py +1 -3
- examples/warming_up_to_rl/run_local_rollout_modal.py +2 -4
- examples/warming_up_to_rl/run_local_rollout_parallel.py +1 -4
- examples/warming_up_to_rl/run_local_rollout_traced.py +3 -5
- examples/warming_up_to_rl/run_rl_and_save.py +5 -6
- examples/warming_up_to_rl/run_rollout_remote.py +8 -10
- examples/warming_up_to_rl/task_app/README.md +6 -2
- examples/warming_up_to_rl/task_app/grpo_crafter.py +234 -35
- examples/warming_up_to_rl/task_app/grpo_crafter_task_app.py +2 -3
- examples/warming_up_to_rl/task_app/synth_envs_hosted/__init__.py +1 -1
- examples/warming_up_to_rl/task_app/synth_envs_hosted/branching.py +9 -11
- examples/warming_up_to_rl/task_app/synth_envs_hosted/environment_routes.py +131 -114
- examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/environment.py +101 -41
- examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/policy.py +73 -51
- examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/react_agent.py +14 -6
- examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/shared.py +16 -16
- examples/warming_up_to_rl/task_app/synth_envs_hosted/hosted_app.py +32 -34
- examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/openai_client.py +94 -31
- examples/warming_up_to_rl/task_app/synth_envs_hosted/main.py +0 -2
- examples/warming_up_to_rl/task_app/synth_envs_hosted/policy_routes.py +303 -203
- examples/warming_up_to_rl/task_app/synth_envs_hosted/registry.py +21 -23
- examples/warming_up_to_rl/task_app/synth_envs_hosted/rollout.py +328 -225
- examples/warming_up_to_rl/task_app/synth_envs_hosted/storage/volume.py +13 -13
- examples/warming_up_to_rl/task_app/synth_envs_hosted/test_agents.py +1 -0
- examples/warming_up_to_rl/task_app/synth_envs_hosted/test_service.py +1 -0
- examples/warming_up_to_rl/task_app/synth_envs_hosted/utils.py +4 -3
- synth/__init__.py +14 -0
- synth_ai/__init__.py +26 -4
- synth_ai/api/models/supported.py +376 -0
- synth_ai/api/train/builders.py +128 -21
- synth_ai/api/train/cli.py +80 -64
- synth_ai/api/train/config_finder.py +7 -2
- synth_ai/api/train/env_resolver.py +1 -1
- synth_ai/api/train/pollers.py +2 -1
- synth_ai/api/train/supported_algos.py +139 -0
- synth_ai/api/train/task_app.py +1 -2
- synth_ai/api/train/utils.py +13 -44
- synth_ai/cli/__init__.py +8 -0
- synth_ai/cli/_modal_wrapper.py +28 -0
- synth_ai/cli/_typer_patch.py +49 -0
- synth_ai/cli/balance.py +1 -2
- synth_ai/cli/calc.py +1 -1
- synth_ai/cli/demo.py +2 -1
- synth_ai/cli/recent.py +2 -2
- synth_ai/cli/rl_demo.py +2 -1
- synth_ai/cli/root.py +11 -13
- synth_ai/cli/status.py +2 -2
- synth_ai/cli/task_apps.py +529 -179
- synth_ai/cli/traces.py +6 -4
- synth_ai/cli/watch.py +12 -18
- synth_ai/demo_registry.py +1 -1
- synth_ai/demos/core/cli.py +36 -43
- synth_ai/demos/demo_task_apps/__init__.py +3 -3
- synth_ai/demos/demo_task_apps/core.py +17 -25
- synth_ai/demos/demo_task_apps/crafter/grpo_crafter_task_app.py +3 -4
- synth_ai/demos/demo_task_apps/math/app.py +2 -1
- synth_ai/demos/demo_task_apps/math/deploy_modal.py +3 -4
- synth_ai/demos/demo_task_apps/math/modal_task_app.py +16 -18
- synth_ai/demos/demo_task_apps/math/task_app_entry.py +0 -1
- synth_ai/environments/examples/crafter_classic/environment.py +76 -1
- synth_ai/environments/reproducibility/tree.py +2 -5
- synth_ai/environments/service/app.py +11 -12
- synth_ai/environments/service/core_routes.py +4 -7
- synth_ai/environments/stateful/engine.py +1 -1
- synth_ai/environments/tasks/core.py +1 -0
- synth_ai/environments/tasks/filters.py +5 -6
- synth_ai/environments/tasks/utils.py +4 -5
- synth_ai/handshake.py +9 -9
- synth_ai/http.py +1 -1
- synth_ai/http_client.py +18 -10
- synth_ai/inference/client.py +15 -5
- synth_ai/jobs/client.py +78 -83
- synth_ai/learning/__init__.py +41 -6
- synth_ai/learning/algorithms.py +14 -0
- synth_ai/learning/client.py +91 -24
- synth_ai/learning/config.py +2 -38
- synth_ai/learning/ft_client.py +4 -59
- synth_ai/learning/health.py +5 -6
- synth_ai/learning/jobs.py +31 -47
- synth_ai/{rl → learning/rl}/__init__.py +14 -4
- synth_ai/learning/rl/client.py +267 -0
- synth_ai/learning/rl/config.py +31 -0
- synth_ai/{rl → learning/rl}/contracts.py +5 -8
- synth_ai/{rl → learning/rl}/env_keys.py +39 -15
- synth_ai/learning/rl/secrets.py +13 -0
- synth_ai/learning/rl_client.py +2 -281
- synth_ai/learning/sft/__init__.py +29 -0
- synth_ai/learning/sft/client.py +68 -0
- synth_ai/learning/sft/config.py +270 -0
- synth_ai/learning/sft/data.py +295 -0
- synth_ai/learning/sse.py +25 -24
- synth_ai/learning/validators.py +25 -28
- synth_ai/lm/__init__.py +21 -47
- synth_ai/main.py +4 -0
- synth_ai/task/__init__.py +25 -27
- synth_ai/task/apps/__init__.py +7 -8
- synth_ai/task/auth.py +8 -8
- synth_ai/task/client.py +14 -14
- synth_ai/task/contracts.py +36 -35
- synth_ai/task/datasets.py +6 -5
- synth_ai/task/errors.py +10 -10
- synth_ai/task/health.py +17 -9
- synth_ai/task/json.py +58 -23
- synth_ai/task/proxy.py +13 -9
- synth_ai/task/rubrics.py +16 -15
- synth_ai/task/server.py +12 -12
- synth_ai/task/tracing_utils.py +4 -4
- synth_ai/task/vendors.py +5 -6
- synth_ai/tracing_v3/__init__.py +2 -0
- synth_ai/tracing_v3/abstractions.py +21 -4
- synth_ai/tracing_v3/decorators.py +18 -16
- synth_ai/tracing_v3/hooks.py +5 -5
- synth_ai/tracing_v3/llm_call_record_helpers.py +6 -6
- synth_ai/tracing_v3/session_tracer.py +40 -14
- synth_ai/tracing_v3/storage/base.py +85 -0
- synth_ai/tracing_v3/storage/config.py +21 -8
- synth_ai/tracing_v3/storage/factory.py +10 -7
- synth_ai/tracing_v3/storage/utils.py +4 -2
- synth_ai/tracing_v3/turso/daemon.py +7 -2
- synth_ai/tracing_v3/turso/models.py +2 -2
- synth_ai/tracing_v3/turso/native_manager.py +1173 -0
- synth_ai/tracing_v3/utils.py +4 -4
- synth_ai/v0/api/__init__.py +8 -0
- synth_ai/v0/api/models/__init__.py +8 -0
- synth_ai/v0/api/models/supported.py +8 -0
- synth_ai/v0/config/__init__.py +15 -0
- synth_ai/v0/config/base_url.py +12 -0
- synth_ai/v0/lm/__init__.py +51 -0
- synth_ai/{lm → v0/lm}/caching/ephemeral.py +2 -2
- synth_ai/{lm → v0/lm}/caching/handler.py +4 -4
- synth_ai/{lm → v0/lm}/caching/initialize.py +1 -1
- synth_ai/{lm → v0/lm}/caching/persistent.py +1 -1
- synth_ai/{lm → v0/lm}/config.py +6 -1
- synth_ai/{lm → v0/lm}/core/all.py +9 -9
- synth_ai/{lm → v0/lm}/core/main.py +6 -6
- synth_ai/{lm → v0/lm}/core/main_v3.py +10 -10
- synth_ai/{lm → v0/lm}/core/synth_models.py +2 -14
- synth_ai/{lm → v0/lm}/core/vendor_clients.py +2 -2
- synth_ai/{lm → v0/lm}/overrides.py +2 -2
- synth_ai/{lm → v0/lm}/provider_support/anthropic.py +4 -4
- synth_ai/{lm → v0/lm}/provider_support/openai.py +5 -5
- synth_ai/{lm → v0/lm}/structured_outputs/handler.py +5 -5
- synth_ai/{lm → v0/lm}/structured_outputs/rehabilitate.py +1 -1
- synth_ai/{lm → v0/lm}/vendors/core/anthropic_api.py +9 -9
- synth_ai/{lm → v0/lm}/vendors/core/gemini_api.py +5 -5
- synth_ai/{lm → v0/lm}/vendors/core/mistral_api.py +5 -5
- synth_ai/{lm → v0/lm}/vendors/core/openai_api.py +10 -10
- synth_ai/{lm → v0/lm}/vendors/openai_standard.py +8 -8
- synth_ai/{lm → v0/lm}/vendors/openai_standard_responses.py +2 -2
- synth_ai/{lm → v0/lm}/vendors/supported/custom_endpoint.py +3 -3
- synth_ai/{lm → v0/lm}/vendors/supported/deepseek.py +2 -2
- synth_ai/{lm → v0/lm}/vendors/supported/grok.py +2 -2
- synth_ai/{lm → v0/lm}/vendors/supported/groq.py +1 -1
- synth_ai/{lm → v0/lm}/vendors/supported/ollama.py +1 -1
- synth_ai/{lm → v0/lm}/vendors/supported/openrouter.py +3 -3
- synth_ai/{lm → v0/lm}/vendors/supported/together.py +1 -1
- synth_ai/{lm → v0/lm}/vendors/synth_client.py +1 -1
- synth_ai/v0/tracing_v3/__init__.py +10 -0
- synth_ai/v0/tracing_v3/abstractions.py +3 -0
- synth_ai/v0/tracing_v3/decorators.py +3 -0
- synth_ai/v0/tracing_v3/llm_call_record_helpers.py +3 -0
- synth_ai/v0/tracing_v3/session_tracer.py +3 -0
- synth_ai-0.2.9.dev8.dist-info/METADATA +191 -0
- {synth_ai-0.2.9.dev7.dist-info → synth_ai-0.2.9.dev8.dist-info}/RECORD +268 -238
- {synth_ai-0.2.9.dev7.dist-info → synth_ai-0.2.9.dev8.dist-info}/top_level.txt +1 -0
- examples/common_old/backend.py +0 -20
- examples/evals_old/README.md +0 -98
- examples/evals_old/__init__.py +0 -6
- examples/evals_old/compare_models.py +0 -1038
- examples/evals_old/example_log.md +0 -145
- examples/evals_old/run_demo.sh +0 -126
- examples/evals_old/trace_analysis.py +0 -270
- examples/finetuning_old/_backup_synth_qwen/config.toml +0 -29
- examples/finetuning_old/_backup_synth_qwen/example_log.md +0 -324
- examples/finetuning_old/_backup_synth_qwen/filter_traces.py +0 -60
- examples/finetuning_old/_backup_synth_qwen/filter_traces_achievements.py +0 -243
- examples/finetuning_old/_backup_synth_qwen/purge_v3_traces.py +0 -109
- examples/finetuning_old/_backup_synth_qwen/react_agent_lm.py +0 -1924
- examples/finetuning_old/_backup_synth_qwen/readme.md +0 -49
- examples/finetuning_old/_backup_synth_qwen/run_crafter_qwen4b.py +0 -114
- examples/finetuning_old/_backup_synth_qwen/run_demo.sh +0 -195
- examples/finetuning_old/_backup_synth_qwen/sft_kickoff.py +0 -119
- examples/finetuning_old/synth_qwen_v1/README.md +0 -68
- examples/finetuning_old/synth_qwen_v1/filter_traces.py +0 -60
- examples/finetuning_old/synth_qwen_v1/filter_traces_achievements.py +0 -243
- examples/finetuning_old/synth_qwen_v1/finetune.py +0 -46
- examples/finetuning_old/synth_qwen_v1/hello_ft_model.py +0 -71
- examples/finetuning_old/synth_qwen_v1/infer.py +0 -36
- examples/finetuning_old/synth_qwen_v1/poll.py +0 -46
- examples/finetuning_old/synth_qwen_v1/prepare_data.py +0 -35
- examples/finetuning_old/synth_qwen_v1/purge_v3_traces.py +0 -109
- examples/finetuning_old/synth_qwen_v1/react_agent_lm.py +0 -1933
- examples/finetuning_old/synth_qwen_v1/run_crafter_sft_job.py +0 -210
- examples/finetuning_old/synth_qwen_v1/run_ft_job.py +0 -237
- examples/finetuning_old/synth_qwen_v1/upload_data.py +0 -34
- examples/finetuning_old/synth_qwen_v1/util.py +0 -152
- examples/rl_old/task_app.py +0 -1131
- examples/warming_up_to_rl/old/event_rewards.md +0 -234
- examples/warming_up_to_rl/old/notes.md +0 -73
- synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/filter_traces_sft_turso.py +0 -738
- synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/filter_traces_sft_turso.py +0 -580
- synth_ai/experimental/synth_oss.py +0 -445
- synth_ai/learning/filtering.py +0 -0
- synth_ai/learning/offline/dpo.py +0 -0
- synth_ai/learning/offline/providers.py +0 -7
- synth_ai/learning/offline/sft.py +0 -0
- synth_ai/learning/offline/shared.py +0 -0
- synth_ai/learning/online/grpo.py +0 -0
- synth_ai/learning/online/irft.py +0 -0
- synth_ai/learning/prompts/banking77_injection_eval.py +0 -168
- synth_ai/learning/prompts/gepa.py +0 -0
- synth_ai/learning/prompts/hello_world_in_context_injection_ex.py +0 -211
- synth_ai/learning/prompts/mipro.py +0 -289
- synth_ai/learning/prompts/random_search.py +0 -249
- synth_ai/learning/prompts/run_mipro_banking77.py +0 -172
- synth_ai/learning/prompts/run_random_search_banking77.py +0 -329
- synth_ai/rl/secrets.py +0 -19
- synth_ai/scripts/verify_rewards.py +0 -100
- synth_ai/tracing/__init__.py +0 -30
- synth_ai/tracing_v1/__init__.py +0 -33
- synth_ai/tracing_v3/turso/__init__.py +0 -25
- synth_ai/tracing_v3/turso/manager.py +0 -838
- synth_ai/zyk/__init__.py +0 -30
- synth_ai-0.2.9.dev7.dist-info/METADATA +0 -131
- /synth_ai/{lm → v0/lm}/caching/__init__.py +0 -0
- /synth_ai/{lm → v0/lm}/caching/constants.py +0 -0
- /synth_ai/{lm → v0/lm}/caching/dbs.py +0 -0
- /synth_ai/{lm → v0/lm}/constants.py +0 -0
- /synth_ai/{lm → v0/lm}/core/__init__.py +0 -0
- /synth_ai/{lm → v0/lm}/core/exceptions.py +0 -0
- /synth_ai/{lm → v0/lm}/cost/__init__.py +0 -0
- /synth_ai/{lm → v0/lm}/cost/monitor.py +0 -0
- /synth_ai/{lm → v0/lm}/cost/statefulness.py +0 -0
- /synth_ai/{lm → v0/lm}/injection.py +0 -0
- /synth_ai/{lm → v0/lm}/provider_support/__init__.py +0 -0
- /synth_ai/{lm → v0/lm}/provider_support/suppress_logging.py +0 -0
- /synth_ai/{lm → v0/lm}/structured_outputs/__init__.py +0 -0
- /synth_ai/{lm → v0/lm}/structured_outputs/inject.py +0 -0
- /synth_ai/{lm → v0/lm}/tools/__init__.py +0 -0
- /synth_ai/{lm → v0/lm}/tools/base.py +0 -0
- /synth_ai/{lm → v0/lm}/unified_interface.py +0 -0
- /synth_ai/{lm → v0/lm}/vendors/__init__.py +0 -0
- /synth_ai/{lm → v0/lm}/vendors/base.py +0 -0
- /synth_ai/{lm → v0/lm}/vendors/core/__init__.py +0 -0
- /synth_ai/{lm → v0/lm}/vendors/core/synth_dev_api.py +0 -0
- /synth_ai/{lm → v0/lm}/vendors/local/__init__.py +0 -0
- /synth_ai/{lm → v0/lm}/vendors/local/ollama.py +0 -0
- /synth_ai/{lm → v0/lm}/vendors/retries.py +0 -0
- /synth_ai/{lm → v0/lm}/vendors/supported/__init__.py +0 -0
- /synth_ai/{lm → v0/lm}/warmup.py +0 -0
- {synth_ai-0.2.9.dev7.dist-info → synth_ai-0.2.9.dev8.dist-info}/WHEEL +0 -0
- {synth_ai-0.2.9.dev7.dist-info → synth_ai-0.2.9.dev8.dist-info}/entry_points.txt +0 -0
- {synth_ai-0.2.9.dev7.dist-info → synth_ai-0.2.9.dev8.dist-info}/licenses/LICENSE +0 -0
|
@@ -0,0 +1,270 @@
|
|
|
1
|
+
"""Utilities for validating and constructing SFT job payloads."""
|
|
2
|
+
|
|
3
|
+
from __future__ import annotations
|
|
4
|
+
|
|
5
|
+
from collections.abc import Mapping
|
|
6
|
+
from dataclasses import dataclass, field, fields
|
|
7
|
+
from typing import Any
|
|
8
|
+
|
|
9
|
+
from synth_ai.api.models.supported import (
|
|
10
|
+
UnsupportedModelError,
|
|
11
|
+
normalize_model_identifier,
|
|
12
|
+
)
|
|
13
|
+
|
|
14
|
+
# Keys that can express training duration; `from_mapping` requires at least one.
_STEP_KEYS = ("n_epochs", "total_steps", "train_steps", "steps")
|
|
15
|
+
|
|
16
|
+
|
|
17
|
+
def _ensure_positive_int(value: Any, *, key: str) -> int:
|
|
18
|
+
if isinstance(value, bool):
|
|
19
|
+
raise ValueError(f"hyperparameters.{key} must be an integer greater than zero")
|
|
20
|
+
try:
|
|
21
|
+
ivalue = int(value)
|
|
22
|
+
except (TypeError, ValueError) as exc: # pragma: no cover - defensive
|
|
23
|
+
raise ValueError(f"hyperparameters.{key} must be an integer greater than zero") from exc
|
|
24
|
+
if ivalue <= 0:
|
|
25
|
+
raise ValueError(f"hyperparameters.{key} must be an integer greater than zero")
|
|
26
|
+
return ivalue
|
|
27
|
+
|
|
28
|
+
|
|
29
|
+
def _ensure_non_negative_float(value: Any, *, key: str) -> float:
|
|
30
|
+
if isinstance(value, bool):
|
|
31
|
+
raise ValueError(f"hyperparameters.{key} must be a float greater than or equal to zero")
|
|
32
|
+
try:
|
|
33
|
+
fvalue = float(value)
|
|
34
|
+
except (TypeError, ValueError) as exc: # pragma: no cover - defensive
|
|
35
|
+
raise ValueError(
|
|
36
|
+
f"hyperparameters.{key} must be a float greater than or equal to zero"
|
|
37
|
+
) from exc
|
|
38
|
+
if fvalue < 0:
|
|
39
|
+
raise ValueError(f"hyperparameters.{key} must be a float greater than or equal to zero")
|
|
40
|
+
return fvalue
|
|
41
|
+
|
|
42
|
+
|
|
43
|
+
def _ensure_positive_float(value: Any, *, key: str) -> float:
    """Coerce *value* to a ``float`` strictly greater than zero."""
    result = _ensure_non_negative_float(value, key=key)
    # 0.0 is the only non-negative value that fails the strict check.
    if not result:
        raise ValueError(f"hyperparameters.{key} must be greater than zero")
    return result
|
|
48
|
+
|
|
49
|
+
|
|
50
|
+
@dataclass(slots=True)
class SFTTrainingHyperparameters:
    """Typed representation of SFT training hyperparameters.

    Known keys are validated and stored as attributes; unrecognized keys are
    preserved verbatim in ``extras`` so they round-trip through :meth:`to_dict`.
    """

    n_epochs: int | None = None
    total_steps: int | None = None
    train_steps: int | None = None
    steps: int | None = None
    batch_size: int | None = None
    global_batch: int | None = None
    per_device_batch: int | None = None
    gradient_accumulation_steps: int | None = None
    sequence_length: int | None = None
    learning_rate: float | None = None
    warmup_ratio: float | None = None
    train_kind: str | None = None
    extras: dict[str, Any] = field(default_factory=dict)

    @classmethod
    def from_mapping(cls, data: Mapping[str, Any] | None) -> SFTTrainingHyperparameters:
        """Build a validated instance from a raw mapping.

        Raises:
            ValueError: if *data* is empty or ``None``, if any known key fails
                validation, or if none of the step-count keys in ``_STEP_KEYS``
                is present.
        """
        if data is None:
            raise ValueError("hyperparameters must not be empty")
        normalized: dict[str, Any] = dict(data)
        if not normalized:
            raise ValueError("hyperparameters must not be empty")

        kwargs: dict[str, Any] = {}

        # Previously there were two byte-identical helpers (pop_int and
        # pop_optional_int); a single validate-and-remove helper suffices.
        def pop_int(name: str) -> int | None:
            if name not in normalized:
                return None
            return _ensure_positive_int(normalized.pop(name), key=name)

        def pop_positive_float(name: str) -> float | None:
            if name not in normalized:
                return None
            return _ensure_positive_float(normalized.pop(name), key=name)

        def pop_non_negative_float(name: str) -> float | None:
            if name not in normalized:
                return None
            return _ensure_non_negative_float(normalized.pop(name), key=name)

        # At least one step-derived key is required.
        step_values = {name: pop_int(name) for name in _STEP_KEYS}
        if not any(step_values.values()):
            keys = ", ".join(_STEP_KEYS)
            raise ValueError(f"hyperparameters must include at least one of: {keys}")
        kwargs.update(step_values)

        for name in (
            "batch_size",
            "global_batch",
            "per_device_batch",
            "gradient_accumulation_steps",
            "sequence_length",
        ):
            kwargs[name] = pop_int(name)
        kwargs["learning_rate"] = pop_positive_float("learning_rate")
        kwargs["warmup_ratio"] = pop_non_negative_float("warmup_ratio")

        # The key is always assigned above, so only the None check is needed
        # (the previous `"warmup_ratio" in kwargs` membership test was dead).
        ratio = kwargs["warmup_ratio"]
        if ratio is not None and ratio > 1:
            raise ValueError("hyperparameters.warmup_ratio must be between 0 and 1 inclusive")

        if "train_kind" in normalized:
            value = normalized.pop("train_kind")
            if not isinstance(value, str):
                raise ValueError("hyperparameters.train_kind must be a string")
            kwargs["train_kind"] = value

        # Whatever was not consumed above is carried through untouched.
        return cls(extras=normalized, **kwargs)

    def to_dict(self) -> dict[str, Any]:
        """Serialize to a plain dict, omitting ``None`` fields; ``extras`` wins on key collisions."""
        result: dict[str, Any] = {}
        for field_info in fields(self):
            if field_info.name == "extras":
                continue
            value = getattr(self, field_info.name)
            if value is not None:
                result[field_info.name] = value
        result.update(self.extras)
        return result
|
|
146
|
+
|
|
147
|
+
|
|
148
|
+
def _coerce_mapping(value: Mapping[str, Any] | None, *, name: str) -> dict[str, Any]:
|
|
149
|
+
if value is None:
|
|
150
|
+
return {}
|
|
151
|
+
if not isinstance(value, Mapping):
|
|
152
|
+
raise ValueError(f"{name} must be a mapping")
|
|
153
|
+
return dict(value)
|
|
154
|
+
|
|
155
|
+
|
|
156
|
+
@dataclass(slots=True)
class SFTJobConfig:
    """Structured representation of an SFT training job request."""

    model: str
    hyperparameters: Mapping[str, Any] | SFTTrainingHyperparameters
    training_file: str | None = None
    metadata: Mapping[str, Any] | None = None
    training_type: str | None = "sft_offline"
    validation_file: str | None = None
    suffix: str | None = None
    integrations: Mapping[str, Any] | None = None

    def to_payload(
        self,
        *,
        training_file_field: str = "training_file_id",
        require_training_file: bool = True,
        include_training_file_when_none: bool = False,
        allow_finetuned_prefixes: bool = False,
    ) -> dict[str, Any]:
        """Validate this config and render the request payload.

        Optional fields are included only when they carry a non-empty value.
        Raises ``ValueError`` when the training file is required but missing,
        or when any nested mapping / hyperparameter fails validation.
        """
        model = normalize_model_identifier(
            self.model, allow_finetuned_prefixes=allow_finetuned_prefixes
        )
        if isinstance(self.hyperparameters, SFTTrainingHyperparameters):
            hyper_config = self.hyperparameters
        else:
            hyper_config = SFTTrainingHyperparameters.from_mapping(
                _coerce_mapping(self.hyperparameters, name="hyperparameters")
            )

        payload: dict[str, Any] = {
            "model": model,
            "hyperparameters": hyper_config.to_dict(),
        }

        # Optional string field: include only when non-blank after stripping.
        training_type = (self.training_type or "").strip()
        if training_type:
            payload["training_type"] = training_type

        # Optional mapping fields: include only when non-empty.
        for key, raw in (("metadata", self.metadata), ("integrations", self.integrations)):
            coerced = _coerce_mapping(raw, name=key)
            if coerced:
                payload[key] = coerced

        suffix = (self.suffix or "").strip()
        if suffix:
            payload["suffix"] = suffix

        validation_file = (self.validation_file or "").strip()
        if validation_file:
            payload["validation_file"] = validation_file

        if training_file_field:
            training_file = (self.training_file or "").strip()
            if training_file:
                payload[training_file_field] = training_file
            elif require_training_file:
                raise ValueError("training file identifier is required for SFT jobs")
            elif include_training_file_when_none:
                payload[training_file_field] = None

        return payload
|
|
223
|
+
|
|
224
|
+
|
|
225
|
+
def prepare_sft_job_payload(
    *,
    model: str,
    hyperparameters: Mapping[str, Any] | SFTTrainingHyperparameters | None,
    training_file: str | None = None,
    metadata: Mapping[str, Any] | None = None,
    training_type: str | None = "sft_offline",
    validation_file: str | None = None,
    suffix: str | None = None,
    integrations: Mapping[str, Any] | None = None,
    training_file_field: str = "training_file_id",
    require_training_file: bool = True,
    include_training_file_when_none: bool = False,
    allow_finetuned_prefixes: bool = False,
) -> dict[str, Any]:
    """Validate inputs and return an SFT job payload suitable for API calls."""
    # Coerce raw mappings (or None) into the typed hyperparameter container.
    if not isinstance(hyperparameters, SFTTrainingHyperparameters):
        hyperparameters = SFTTrainingHyperparameters.from_mapping(hyperparameters or {})

    return SFTJobConfig(
        model=model,
        training_file=training_file,
        hyperparameters=hyperparameters,
        metadata=metadata,
        training_type=training_type,
        validation_file=validation_file,
        suffix=suffix,
        integrations=integrations,
    ).to_payload(
        training_file_field=training_file_field,
        require_training_file=require_training_file,
        include_training_file_when_none=include_training_file_when_none,
        allow_finetuned_prefixes=allow_finetuned_prefixes,
    )
|
|
263
|
+
|
|
264
|
+
|
|
265
|
+
# Public API of this module.
__all__ = [
    "SFTTrainingHyperparameters",
    "SFTJobConfig",
    "prepare_sft_job_payload",
    "UnsupportedModelError",
]
|
|
@@ -0,0 +1,295 @@
|
|
|
1
|
+
from __future__ import annotations
|
|
2
|
+
|
|
3
|
+
import json
|
|
4
|
+
from collections.abc import Iterable, Iterator, Sequence
|
|
5
|
+
from dataclasses import dataclass, field
|
|
6
|
+
from pathlib import Path
|
|
7
|
+
from typing import Any
|
|
8
|
+
|
|
9
|
+
# Message content may be plain text, a structured part, a list of parts, or absent.
SFTMessageContent = str | dict[str, Any] | list[Any] | None
|
|
10
|
+
|
|
11
|
+
|
|
12
|
+
class SFTDataError(ValueError):
    """Raised when a JSONL record cannot be coerced into an SFTExample.

    Subclasses ``ValueError`` so callers may catch either type.
    """
|
|
14
|
+
|
|
15
|
+
|
|
16
|
+
@dataclass(slots=True)
class SFTToolDefinition:
    """Normalized view of one tool (function) definition from a JSONL record."""

    name: str  # tool name; non-empty string
    description: str | None  # optional human-readable description
    parameters: dict[str, Any] | None  # optional parameters object (presumably JSON schema -- verify)
    raw: dict[str, Any] = field(default_factory=dict)  # original record payload, unmodified
|
|
22
|
+
|
|
23
|
+
|
|
24
|
+
@dataclass(slots=True)
class SFTToolCall:
    """Normalized assistant tool invocation parsed from a JSONL record."""

    name: str  # function name being invoked
    arguments: Any  # arguments, JSON-decoded when they were a decodable string
    call_id: str | None = None  # provider-assigned call id, stringified
    type: str | None = None  # call type as given, stringified
    raw: dict[str, Any] = field(default_factory=dict)  # original payload as given
|
|
31
|
+
|
|
32
|
+
|
|
33
|
+
@dataclass(slots=True)
class SFTMessage:
    """One chat message within an SFT training example."""

    role: str  # message role; non-empty string
    content: SFTMessageContent  # text, structured part(s), or None
    tool_calls: list[SFTToolCall] = field(default_factory=list)  # assistant tool invocations
    tool_call_id: str | None = None  # presumably links a tool message to its call -- verify against parser
    name: str | None = None  # optional participant/tool name
    extra: dict[str, Any] = field(default_factory=dict)  # unrecognized keys preserved
|
|
41
|
+
|
|
42
|
+
|
|
43
|
+
@dataclass(slots=True)
class SFTExample:
    """A single supervised fine-tuning example: a conversation plus tool context."""

    messages: list[SFTMessage]  # ordered conversation turns
    tools: list[SFTToolDefinition] = field(default_factory=list)  # tools available to the model
    tool_choice: Any | None = None  # tool-choice directive, stored as-is
    metadata: dict[str, Any] = field(default_factory=dict)  # per-example metadata
    extra: dict[str, Any] = field(default_factory=dict)  # unrecognized record keys
|
|
50
|
+
|
|
51
|
+
|
|
52
|
+
def _parse_tool_arguments(value: Any) -> Any:
|
|
53
|
+
if isinstance(value, str):
|
|
54
|
+
try:
|
|
55
|
+
return json.loads(value)
|
|
56
|
+
except json.JSONDecodeError:
|
|
57
|
+
return value
|
|
58
|
+
return value
|
|
59
|
+
|
|
60
|
+
|
|
61
|
+
def _coerce_tool_definition(raw: Any, *, index: int) -> SFTToolDefinition:
    """Validate one entry of a record's ``tools`` list and normalize it.

    Raises:
        SFTDataError: if the entry is not an object, lacks a non-empty name,
            or has a non-string description / non-object parameters.
    """
    if not isinstance(raw, dict):
        raise SFTDataError(f"tool {index} is not an object")

    name = raw.get("name")
    description = raw.get("description")
    parameters = raw.get("parameters")

    if not (isinstance(name, str) and name.strip()):
        raise SFTDataError(f"tool {index} missing name")
    if not isinstance(description, (str, type(None))):
        raise SFTDataError(f"tool {index} description must be a string if present")
    if not isinstance(parameters, (dict, type(None))):
        raise SFTDataError(f"tool {index} parameters must be an object if present")

    return SFTToolDefinition(
        name=name, description=description, parameters=parameters, raw=dict(raw)
    )
|
|
76
|
+
|
|
77
|
+
|
|
78
|
+
def _coerce_tool_call(raw: Any, *, index: int) -> SFTToolCall:
    """Normalize one tool-call payload into an SFTToolCall.

    Accepts both the nested OpenAI shape ``{"function": {"name", "arguments"}}``
    and the flat shape ``{"name", "arguments"}``. The nested name wins; when it
    is absent, both name AND arguments are taken from the top level. ``id`` and
    ``type`` are stringified when present, left as None otherwise.
    """
    if not isinstance(raw, dict):
        raise SFTDataError(f"tool_call {index} is not an object")

    name: str | None = None
    arguments: Any = None

    function_block = raw.get("function")
    if isinstance(function_block, dict):
        candidate = function_block.get("name")
        name = candidate if isinstance(candidate, str) else None
        arguments = function_block.get("arguments")
    if name is None:
        # Flat fallback: only adopted when the top-level name is a string,
        # and then the top-level arguments replace any nested ones.
        top_level_name = raw.get("name")
        if isinstance(top_level_name, str):
            name = top_level_name
            arguments = raw.get("arguments")

    if not isinstance(name, str) or not name.strip():
        raise SFTDataError(f"tool_call {index} missing function name")

    raw_id = raw.get("id")
    raw_type = raw.get("type")

    return SFTToolCall(
        name=name,
        arguments=_parse_tool_arguments(arguments),
        call_id=None if raw_id is None else str(raw_id),
        type=None if raw_type is None else str(raw_type),
        raw=dict(raw),
    )
|
|
118
|
+
|
|
119
|
+
|
|
120
|
+
def _coerce_message(raw: Any, *, index: int) -> SFTMessage:
    """Validate one raw chat message and convert it to an SFTMessage.

    Raises SFTDataError when the role is missing/blank, the content has an
    unsupported type, ``tool_calls`` is not a list/tuple, or ``name`` is a
    non-string. Unknown keys are preserved in ``extra``.
    """
    if not isinstance(raw, dict):
        raise SFTDataError(f"message {index} is not an object")

    role = raw.get("role")
    if not isinstance(role, str) or not role.strip():
        raise SFTDataError(f"message {index} has invalid role")

    content = raw.get("content")
    if content is not None and not isinstance(content, str | list | dict):
        raise SFTDataError(f"message {index} has unsupported content type {type(content).__name__}")

    calls: list[SFTToolCall] = []
    raw_calls = raw.get("tool_calls")
    if raw_calls is not None:
        if not isinstance(raw_calls, list | tuple):
            raise SFTDataError(f"message {index} tool_calls must be a list")
        calls = [_coerce_tool_call(item, index=i) for i, item in enumerate(raw_calls)]

    # tool_call_id is coerced to str rather than rejected — IDs often arrive
    # as ints from loosely-typed exporters.
    call_ref = raw.get("tool_call_id")
    if call_ref is not None and not isinstance(call_ref, str):
        call_ref = str(call_ref)

    name = raw.get("name")
    if name is not None and not isinstance(name, str):
        raise SFTDataError(f"message {index} name must be a string if present")

    known_keys = {"role", "content", "tool_calls", "tool_call_id", "name"}
    leftover = {key: value for key, value in raw.items() if key not in known_keys}

    return SFTMessage(
        role=role,
        content=content,
        tool_calls=calls,
        tool_call_id=call_ref,
        name=name,
        extra=leftover,
    )
|
|
161
|
+
|
|
162
|
+
|
|
163
|
+
def coerce_example(raw: Any, *, min_messages: int = 1) -> SFTExample:
    """Validate a decoded JSON record and convert it into an SFTExample.

    Args:
        raw: the decoded JSON object for one training example.
        min_messages: minimum number of chat turns required in ``messages``.

    Raises:
        SFTDataError: on any structural problem (non-object record, missing or
            too-short ``messages``, malformed ``tools``/``metadata``).
    """
    if not isinstance(raw, dict):
        raise SFTDataError("record is not an object")

    messages_raw = raw.get("messages")
    # str/bytes are Sequences too; reject them here so a record like
    # {"messages": "hi"} fails with a clear structural error instead of a
    # confusing per-character "message 0 is not an object" downstream.
    if not isinstance(messages_raw, Sequence) or isinstance(messages_raw, (str, bytes)):
        raise SFTDataError("missing messages[] list")
    if len(messages_raw) < min_messages:
        raise SFTDataError(f"missing messages[] with at least {min_messages} turns")

    messages = [_coerce_message(msg, index=i) for i, msg in enumerate(messages_raw)]

    tools: list[SFTToolDefinition] = []
    if "tools" in raw and raw["tools"] is not None:
        tools_raw = raw["tools"]
        # Same str/bytes guard as for messages above.
        if not isinstance(tools_raw, Sequence) or isinstance(tools_raw, (str, bytes)):
            raise SFTDataError("tools must be provided as a list when present")
        for tool_index, tool in enumerate(tools_raw):
            tools.append(_coerce_tool_definition(tool, index=tool_index))

    # tool_choice is passed through untouched; its shape is provider-specific.
    tool_choice = raw.get("tool_choice")

    metadata_field = raw.get("metadata")
    metadata: dict[str, Any] = {}
    if metadata_field is not None:
        if not isinstance(metadata_field, dict):
            raise SFTDataError("metadata must be an object if present")
        metadata = dict(metadata_field)

    # Preserve unrecognized top-level keys so nothing is lost on round-trip.
    extra = {
        key: value
        for key, value in raw.items()
        if key not in {"messages", "tools", "tool_choice", "metadata"}
    }

    return SFTExample(
        messages=messages,
        tools=tools,
        tool_choice=tool_choice,
        metadata=metadata,
        extra=extra,
    )
|
|
205
|
+
|
|
206
|
+
|
|
207
|
+
def parse_jsonl_line(line: str, *, min_messages: int = 1) -> SFTExample:
    """Decode one JSONL line and validate it as an SFT example.

    Raises json.JSONDecodeError for malformed JSON and SFTDataError for a
    structurally invalid record.
    """
    return coerce_example(json.loads(line), min_messages=min_messages)
|
|
210
|
+
|
|
211
|
+
|
|
212
|
+
def iter_sft_examples(
    source: Iterable[str], *, min_messages: int = 1, skip_empty: bool = True
) -> Iterator[SFTExample]:
    """Lazily parse SFT examples from an iterable of JSONL lines.

    Whitespace-only lines are silently skipped when ``skip_empty`` is true;
    with ``skip_empty=False`` they are handed to the JSON parser as-is.
    """
    for candidate in source:
        if not skip_empty or candidate.strip():
            yield parse_jsonl_line(candidate, min_messages=min_messages)
|
|
219
|
+
|
|
220
|
+
|
|
221
|
+
def collect_sft_jsonl_errors(
    path: Path,
    *,
    min_messages: int = 1,
    max_lines: int | None = None,
    max_errors: int | None = None,
) -> list[str]:
    """Scan a JSONL file and return human-readable validation error strings.

    Args:
        path: JSONL file to read (UTF-8).
        min_messages: minimum message count required per example.
        max_lines: stop after checking this many non-blank lines (None = all).
        max_errors: stop collecting once this many errors are found (None = all).

    Returns:
        One "Line N: ..." string per problem; empty list means the file is valid.
    """
    errors: list[str] = []
    lines_checked = 0

    with path.open("r", encoding="utf-8") as fh:
        # lineno counts physical lines (including blanks) so messages point at
        # the real file line; lines_checked counts only non-blank lines.
        for lineno, raw_line in enumerate(fh, start=1):
            if max_lines is not None and lines_checked >= max_lines:
                break
            stripped = raw_line.strip()
            if not stripped:
                # Blank lines are legal separators, not examples.
                continue
            lines_checked += 1
            try:
                parse_jsonl_line(stripped, min_messages=min_messages)
            except json.JSONDecodeError as exc:
                errors.append(f"Line {lineno}: invalid JSON ({exc.msg})")
            except SFTDataError as exc:
                errors.append(f"Line {lineno}: {exc}")
            if max_errors is not None and len(errors) >= max_errors:
                break
    # An empty (or all-blank) file is itself an error — but respect max_errors;
    # the second clause only matters for a non-positive max_errors cap.
    if lines_checked == 0 and (max_errors is None or len(errors) < max_errors):
        errors.append("File contains no SFT examples")
    return errors
|
|
250
|
+
|
|
251
|
+
|
|
252
|
+
def validate_jsonl_or_raise(
    path: Path,
    *,
    min_messages: int = 1,
    max_lines: int | None = None,
    max_errors: int | None = None,
    error_factory: type[Exception] = ValueError,
) -> None:
    """Validate an SFT JSONL file; raise with a bulleted report on failure.

    Raises FileNotFoundError when *path* does not exist, and an
    ``error_factory`` exception listing every collected issue otherwise.
    Returns None when the file is valid.
    """
    if not path.exists():
        raise FileNotFoundError(str(path))

    issues = collect_sft_jsonl_errors(
        path,
        min_messages=min_messages,
        max_lines=max_lines,
        max_errors=max_errors,
    )
    if not issues:
        return

    hit_cap = max_errors is not None and len(issues) >= max_errors
    suffix = f" (showing first {max_errors} issues)" if hit_cap else ""
    bullet_list = "\n - ".join(issues)
    raise error_factory(f"{path}: Dataset validation failed{suffix}:\n - {bullet_list}")
|
|
274
|
+
|
|
275
|
+
|
|
276
|
+
def load_jsonl(path: Path, *, min_messages: int = 1) -> list[SFTExample]:
    """Eagerly load every SFT example from *path*.

    Raises FileNotFoundError when the file is missing; propagates parse and
    validation errors from iter_sft_examples.
    """
    if not path.exists():
        raise FileNotFoundError(str(path))
    with path.open("r", encoding="utf-8") as handle:
        return list(iter_sft_examples(handle, min_messages=min_messages))
|
|
281
|
+
|
|
282
|
+
|
|
283
|
+
# Public API, alphabetized (classes first by ASCII order, then functions).
# Fix: "coerce_example" sorts before "collect_sft_jsonl_errors".
__all__ = [
    "SFTDataError",
    "SFTExample",
    "SFTMessage",
    "SFTToolCall",
    "SFTToolDefinition",
    "coerce_example",
    "collect_sft_jsonl_errors",
    "iter_sft_examples",
    "load_jsonl",
    "parse_jsonl_line",
    "validate_jsonl_or_raise",
]
|
synth_ai/learning/sse.py
CHANGED
|
@@ -2,7 +2,8 @@ from __future__ import annotations
|
|
|
2
2
|
|
|
3
3
|
import json
|
|
4
4
|
import time
|
|
5
|
-
from
|
|
5
|
+
from collections.abc import Callable
|
|
6
|
+
from contextlib import suppress
|
|
6
7
|
|
|
7
8
|
import aiohttp
|
|
8
9
|
|
|
@@ -18,7 +19,7 @@ async def stream_events(
|
|
|
18
19
|
job_id: str,
|
|
19
20
|
*,
|
|
20
21
|
seconds: int = 60,
|
|
21
|
-
on_event:
|
|
22
|
+
on_event: Callable[[dict], None] | None = None,
|
|
22
23
|
) -> None:
|
|
23
24
|
if seconds <= 0:
|
|
24
25
|
return
|
|
@@ -29,28 +30,28 @@ async def stream_events(
|
|
|
29
30
|
]
|
|
30
31
|
for url in candidates:
|
|
31
32
|
try:
|
|
32
|
-
async with
|
|
33
|
-
|
|
34
|
-
|
|
33
|
+
async with (
|
|
34
|
+
aiohttp.ClientSession(timeout=aiohttp.ClientTimeout(total=None)) as session,
|
|
35
|
+
session.get(url, headers=headers) as resp,
|
|
36
|
+
):
|
|
37
|
+
if resp.status != 200:
|
|
38
|
+
continue
|
|
39
|
+
start_t = time.time()
|
|
40
|
+
async for raw in resp.content:
|
|
41
|
+
line = raw.decode(errors="ignore").strip()
|
|
42
|
+
if not line or line.startswith(":"):
|
|
35
43
|
continue
|
|
36
|
-
|
|
37
|
-
|
|
38
|
-
|
|
39
|
-
|
|
40
|
-
|
|
41
|
-
|
|
42
|
-
|
|
43
|
-
|
|
44
|
-
|
|
45
|
-
obj
|
|
46
|
-
|
|
47
|
-
|
|
48
|
-
if on_event:
|
|
49
|
-
try:
|
|
50
|
-
on_event(obj)
|
|
51
|
-
except Exception:
|
|
52
|
-
pass
|
|
53
|
-
if (time.time() - start_t) >= seconds:
|
|
54
|
-
return
|
|
44
|
+
if not line.startswith("data:"):
|
|
45
|
+
continue
|
|
46
|
+
data = line[5:].strip()
|
|
47
|
+
try:
|
|
48
|
+
obj = json.loads(data)
|
|
49
|
+
except Exception:
|
|
50
|
+
continue
|
|
51
|
+
if on_event:
|
|
52
|
+
with suppress(Exception):
|
|
53
|
+
on_event(obj)
|
|
54
|
+
if (time.time() - start_t) >= seconds:
|
|
55
|
+
return
|
|
55
56
|
except Exception:
|
|
56
57
|
continue
|