synth-ai 0.2.9.dev7__py3-none-any.whl → 0.2.10__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of synth-ai might be problematic. Click here for more details.
- examples/__init__.py +16 -0
- examples/crafter_debug_render.py +8 -11
- examples/dev/qwen3_32b_qlora_4xh100.toml +40 -0
- examples/multi_step/crafter_rl_lora.md +29 -0
- examples/qwen_coder/README.md +102 -0
- examples/qwen_coder/_shared.py +113 -0
- examples/qwen_coder/configs/coder_lora_30b.toml +61 -0
- examples/qwen_coder/configs/coder_lora_4b.toml +57 -0
- examples/qwen_coder/configs/coder_lora_small.toml +58 -0
- examples/qwen_coder/generate_dataset.py +98 -0
- examples/qwen_coder/infer_ft_smoke.py +65 -0
- examples/qwen_coder/infer_prod_proxy.py +73 -0
- examples/qwen_coder/infer_via_synth.py +87 -0
- examples/qwen_coder/scripts/infer_coder.sh +19 -0
- examples/qwen_coder/scripts/train_coder_30b.sh +22 -0
- examples/qwen_coder/sft_full_17b.py +103 -0
- examples/qwen_coder/sft_lora_30b.py +110 -0
- examples/qwen_coder/subset_jsonl.py +39 -0
- examples/qwen_coder/todos.md +38 -0
- examples/qwen_coder/validate_jsonl.py +60 -0
- examples/rl/run_eval.py +36 -37
- examples/rl/run_rl_and_save.py +5 -5
- examples/rl/task_app/math_single_step.py +65 -43
- examples/rl/task_app/math_task_app.py +3 -3
- examples/sft/README.md +139 -0
- examples/sft/configs/crafter_fft_qwen0p6b.toml +44 -0
- examples/sft/configs/crafter_lora_qwen0p6b.toml +45 -0
- examples/sft/evaluate.py +117 -0
- examples/sft/export_dataset.py +117 -0
- examples/sft/generate_traces.py +162 -0
- examples/swe/__init__.py +12 -0
- examples/swe/task_app/README.md +105 -0
- examples/swe/task_app/__init__.py +2 -0
- examples/swe/task_app/grpo_swe_mini.py +571 -0
- examples/swe/task_app/grpo_swe_mini_task_app.py +136 -0
- examples/swe/task_app/hosted/README.md +173 -0
- examples/swe/task_app/hosted/__init__.py +5 -0
- examples/swe/task_app/hosted/branching.py +143 -0
- examples/swe/task_app/hosted/environment_routes.py +1289 -0
- examples/swe/task_app/hosted/envs/__init__.py +1 -0
- examples/swe/task_app/hosted/envs/crafter/__init__.py +6 -0
- examples/swe/task_app/hosted/envs/crafter/app.py +1 -0
- examples/swe/task_app/hosted/envs/crafter/environment.py +522 -0
- examples/swe/task_app/hosted/envs/crafter/policy.py +478 -0
- examples/swe/task_app/hosted/envs/crafter/react_agent.py +108 -0
- examples/swe/task_app/hosted/envs/crafter/shared.py +305 -0
- examples/swe/task_app/hosted/envs/crafter/tools.py +47 -0
- examples/swe/task_app/hosted/envs/mini_swe/__init__.py +8 -0
- examples/swe/task_app/hosted/envs/mini_swe/environment.py +1164 -0
- examples/swe/task_app/hosted/envs/mini_swe/policy.py +355 -0
- examples/swe/task_app/hosted/envs/mini_swe/shared.py +83 -0
- examples/swe/task_app/hosted/envs/mini_swe/tools.py +96 -0
- examples/swe/task_app/hosted/hosted_app.py +204 -0
- examples/swe/task_app/hosted/inference/__init__.py +5 -0
- examples/swe/task_app/hosted/inference/openai_client.py +618 -0
- examples/swe/task_app/hosted/main.py +100 -0
- examples/swe/task_app/hosted/policy_routes.py +1079 -0
- examples/swe/task_app/hosted/registry.py +195 -0
- examples/swe/task_app/hosted/rollout.py +1869 -0
- examples/swe/task_app/hosted/storage/__init__.py +5 -0
- examples/swe/task_app/hosted/storage/volume.py +211 -0
- examples/swe/task_app/hosted/test_agents.py +161 -0
- examples/swe/task_app/hosted/test_service.py +137 -0
- examples/swe/task_app/hosted/utils.py +62 -0
- examples/vlm/PROPOSAL.md +53 -0
- examples/vlm/README.md +68 -0
- examples/vlm/configs/crafter_vlm_gpt4o.toml +44 -0
- examples/vlm/crafter_image_only_agent.py +207 -0
- examples/vlm/crafter_openai_vlm_agent.py +277 -0
- examples/vlm/filter_image_rows.py +63 -0
- examples/vlm/run_crafter_vlm_benchmark.py +316 -0
- examples/warming_up_to_rl/analyze_trace_db.py +5 -5
- examples/warming_up_to_rl/configs/rl_from_base_qwen4b.toml +11 -1
- examples/warming_up_to_rl/export_trace_sft.py +78 -21
- examples/warming_up_to_rl/groq_test.py +4 -4
- examples/warming_up_to_rl/manage_secrets.py +13 -18
- examples/warming_up_to_rl/run_eval.py +42 -44
- examples/warming_up_to_rl/run_fft_and_save.py +11 -16
- examples/warming_up_to_rl/run_local_rollout.py +1 -3
- examples/warming_up_to_rl/run_local_rollout_modal.py +2 -4
- examples/warming_up_to_rl/run_local_rollout_parallel.py +1 -4
- examples/warming_up_to_rl/run_local_rollout_traced.py +3 -5
- examples/warming_up_to_rl/run_rl_and_save.py +5 -6
- examples/warming_up_to_rl/run_rollout_remote.py +8 -10
- examples/warming_up_to_rl/task_app/README.md +6 -2
- examples/warming_up_to_rl/task_app/grpo_crafter.py +234 -35
- examples/warming_up_to_rl/task_app/grpo_crafter_task_app.py +2 -3
- examples/warming_up_to_rl/task_app/synth_envs_hosted/__init__.py +1 -1
- examples/warming_up_to_rl/task_app/synth_envs_hosted/branching.py +9 -11
- examples/warming_up_to_rl/task_app/synth_envs_hosted/environment_routes.py +131 -114
- examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/environment.py +101 -41
- examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/policy.py +73 -51
- examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/react_agent.py +14 -6
- examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/shared.py +16 -16
- examples/warming_up_to_rl/task_app/synth_envs_hosted/hosted_app.py +32 -34
- examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/openai_client.py +94 -31
- examples/warming_up_to_rl/task_app/synth_envs_hosted/main.py +0 -2
- examples/warming_up_to_rl/task_app/synth_envs_hosted/policy_routes.py +303 -203
- examples/warming_up_to_rl/task_app/synth_envs_hosted/registry.py +21 -23
- examples/warming_up_to_rl/task_app/synth_envs_hosted/rollout.py +328 -225
- examples/warming_up_to_rl/task_app/synth_envs_hosted/storage/volume.py +13 -13
- examples/warming_up_to_rl/task_app/synth_envs_hosted/test_agents.py +1 -0
- examples/warming_up_to_rl/task_app/synth_envs_hosted/test_service.py +1 -0
- examples/warming_up_to_rl/task_app/synth_envs_hosted/utils.py +4 -3
- synth_ai/api/models/supported.py +376 -0
- synth_ai/api/train/builders.py +128 -21
- synth_ai/api/train/cli.py +80 -64
- synth_ai/api/train/config_finder.py +7 -2
- synth_ai/api/train/env_resolver.py +1 -1
- synth_ai/api/train/pollers.py +2 -1
- synth_ai/api/train/supported_algos.py +139 -0
- synth_ai/api/train/task_app.py +1 -2
- synth_ai/api/train/utils.py +13 -44
- synth_ai/cli/__init__.py +8 -0
- synth_ai/cli/_modal_wrapper.py +28 -0
- synth_ai/cli/_typer_patch.py +49 -0
- synth_ai/cli/balance.py +1 -2
- synth_ai/cli/calc.py +1 -1
- synth_ai/cli/demo.py +2 -1
- synth_ai/cli/recent.py +2 -2
- synth_ai/cli/rl_demo.py +2 -1
- synth_ai/cli/root.py +11 -13
- synth_ai/cli/status.py +2 -2
- synth_ai/cli/task_apps.py +529 -179
- synth_ai/cli/traces.py +6 -4
- synth_ai/cli/watch.py +12 -18
- synth_ai/demo_registry.py +1 -1
- synth_ai/demos/core/cli.py +36 -43
- synth_ai/demos/demo_task_apps/__init__.py +3 -3
- synth_ai/demos/demo_task_apps/core.py +17 -25
- synth_ai/demos/demo_task_apps/crafter/grpo_crafter_task_app.py +3 -4
- synth_ai/demos/demo_task_apps/math/app.py +2 -1
- synth_ai/demos/demo_task_apps/math/deploy_modal.py +3 -4
- synth_ai/demos/demo_task_apps/math/modal_task_app.py +16 -18
- synth_ai/demos/demo_task_apps/math/task_app_entry.py +0 -1
- synth_ai/environments/examples/crafter_classic/environment.py +76 -1
- synth_ai/environments/reproducibility/tree.py +2 -5
- synth_ai/environments/service/app.py +11 -12
- synth_ai/environments/service/core_routes.py +4 -7
- synth_ai/environments/stateful/engine.py +1 -1
- synth_ai/environments/tasks/core.py +1 -0
- synth_ai/environments/tasks/filters.py +5 -6
- synth_ai/environments/tasks/utils.py +4 -5
- synth_ai/handshake.py +9 -9
- synth_ai/http.py +1 -1
- synth_ai/http_client.py +18 -10
- synth_ai/inference/client.py +15 -5
- synth_ai/jobs/client.py +78 -83
- synth_ai/learning/__init__.py +41 -6
- synth_ai/learning/algorithms.py +14 -0
- synth_ai/learning/client.py +91 -24
- synth_ai/learning/config.py +2 -38
- synth_ai/learning/ft_client.py +4 -59
- synth_ai/learning/health.py +5 -6
- synth_ai/learning/jobs.py +31 -47
- synth_ai/{rl → learning/rl}/__init__.py +14 -4
- synth_ai/learning/rl/client.py +267 -0
- synth_ai/learning/rl/config.py +31 -0
- synth_ai/{rl → learning/rl}/contracts.py +5 -8
- synth_ai/{rl → learning/rl}/env_keys.py +39 -15
- synth_ai/learning/rl/secrets.py +13 -0
- synth_ai/learning/rl_client.py +2 -281
- synth_ai/learning/sft/__init__.py +29 -0
- synth_ai/learning/sft/client.py +68 -0
- synth_ai/learning/sft/config.py +270 -0
- synth_ai/learning/sft/data.py +295 -0
- synth_ai/learning/sse.py +25 -24
- synth_ai/learning/validators.py +25 -28
- synth_ai/lm/__init__.py +21 -47
- synth_ai/task/__init__.py +25 -27
- synth_ai/task/apps/__init__.py +7 -8
- synth_ai/task/auth.py +8 -8
- synth_ai/task/client.py +14 -14
- synth_ai/task/contracts.py +36 -35
- synth_ai/task/datasets.py +6 -5
- synth_ai/task/errors.py +10 -10
- synth_ai/task/health.py +17 -9
- synth_ai/task/json.py +58 -23
- synth_ai/task/proxy.py +13 -9
- synth_ai/task/rubrics.py +16 -15
- synth_ai/task/server.py +12 -12
- synth_ai/task/tracing_utils.py +4 -4
- synth_ai/task/vendors.py +5 -6
- synth_ai/tracing_v3/__init__.py +2 -0
- synth_ai/tracing_v3/abstractions.py +21 -4
- synth_ai/tracing_v3/decorators.py +18 -16
- synth_ai/tracing_v3/hooks.py +5 -5
- synth_ai/tracing_v3/llm_call_record_helpers.py +6 -6
- synth_ai/tracing_v3/session_tracer.py +40 -14
- synth_ai/tracing_v3/storage/base.py +85 -0
- synth_ai/tracing_v3/storage/config.py +21 -8
- synth_ai/tracing_v3/storage/factory.py +10 -7
- synth_ai/tracing_v3/storage/utils.py +4 -2
- synth_ai/tracing_v3/turso/daemon.py +7 -2
- synth_ai/tracing_v3/turso/models.py +2 -2
- synth_ai/tracing_v3/turso/native_manager.py +1173 -0
- synth_ai/tracing_v3/utils.py +4 -4
- synth_ai/v0/api/__init__.py +8 -0
- synth_ai/v0/api/models/__init__.py +8 -0
- synth_ai/v0/api/models/supported.py +8 -0
- synth_ai/v0/config/__init__.py +15 -0
- synth_ai/v0/config/base_url.py +12 -0
- synth_ai/v0/lm/__init__.py +51 -0
- synth_ai/{lm → v0/lm}/caching/ephemeral.py +2 -2
- synth_ai/{lm → v0/lm}/caching/handler.py +4 -4
- synth_ai/{lm → v0/lm}/caching/initialize.py +1 -1
- synth_ai/{lm → v0/lm}/caching/persistent.py +1 -1
- synth_ai/{lm → v0/lm}/config.py +6 -1
- synth_ai/{lm → v0/lm}/core/all.py +9 -9
- synth_ai/{lm → v0/lm}/core/main.py +6 -6
- synth_ai/{lm → v0/lm}/core/main_v3.py +10 -10
- synth_ai/{lm → v0/lm}/core/synth_models.py +2 -14
- synth_ai/{lm → v0/lm}/core/vendor_clients.py +2 -2
- synth_ai/{lm → v0/lm}/overrides.py +2 -2
- synth_ai/{lm → v0/lm}/provider_support/anthropic.py +4 -4
- synth_ai/{lm → v0/lm}/provider_support/openai.py +5 -5
- synth_ai/{lm → v0/lm}/structured_outputs/handler.py +5 -5
- synth_ai/{lm → v0/lm}/structured_outputs/rehabilitate.py +1 -1
- synth_ai/{lm → v0/lm}/vendors/core/anthropic_api.py +9 -9
- synth_ai/{lm → v0/lm}/vendors/core/gemini_api.py +5 -5
- synth_ai/{lm → v0/lm}/vendors/core/mistral_api.py +5 -5
- synth_ai/{lm → v0/lm}/vendors/core/openai_api.py +10 -10
- synth_ai/{lm → v0/lm}/vendors/openai_standard.py +8 -8
- synth_ai/{lm → v0/lm}/vendors/openai_standard_responses.py +2 -2
- synth_ai/{lm → v0/lm}/vendors/supported/custom_endpoint.py +3 -3
- synth_ai/{lm → v0/lm}/vendors/supported/deepseek.py +2 -2
- synth_ai/{lm → v0/lm}/vendors/supported/grok.py +2 -2
- synth_ai/{lm → v0/lm}/vendors/supported/groq.py +1 -1
- synth_ai/{lm → v0/lm}/vendors/supported/ollama.py +1 -1
- synth_ai/{lm → v0/lm}/vendors/supported/openrouter.py +3 -3
- synth_ai/{lm → v0/lm}/vendors/supported/together.py +1 -1
- synth_ai/{lm → v0/lm}/vendors/synth_client.py +1 -1
- synth_ai/v0/tracing_v3/__init__.py +10 -0
- synth_ai/v0/tracing_v3/abstractions.py +3 -0
- synth_ai/v0/tracing_v3/decorators.py +3 -0
- synth_ai/v0/tracing_v3/llm_call_record_helpers.py +3 -0
- synth_ai/v0/tracing_v3/session_tracer.py +3 -0
- {synth_ai-0.2.9.dev7.dist-info → synth_ai-0.2.10.dist-info}/METADATA +10 -7
- {synth_ai-0.2.9.dev7.dist-info → synth_ai-0.2.10.dist-info}/RECORD +269 -233
- examples/common_old/backend.py +0 -20
- examples/evals_old/README.md +0 -98
- examples/evals_old/__init__.py +0 -6
- examples/evals_old/compare_models.py +0 -1038
- examples/evals_old/example_log.md +0 -145
- examples/evals_old/run_demo.sh +0 -126
- examples/evals_old/trace_analysis.py +0 -270
- examples/finetuning_old/_backup_synth_qwen/config.toml +0 -29
- examples/finetuning_old/_backup_synth_qwen/example_log.md +0 -324
- examples/finetuning_old/_backup_synth_qwen/filter_traces.py +0 -60
- examples/finetuning_old/_backup_synth_qwen/filter_traces_achievements.py +0 -243
- examples/finetuning_old/_backup_synth_qwen/purge_v3_traces.py +0 -109
- examples/finetuning_old/_backup_synth_qwen/react_agent_lm.py +0 -1924
- examples/finetuning_old/_backup_synth_qwen/readme.md +0 -49
- examples/finetuning_old/_backup_synth_qwen/run_crafter_qwen4b.py +0 -114
- examples/finetuning_old/_backup_synth_qwen/run_demo.sh +0 -195
- examples/finetuning_old/_backup_synth_qwen/sft_kickoff.py +0 -119
- examples/finetuning_old/synth_qwen_v1/README.md +0 -68
- examples/finetuning_old/synth_qwen_v1/filter_traces.py +0 -60
- examples/finetuning_old/synth_qwen_v1/filter_traces_achievements.py +0 -243
- examples/finetuning_old/synth_qwen_v1/finetune.py +0 -46
- examples/finetuning_old/synth_qwen_v1/hello_ft_model.py +0 -71
- examples/finetuning_old/synth_qwen_v1/infer.py +0 -36
- examples/finetuning_old/synth_qwen_v1/poll.py +0 -46
- examples/finetuning_old/synth_qwen_v1/prepare_data.py +0 -35
- examples/finetuning_old/synth_qwen_v1/purge_v3_traces.py +0 -109
- examples/finetuning_old/synth_qwen_v1/react_agent_lm.py +0 -1933
- examples/finetuning_old/synth_qwen_v1/run_crafter_sft_job.py +0 -210
- examples/finetuning_old/synth_qwen_v1/run_ft_job.py +0 -237
- examples/finetuning_old/synth_qwen_v1/upload_data.py +0 -34
- examples/finetuning_old/synth_qwen_v1/util.py +0 -152
- examples/rl_old/task_app.py +0 -1131
- synth_ai/experimental/synth_oss.py +0 -445
- synth_ai/learning/filtering.py +0 -0
- synth_ai/learning/offline/dpo.py +0 -0
- synth_ai/learning/offline/providers.py +0 -7
- synth_ai/learning/offline/sft.py +0 -0
- synth_ai/learning/offline/shared.py +0 -0
- synth_ai/learning/online/grpo.py +0 -0
- synth_ai/learning/online/irft.py +0 -0
- synth_ai/learning/prompts/banking77_injection_eval.py +0 -168
- synth_ai/learning/prompts/gepa.py +0 -0
- synth_ai/learning/prompts/hello_world_in_context_injection_ex.py +0 -211
- synth_ai/learning/prompts/mipro.py +0 -289
- synth_ai/learning/prompts/random_search.py +0 -249
- synth_ai/learning/prompts/run_mipro_banking77.py +0 -172
- synth_ai/learning/prompts/run_random_search_banking77.py +0 -329
- synth_ai/rl/secrets.py +0 -19
- synth_ai/scripts/verify_rewards.py +0 -100
- synth_ai/tracing/__init__.py +0 -30
- synth_ai/tracing_v1/__init__.py +0 -33
- synth_ai/tracing_v3/turso/__init__.py +0 -25
- synth_ai/tracing_v3/turso/manager.py +0 -838
- synth_ai/zyk/__init__.py +0 -30
- /synth_ai/{lm → v0/lm}/caching/__init__.py +0 -0
- /synth_ai/{lm → v0/lm}/caching/constants.py +0 -0
- /synth_ai/{lm → v0/lm}/caching/dbs.py +0 -0
- /synth_ai/{lm → v0/lm}/constants.py +0 -0
- /synth_ai/{lm → v0/lm}/core/__init__.py +0 -0
- /synth_ai/{lm → v0/lm}/core/exceptions.py +0 -0
- /synth_ai/{lm → v0/lm}/cost/__init__.py +0 -0
- /synth_ai/{lm → v0/lm}/cost/monitor.py +0 -0
- /synth_ai/{lm → v0/lm}/cost/statefulness.py +0 -0
- /synth_ai/{lm → v0/lm}/injection.py +0 -0
- /synth_ai/{lm → v0/lm}/provider_support/__init__.py +0 -0
- /synth_ai/{lm → v0/lm}/provider_support/suppress_logging.py +0 -0
- /synth_ai/{lm → v0/lm}/structured_outputs/__init__.py +0 -0
- /synth_ai/{lm → v0/lm}/structured_outputs/inject.py +0 -0
- /synth_ai/{lm → v0/lm}/tools/__init__.py +0 -0
- /synth_ai/{lm → v0/lm}/tools/base.py +0 -0
- /synth_ai/{lm → v0/lm}/unified_interface.py +0 -0
- /synth_ai/{lm → v0/lm}/vendors/__init__.py +0 -0
- /synth_ai/{lm → v0/lm}/vendors/base.py +0 -0
- /synth_ai/{lm → v0/lm}/vendors/core/__init__.py +0 -0
- /synth_ai/{lm → v0/lm}/vendors/core/synth_dev_api.py +0 -0
- /synth_ai/{lm → v0/lm}/vendors/local/__init__.py +0 -0
- /synth_ai/{lm → v0/lm}/vendors/local/ollama.py +0 -0
- /synth_ai/{lm → v0/lm}/vendors/retries.py +0 -0
- /synth_ai/{lm → v0/lm}/vendors/supported/__init__.py +0 -0
- /synth_ai/{lm → v0/lm}/warmup.py +0 -0
- {synth_ai-0.2.9.dev7.dist-info → synth_ai-0.2.10.dist-info}/WHEEL +0 -0
- {synth_ai-0.2.9.dev7.dist-info → synth_ai-0.2.10.dist-info}/entry_points.txt +0 -0
- {synth_ai-0.2.9.dev7.dist-info → synth_ai-0.2.10.dist-info}/licenses/LICENSE +0 -0
- {synth_ai-0.2.9.dev7.dist-info → synth_ai-0.2.10.dist-info}/top_level.txt +0 -0
|
@@ -1,12 +1,12 @@
|
|
|
1
|
-
from __future__ import annotations
|
|
2
|
-
|
|
3
1
|
"""Helpers for uploading RL environment credentials to the backend."""
|
|
4
2
|
|
|
3
|
+
from __future__ import annotations
|
|
4
|
+
|
|
5
5
|
import base64
|
|
6
6
|
import binascii
|
|
7
7
|
import json
|
|
8
|
-
from typing import Any, Dict
|
|
9
8
|
import os
|
|
9
|
+
from typing import Any
|
|
10
10
|
|
|
11
11
|
import requests
|
|
12
12
|
from nacl.public import PublicKey, SealedBox
|
|
@@ -18,14 +18,12 @@ _ALGORITHM = "libsodium.sealedbox.v1"
|
|
|
18
18
|
|
|
19
19
|
|
|
20
20
|
def encrypt_for_backend(pubkey_b64: str, secret: str | bytes) -> str:
|
|
21
|
-
"""Encrypt ``secret`` for storage by the backend using libsodium sealed boxes."""
|
|
22
|
-
|
|
23
21
|
if not isinstance(pubkey_b64, str) or not pubkey_b64.strip():
|
|
24
22
|
raise ValueError("public key must be a non-empty base64 string")
|
|
25
23
|
|
|
26
24
|
try:
|
|
27
25
|
key_bytes = base64.b64decode(pubkey_b64, validate=True)
|
|
28
|
-
except binascii.Error as exc:
|
|
26
|
+
except binascii.Error as exc:
|
|
29
27
|
raise ValueError("public key must be base64-encoded") from exc
|
|
30
28
|
|
|
31
29
|
if len(key_bytes) != 32:
|
|
@@ -35,7 +33,7 @@ def encrypt_for_backend(pubkey_b64: str, secret: str | bytes) -> str:
|
|
|
35
33
|
secret_bytes = secret.encode("utf-8")
|
|
36
34
|
elif isinstance(secret, bytes):
|
|
37
35
|
secret_bytes = secret
|
|
38
|
-
else:
|
|
36
|
+
else:
|
|
39
37
|
raise TypeError("secret must be str or bytes")
|
|
40
38
|
|
|
41
39
|
if not secret_bytes:
|
|
@@ -52,20 +50,17 @@ def setup_environment_api_key(
|
|
|
52
50
|
token: str | None = None,
|
|
53
51
|
*,
|
|
54
52
|
timeout: float = 15.0,
|
|
55
|
-
) ->
|
|
56
|
-
"""Upload an ENVIRONMENT_API_KEY to the backend."""
|
|
57
|
-
|
|
53
|
+
) -> dict[str, Any]:
|
|
58
54
|
backend = backend_base.rstrip("/")
|
|
59
55
|
if not backend:
|
|
60
56
|
raise ValueError("backend_base must be provided")
|
|
61
57
|
if not synth_api_key:
|
|
62
58
|
raise ValueError("synth_api_key must be provided")
|
|
63
59
|
|
|
64
|
-
# Require caller-provided plaintext. If not provided, read from ENVIRONMENT_API_KEY.
|
|
65
60
|
plaintext = token if token is not None else os.getenv("ENVIRONMENT_API_KEY", "").strip()
|
|
66
61
|
if not plaintext:
|
|
67
62
|
raise ValueError("ENVIRONMENT_API_KEY must be set (or pass token=...) to upload")
|
|
68
|
-
if not isinstance(plaintext, str):
|
|
63
|
+
if not isinstance(plaintext, str):
|
|
69
64
|
raise TypeError("token must be a string")
|
|
70
65
|
|
|
71
66
|
token_bytes = plaintext.encode("utf-8")
|
|
@@ -81,7 +76,7 @@ def setup_environment_api_key(
|
|
|
81
76
|
|
|
82
77
|
try:
|
|
83
78
|
doc = response.json()
|
|
84
|
-
except ValueError as exc:
|
|
79
|
+
except ValueError as exc:
|
|
85
80
|
raise RuntimeError("backend returned invalid JSON for public key") from exc
|
|
86
81
|
|
|
87
82
|
if not isinstance(doc, dict):
|
|
@@ -91,16 +86,45 @@ def setup_environment_api_key(
|
|
|
91
86
|
if not isinstance(pubkey, str) or not pubkey:
|
|
92
87
|
raise RuntimeError("backend response missing public_key")
|
|
93
88
|
|
|
94
|
-
# The backend currently returns a single algorithm identifier; keep a guard in
|
|
95
|
-
# case future versions change the value and we need to surface that to callers.
|
|
96
89
|
alg = doc.get("alg")
|
|
97
90
|
if alg is not None and alg != _ALGORITHM:
|
|
98
91
|
raise RuntimeError(f"unsupported sealed box algorithm: {alg}")
|
|
99
92
|
|
|
93
|
+
# Diagnostics: safe previews and hashes to correlate with backend logs
|
|
94
|
+
try:
|
|
95
|
+
import hashlib as _hash
|
|
96
|
+
|
|
97
|
+
pk_bytes = base64.b64decode(pubkey, validate=True)
|
|
98
|
+
pk_sha256 = _hash.sha256(pk_bytes).hexdigest()
|
|
99
|
+
print(
|
|
100
|
+
f"[env-keys] public_key: b64_len={len(pubkey)} sha256={pk_sha256} head={pubkey[:16]} tail={pubkey[-16:]}"
|
|
101
|
+
)
|
|
102
|
+
_plen = len(plaintext)
|
|
103
|
+
_ppref = (plaintext[:6] + "…") if _plen > 10 else plaintext
|
|
104
|
+
_psuf = ("…" + plaintext[-4:]) if _plen > 10 else ""
|
|
105
|
+
_has_ws = any(ch.isspace() for ch in plaintext)
|
|
106
|
+
print(
|
|
107
|
+
f"[env-keys] plaintext: len={_plen} preview={_ppref}{_psuf} has_ws={bool(_has_ws)}"
|
|
108
|
+
)
|
|
109
|
+
except Exception:
|
|
110
|
+
pass
|
|
111
|
+
|
|
100
112
|
ciphertext_b64 = encrypt_for_backend(pubkey, token_bytes)
|
|
101
113
|
|
|
102
114
|
body = {"name": "ENVIRONMENT_API_KEY", "ciphertext_b64": ciphertext_b64}
|
|
103
115
|
post_url = f"{backend}/api/v1/env-keys"
|
|
116
|
+
# Ciphertext diagnostics
|
|
117
|
+
try:
|
|
118
|
+
import hashlib as _hash
|
|
119
|
+
|
|
120
|
+
_ct_bytes = base64.b64decode(ciphertext_b64, validate=True)
|
|
121
|
+
_ct_sha = _hash.sha256(_ct_bytes).hexdigest()
|
|
122
|
+
print(
|
|
123
|
+
f"[env-keys] ciphertext: b64_len={len(ciphertext_b64)} sha256={_ct_sha} head={ciphertext_b64[:16]} tail={ciphertext_b64[-16:]}"
|
|
124
|
+
)
|
|
125
|
+
except Exception:
|
|
126
|
+
pass
|
|
127
|
+
|
|
104
128
|
response2 = requests.post(
|
|
105
129
|
post_url,
|
|
106
130
|
headers={**headers, "Content-Type": "application/json"},
|
|
@@ -0,0 +1,13 @@
|
|
|
1
|
+
"""Helpers for generating RL environment credentials."""
|
|
2
|
+
|
|
3
|
+
from __future__ import annotations
|
|
4
|
+
|
|
5
|
+
import secrets
|
|
6
|
+
|
|
7
|
+
__all__ = ["mint_environment_api_key"]
|
|
8
|
+
|
|
9
|
+
|
|
10
|
+
def mint_environment_api_key() -> str:
|
|
11
|
+
"""Mint a random ENVIRONMENT_API_KEY value."""
|
|
12
|
+
|
|
13
|
+
return secrets.token_hex(32)
|
synth_ai/learning/rl_client.py
CHANGED
|
@@ -1,284 +1,5 @@
|
|
|
1
1
|
from __future__ import annotations
|
|
2
2
|
|
|
3
|
-
from
|
|
4
|
-
import os
|
|
5
|
-
import time
|
|
3
|
+
from .rl.client import RlClient
|
|
6
4
|
|
|
7
|
-
|
|
8
|
-
|
|
9
|
-
|
|
10
|
-
def _api_base(b: str) -> str:
|
|
11
|
-
b = (b or "").rstrip("/")
|
|
12
|
-
return b if b.endswith("/api") else f"{b}/api"
|
|
13
|
-
|
|
14
|
-
|
|
15
|
-
class RlClient:
|
|
16
|
-
"""Lightweight RL client for provider-agnostic job control.
|
|
17
|
-
|
|
18
|
-
Notes:
|
|
19
|
-
- Uses learning/* for status/events/metrics and rl/* for creation/start.
|
|
20
|
-
- Trainer endpoints are resolved server-side via trainer_id.
|
|
21
|
-
"""
|
|
22
|
-
|
|
23
|
-
def __init__(self, base_url: str, api_key: str, *, timeout: float = 600.0) -> None:
|
|
24
|
-
self._base_url = base_url.rstrip("/")
|
|
25
|
-
self._api_key = api_key
|
|
26
|
-
self._timeout = timeout
|
|
27
|
-
|
|
28
|
-
async def resolve_trainer_start_url(self, trainer_id: str) -> str:
|
|
29
|
-
"""GET /api/rl/services/{id} → { training_start_url }"""
|
|
30
|
-
path = f"/api/rl/services/{trainer_id}"
|
|
31
|
-
async with AsyncHttpClient(self._base_url, self._api_key, timeout=30.0) as http:
|
|
32
|
-
js = await http.get(path)
|
|
33
|
-
if not isinstance(js, dict):
|
|
34
|
-
raise HTTPError(
|
|
35
|
-
status=500, url=path, message="invalid_service_response", body_snippet=str(js)[:200]
|
|
36
|
-
)
|
|
37
|
-
start_url = js.get("training_start_url")
|
|
38
|
-
if not isinstance(start_url, str) or not start_url:
|
|
39
|
-
raise HTTPError(
|
|
40
|
-
status=500,
|
|
41
|
-
url=path,
|
|
42
|
-
message="missing_training_start_url",
|
|
43
|
-
body_snippet=str(js)[:200],
|
|
44
|
-
)
|
|
45
|
-
return start_url
|
|
46
|
-
|
|
47
|
-
async def create_job(
|
|
48
|
-
self,
|
|
49
|
-
*,
|
|
50
|
-
model: str,
|
|
51
|
-
task_app_url: str,
|
|
52
|
-
trainer: Dict[str, Any],
|
|
53
|
-
trainer_id: Optional[str] = None,
|
|
54
|
-
job_config_id: Optional[str] = None,
|
|
55
|
-
inline_config: Optional[Dict[str, Any]] = None,
|
|
56
|
-
) -> Dict[str, Any]:
|
|
57
|
-
body = {
|
|
58
|
-
"job_type": "rl",
|
|
59
|
-
"data": {
|
|
60
|
-
"model": model,
|
|
61
|
-
"endpoint_base_url": task_app_url,
|
|
62
|
-
**({"job_config_id": job_config_id} if job_config_id else {}),
|
|
63
|
-
**({"config": inline_config} if inline_config else {}),
|
|
64
|
-
"trainer": {
|
|
65
|
-
"batch_size": int(trainer.get("batch_size", 1)),
|
|
66
|
-
"group_size": max(2, int(trainer.get("group_size", 2))),
|
|
67
|
-
},
|
|
68
|
-
},
|
|
69
|
-
}
|
|
70
|
-
async with AsyncHttpClient(self._base_url, self._api_key, timeout=self._timeout) as http:
|
|
71
|
-
js = await http.post_json(f"{_api_base(self._base_url)}/rl/jobs", json=body)
|
|
72
|
-
if not isinstance(js, dict):
|
|
73
|
-
raise HTTPError(
|
|
74
|
-
status=500,
|
|
75
|
-
url="/api/rl/jobs",
|
|
76
|
-
message="invalid_create_response",
|
|
77
|
-
body_snippet=str(js)[:200],
|
|
78
|
-
)
|
|
79
|
-
return js
|
|
80
|
-
|
|
81
|
-
async def start_job_if_supported(self, job_id: str) -> Optional[Dict[str, Any]]:
|
|
82
|
-
path = f"{_api_base(self._base_url)}/rl/jobs/{job_id}/start"
|
|
83
|
-
try:
|
|
84
|
-
async with AsyncHttpClient(self._base_url, self._api_key, timeout=30.0) as http:
|
|
85
|
-
return await http.post_json(path, json={})
|
|
86
|
-
except HTTPError as he: # noqa: PERF203
|
|
87
|
-
if he.status == 404:
|
|
88
|
-
return None
|
|
89
|
-
raise
|
|
90
|
-
|
|
91
|
-
async def get_job(self, job_id: str) -> Dict[str, Any]:
|
|
92
|
-
async with AsyncHttpClient(self._base_url, self._api_key, timeout=30.0) as http:
|
|
93
|
-
return await http.get(f"{_api_base(self._base_url)}/learning/jobs/{job_id}")
|
|
94
|
-
|
|
95
|
-
async def get_events(
|
|
96
|
-
self, job_id: str, *, since_seq: int = 0, limit: int = 200
|
|
97
|
-
) -> List[Dict[str, Any]]:
|
|
98
|
-
params = {"since_seq": since_seq, "limit": limit}
|
|
99
|
-
async with AsyncHttpClient(self._base_url, self._api_key, timeout=30.0) as http:
|
|
100
|
-
try:
|
|
101
|
-
js = await http.get(
|
|
102
|
-
f"{_api_base(self._base_url)}/learning/jobs/{job_id}/events", params=params
|
|
103
|
-
)
|
|
104
|
-
except HTTPError as he:
|
|
105
|
-
try:
|
|
106
|
-
print(
|
|
107
|
-
f"[poll] events HTTPError status={he.status} url={he.url} since_seq={since_seq} body={(he.body_snippet or '')[:200]}"
|
|
108
|
-
)
|
|
109
|
-
except Exception:
|
|
110
|
-
pass
|
|
111
|
-
raise
|
|
112
|
-
if isinstance(js, dict):
|
|
113
|
-
evs = js.get("events") or js.get("data")
|
|
114
|
-
if isinstance(evs, list):
|
|
115
|
-
return evs
|
|
116
|
-
return []
|
|
117
|
-
|
|
118
|
-
async def get_metrics(
|
|
119
|
-
self, job_id: str, *, after_step: int = -1, limit: int = 200
|
|
120
|
-
) -> List[Dict[str, Any]]:
|
|
121
|
-
params = {"after_step": after_step, "limit": limit}
|
|
122
|
-
async with AsyncHttpClient(self._base_url, self._api_key, timeout=30.0) as http:
|
|
123
|
-
js = await http.get(
|
|
124
|
-
f"{_api_base(self._base_url)}/learning/jobs/{job_id}/metrics", params=params
|
|
125
|
-
)
|
|
126
|
-
if isinstance(js, dict) and isinstance(js.get("points"), list):
|
|
127
|
-
return js["points"]
|
|
128
|
-
return []
|
|
129
|
-
|
|
130
|
-
async def poll_until_terminal(
|
|
131
|
-
self,
|
|
132
|
-
job_id: str,
|
|
133
|
-
*,
|
|
134
|
-
interval_seconds: float = 2.0,
|
|
135
|
-
max_seconds: float | None = None,
|
|
136
|
-
empty_polls_threshold: int = 5,
|
|
137
|
-
startup_deadline_s: int = 45,
|
|
138
|
-
on_event: Optional[Callable[[Dict[str, Any]], None]] = None,
|
|
139
|
-
on_metric: Optional[Callable[[Dict[str, Any]], None]] = None,
|
|
140
|
-
) -> Dict[str, Any]:
|
|
141
|
-
last_seq_by_stream: Dict[str, int] = {}
|
|
142
|
-
events_job_id: Optional[str] = None
|
|
143
|
-
last_status: Optional[str] = None
|
|
144
|
-
last_step_by_name: Dict[str, int] = {}
|
|
145
|
-
empty_polls = 0
|
|
146
|
-
saw_any_event = False
|
|
147
|
-
start_t = time.time()
|
|
148
|
-
terminal = {"succeeded", "failed", "cancelled", "canceled", "error", "completed"}
|
|
149
|
-
|
|
150
|
-
while True:
|
|
151
|
-
status_data: Optional[Dict[str, Any]] = None
|
|
152
|
-
try:
|
|
153
|
-
status_data = await self.get_job(job_id)
|
|
154
|
-
except Exception:
|
|
155
|
-
status_data = None
|
|
156
|
-
if status_data is None:
|
|
157
|
-
try:
|
|
158
|
-
print(f"[poll] get_job returned None base={self._base_url} job_id={job_id}")
|
|
159
|
-
except Exception:
|
|
160
|
-
pass
|
|
161
|
-
status = str((status_data or {}).get("status") or "").lower()
|
|
162
|
-
if status_data:
|
|
163
|
-
linked = status_data.get("linked_job_id")
|
|
164
|
-
if isinstance(linked, str) and linked and linked != events_job_id:
|
|
165
|
-
events_job_id = linked
|
|
166
|
-
try:
|
|
167
|
-
print(f"[poll] discovered linked_job_id stream={events_job_id}")
|
|
168
|
-
except Exception:
|
|
169
|
-
pass
|
|
170
|
-
if status and status != last_status:
|
|
171
|
-
last_status = status
|
|
172
|
-
# Status transitions only to avoid log spam
|
|
173
|
-
if on_event:
|
|
174
|
-
try:
|
|
175
|
-
on_event({"type": "rl.status", "message": status})
|
|
176
|
-
except Exception:
|
|
177
|
-
pass
|
|
178
|
-
|
|
179
|
-
# Events
|
|
180
|
-
stream_ids = [job_id]
|
|
181
|
-
if events_job_id and events_job_id not in stream_ids:
|
|
182
|
-
stream_ids.append(events_job_id)
|
|
183
|
-
try:
|
|
184
|
-
print(
|
|
185
|
-
f"[poll] streams={stream_ids} intervals={interval_seconds}s since_map={last_seq_by_stream} empty_polls={empty_polls}"
|
|
186
|
-
)
|
|
187
|
-
except Exception:
|
|
188
|
-
pass
|
|
189
|
-
total_events_this_cycle = 0
|
|
190
|
-
terminal_event_seen = False
|
|
191
|
-
terminal_event_status: Optional[str] = None
|
|
192
|
-
for ev_id in stream_ids:
|
|
193
|
-
since = last_seq_by_stream.get(ev_id, 0)
|
|
194
|
-
try:
|
|
195
|
-
events = await self.get_events(ev_id, since_seq=since, limit=200)
|
|
196
|
-
except HTTPError as he:
|
|
197
|
-
try:
|
|
198
|
-
print(
|
|
199
|
-
f"[poll] get_events error status={he.status} url={he.url} since={since} body={(he.body_snippet or '')[:200]}"
|
|
200
|
-
)
|
|
201
|
-
except Exception:
|
|
202
|
-
pass
|
|
203
|
-
events = []
|
|
204
|
-
except Exception as e:
|
|
205
|
-
try:
|
|
206
|
-
print(
|
|
207
|
-
f"[poll] get_events unexpected error ev_id={ev_id} since={since} err={type(e).__name__}: {e}"
|
|
208
|
-
)
|
|
209
|
-
except Exception:
|
|
210
|
-
pass
|
|
211
|
-
events = []
|
|
212
|
-
total_events_this_cycle += len(events)
|
|
213
|
-
if events:
|
|
214
|
-
saw_any_event = True
|
|
215
|
-
for e in events:
|
|
216
|
-
seq_val = int(e.get("seq") or 0)
|
|
217
|
-
if seq_val <= last_seq_by_stream.get(ev_id, 0):
|
|
218
|
-
continue
|
|
219
|
-
last_seq_by_stream[ev_id] = seq_val
|
|
220
|
-
if on_event:
|
|
221
|
-
try:
|
|
222
|
-
on_event(e)
|
|
223
|
-
except Exception:
|
|
224
|
-
pass
|
|
225
|
-
et = str(e.get("type") or e.get("event_type") or "").lower()
|
|
226
|
-
if et in ("rl.job.completed", "workflow.completed", "rl.train.completed"):
|
|
227
|
-
terminal_event_seen = True
|
|
228
|
-
terminal_event_status = "succeeded"
|
|
229
|
-
elif et in ("rl.job.failed", "workflow.failed"):
|
|
230
|
-
terminal_event_seen = True
|
|
231
|
-
terminal_event_status = "failed"
|
|
232
|
-
|
|
233
|
-
# Metrics
|
|
234
|
-
try:
|
|
235
|
-
after = max(last_step_by_name.values()) if last_step_by_name else -1
|
|
236
|
-
points = await self.get_metrics(job_id, after_step=after, limit=200)
|
|
237
|
-
for p in points:
|
|
238
|
-
name = str(p.get("name") or "")
|
|
239
|
-
step = int(p.get("step") or -1)
|
|
240
|
-
if step <= last_step_by_name.get(name, -1):
|
|
241
|
-
continue
|
|
242
|
-
last_step_by_name[name] = step
|
|
243
|
-
if on_metric:
|
|
244
|
-
try:
|
|
245
|
-
on_metric(p)
|
|
246
|
-
except Exception:
|
|
247
|
-
pass
|
|
248
|
-
except Exception:
|
|
249
|
-
pass
|
|
250
|
-
|
|
251
|
-
if terminal_event_seen:
|
|
252
|
-
return {"status": terminal_event_status or status or "completed", "job_id": job_id}
|
|
253
|
-
if status and status in terminal:
|
|
254
|
-
return {"status": status, "job_id": job_id}
|
|
255
|
-
|
|
256
|
-
if total_events_this_cycle == 0:
|
|
257
|
-
empty_polls += 1
|
|
258
|
-
else:
|
|
259
|
-
empty_polls = 0
|
|
260
|
-
if empty_polls >= max(1, int(empty_polls_threshold)):
|
|
261
|
-
try:
|
|
262
|
-
print(
|
|
263
|
-
f"[poll] threshold hit: empty_polls={empty_polls} >= {empty_polls_threshold} streams={stream_ids} last_seq_map={last_seq_by_stream}"
|
|
264
|
-
)
|
|
265
|
-
except Exception:
|
|
266
|
-
pass
|
|
267
|
-
raise AssertionError(
|
|
268
|
-
f"No new events detected for {empty_polls_threshold} consecutive polls. Check event ingestion."
|
|
269
|
-
)
|
|
270
|
-
|
|
271
|
-
if not saw_any_event and (time.time() - start_t) > int(startup_deadline_s):
|
|
272
|
-
try:
|
|
273
|
-
print(
|
|
274
|
-
f"[poll] startup window exceeded: {startup_deadline_s}s base={self._base_url} job={job_id} streams={stream_ids} last_seq_map={last_seq_by_stream}"
|
|
275
|
-
)
|
|
276
|
-
except Exception:
|
|
277
|
-
pass
|
|
278
|
-
raise AssertionError(
|
|
279
|
-
f"No events observed within startup window ({startup_deadline_s}s). Investigate event streaming."
|
|
280
|
-
)
|
|
281
|
-
|
|
282
|
-
await sleep(interval_seconds)
|
|
283
|
-
if max_seconds is not None and (time.time() - start_t) >= max_seconds:
|
|
284
|
-
raise TimeoutError(f"Polling timed out after {max_seconds}s for job {job_id}")
|
|
5
|
+
__all__ = ["RlClient"]
|
|
@@ -0,0 +1,29 @@
|
|
|
1
|
+
"""Public API for the SFT fine-tuning package.

Re-exports the fine-tuning client plus the JSONL dataset helpers so callers
can import everything from the package root.
"""

from .client import FtClient
from .data import (
    SFTDataError,
    SFTExample,
    SFTMessage,
    SFTToolCall,
    SFTToolDefinition,
    coerce_example,
    collect_sft_jsonl_errors,
    iter_sft_examples,
    load_jsonl,
    parse_jsonl_line,
    validate_jsonl_or_raise,
)

# Kept in the same (alphabetical) order as the import list above; the original
# listed "collect_sft_jsonl_errors" before "coerce_example", which broke that
# ordering ("coe" sorts before "col").
__all__ = [
    "FtClient",
    "SFTDataError",
    "SFTExample",
    "SFTMessage",
    "SFTToolCall",
    "SFTToolDefinition",
    "coerce_example",
    "collect_sft_jsonl_errors",
    "iter_sft_examples",
    "load_jsonl",
    "parse_jsonl_line",
    "validate_jsonl_or_raise",
]
|
|
@@ -0,0 +1,68 @@
|
|
|
1
|
+
from __future__ import annotations
|
|
2
|
+
|
|
3
|
+
from pathlib import Path
|
|
4
|
+
from typing import Any
|
|
5
|
+
|
|
6
|
+
from ...http import AsyncHttpClient, HTTPError
|
|
7
|
+
from .config import prepare_sft_job_payload
|
|
8
|
+
from .data import validate_jsonl_or_raise
|
|
9
|
+
|
|
10
|
+
|
|
11
|
+
class FtClient:
    """Thin async client for the fine-tuning ("learning") HTTP endpoints.

    Each call opens a short-lived :class:`AsyncHttpClient` session scoped to
    the request, so instances hold no open connections between calls.
    """

    def __init__(self, base_url: str, api_key: str, *, timeout: float = 30.0) -> None:
        # Normalize the base URL so path joins never produce a double slash.
        self._base_url = base_url.rstrip("/")
        self._api_key = api_key
        self._timeout = timeout

    async def upload_training_file(self, path: str | Path, *, purpose: str = "fine-tune") -> str:
        """Upload a local file and return the server-assigned file id.

        JSONL files intended for fine-tuning are validated locally first so a
        malformed dataset fails fast instead of at job runtime.

        Raises:
            HTTPError: if the server response is not a dict carrying an ``id``.
        """
        file_path = Path(path)
        if file_path.suffix.lower() == ".jsonl" and purpose == "fine-tune":
            validate_jsonl_or_raise(file_path, min_messages=2)
        payload = file_path.read_bytes()
        async with AsyncHttpClient(self._base_url, self._api_key, timeout=self._timeout) as http:
            response = await http.post_multipart(
                "/api/learning/files",
                data={"purpose": purpose},
                files={"file": (file_path.name, payload, _infer_content_type(file_path.name))},
            )
            if not isinstance(response, dict) or "id" not in response:
                raise HTTPError(
                    status=500,
                    url="/api/learning/files",
                    message="invalid_upload_response",
                    body_snippet=str(response)[:200],
                )
            return str(response["id"])

    async def create_sft_job(
        self,
        *,
        model: str,
        training_file_id: str,
        hyperparameters: dict[str, Any],
        metadata: dict[str, Any] | None = None,
    ) -> dict[str, Any]:
        """Create (but do not start) an offline SFT job; returns the job record."""
        job_payload = prepare_sft_job_payload(
            model=model,
            training_file=training_file_id,
            hyperparameters=hyperparameters,
            metadata=metadata,
            training_type="sft_offline",
            training_file_field="training_file_id",
            require_training_file=True,
        )
        async with AsyncHttpClient(self._base_url, self._api_key, timeout=self._timeout) as http:
            return await http.post_json("/api/learning/jobs", json=job_payload)

    async def start_job(self, job_id: str) -> dict[str, Any]:
        """Kick off a previously created job; returns the server's response body."""
        async with AsyncHttpClient(self._base_url, self._api_key, timeout=self._timeout) as http:
            return await http.post_json(f"/api/learning/jobs/{job_id}/start", json={})
|
|
58
|
+
|
|
59
|
+
|
|
60
|
+
def _infer_content_type(filename: str) -> str:
    """Best-effort MIME type for an uploaded file, keyed on its extension.

    Falls back to ``application/octet-stream`` for unrecognized suffixes.
    """
    suffix_types = {
        ".jsonl": "application/jsonl",
        ".json": "application/json",
        ".txt": "text/plain",
    }
    lowered = filename.lower()
    for suffix, content_type in suffix_types.items():
        if lowered.endswith(suffix):
            return content_type
    return "application/octet-stream"
|