synth-ai 0.2.9.dev4__py3-none-any.whl → 0.2.9.dev6__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of synth-ai has been flagged as potentially problematic; consult the registry's advisory page for more details.

Files changed (353):
  1. examples/__init__.py +16 -0
  2. examples/crafter_debug_render.py +23 -17
  3. examples/qwen_coder/README.md +102 -0
  4. examples/qwen_coder/_shared.py +113 -0
  5. examples/qwen_coder/configs/coder_lora_30b.toml +61 -0
  6. examples/qwen_coder/configs/coder_lora_4b.toml +57 -0
  7. examples/qwen_coder/configs/coder_lora_small.toml +58 -0
  8. examples/qwen_coder/generate_dataset.py +98 -0
  9. examples/qwen_coder/infer_ft_smoke.py +64 -0
  10. examples/qwen_coder/infer_prod_proxy.py +73 -0
  11. examples/qwen_coder/infer_via_synth.py +87 -0
  12. examples/qwen_coder/scripts/infer_coder.sh +18 -0
  13. examples/qwen_coder/scripts/train_coder_30b.sh +21 -0
  14. examples/qwen_coder/sft_full_17b.py +103 -0
  15. examples/qwen_coder/sft_lora_30b.py +110 -0
  16. examples/qwen_coder/subset_jsonl.py +38 -0
  17. examples/qwen_coder/validate_jsonl.py +59 -0
  18. examples/rl/configs/eval_base_qwen.toml +1 -1
  19. examples/rl/configs/rl_from_base_qwen17.toml +1 -1
  20. examples/rl/download_dataset.py +26 -10
  21. examples/rl/run_eval.py +53 -52
  22. examples/rl/run_rl_and_save.py +29 -12
  23. examples/rl/task_app/math_single_step.py +180 -41
  24. examples/rl/task_app/math_task_app.py +14 -6
  25. examples/sft/README.md +139 -0
  26. examples/sft/configs/crafter_fft_qwen0p6b.toml +44 -0
  27. examples/sft/configs/crafter_lora_qwen0p6b.toml +45 -0
  28. examples/sft/evaluate.py +117 -0
  29. examples/sft/export_dataset.py +117 -0
  30. examples/sft/generate_traces.py +162 -0
  31. examples/swe/__init__.py +12 -0
  32. examples/swe/task_app/README.md +105 -0
  33. examples/swe/task_app/__init__.py +2 -0
  34. examples/swe/task_app/grpo_swe_mini.py +571 -0
  35. examples/swe/task_app/grpo_swe_mini_task_app.py +136 -0
  36. examples/swe/task_app/hosted/README.md +173 -0
  37. examples/swe/task_app/hosted/__init__.py +5 -0
  38. examples/swe/task_app/hosted/branching.py +143 -0
  39. examples/swe/task_app/hosted/environment_routes.py +1289 -0
  40. examples/swe/task_app/hosted/envs/__init__.py +1 -0
  41. examples/swe/task_app/hosted/envs/crafter/__init__.py +6 -0
  42. examples/swe/task_app/hosted/envs/crafter/app.py +1 -0
  43. examples/swe/task_app/hosted/envs/crafter/environment.py +522 -0
  44. examples/swe/task_app/hosted/envs/crafter/policy.py +478 -0
  45. examples/swe/task_app/hosted/envs/crafter/react_agent.py +108 -0
  46. examples/swe/task_app/hosted/envs/crafter/shared.py +305 -0
  47. examples/swe/task_app/hosted/envs/crafter/tools.py +47 -0
  48. examples/swe/task_app/hosted/envs/mini_swe/__init__.py +8 -0
  49. examples/swe/task_app/hosted/envs/mini_swe/environment.py +1164 -0
  50. examples/swe/task_app/hosted/envs/mini_swe/policy.py +355 -0
  51. examples/swe/task_app/hosted/envs/mini_swe/shared.py +83 -0
  52. examples/swe/task_app/hosted/envs/mini_swe/tools.py +96 -0
  53. examples/swe/task_app/hosted/hosted_app.py +204 -0
  54. examples/swe/task_app/hosted/inference/__init__.py +5 -0
  55. examples/swe/task_app/hosted/inference/openai_client.py +618 -0
  56. examples/swe/task_app/hosted/main.py +100 -0
  57. examples/swe/task_app/hosted/policy_routes.py +1079 -0
  58. examples/swe/task_app/hosted/registry.py +195 -0
  59. examples/swe/task_app/hosted/rollout.py +1869 -0
  60. examples/swe/task_app/hosted/storage/__init__.py +5 -0
  61. examples/swe/task_app/hosted/storage/volume.py +211 -0
  62. examples/swe/task_app/hosted/test_agents.py +161 -0
  63. examples/swe/task_app/hosted/test_service.py +137 -0
  64. examples/swe/task_app/hosted/utils.py +62 -0
  65. examples/vlm/README.md +68 -0
  66. examples/vlm/configs/crafter_vlm_gpt4o.toml +44 -0
  67. examples/vlm/crafter_image_only_agent.py +207 -0
  68. examples/vlm/crafter_openai_vlm_agent.py +277 -0
  69. examples/vlm/filter_image_rows.py +63 -0
  70. examples/vlm/run_crafter_vlm_benchmark.py +316 -0
  71. examples/warming_up_to_rl/analyze_trace_db.py +12 -10
  72. examples/warming_up_to_rl/configs/rl_from_base_qwen4b.toml +11 -1
  73. examples/warming_up_to_rl/export_trace_sft.py +218 -36
  74. examples/warming_up_to_rl/groq_test.py +15 -8
  75. examples/warming_up_to_rl/manage_secrets.py +29 -25
  76. examples/warming_up_to_rl/readme.md +9 -2
  77. examples/warming_up_to_rl/run_eval.py +137 -61
  78. examples/warming_up_to_rl/run_fft_and_save.py +131 -60
  79. examples/warming_up_to_rl/run_local_rollout.py +88 -39
  80. examples/warming_up_to_rl/run_local_rollout_modal.py +114 -28
  81. examples/warming_up_to_rl/run_local_rollout_parallel.py +81 -20
  82. examples/warming_up_to_rl/run_local_rollout_traced.py +126 -23
  83. examples/warming_up_to_rl/run_rl_and_save.py +35 -12
  84. examples/warming_up_to_rl/run_rollout_remote.py +44 -19
  85. examples/warming_up_to_rl/task_app/README.md +6 -2
  86. examples/warming_up_to_rl/task_app/grpo_crafter.py +319 -57
  87. examples/warming_up_to_rl/task_app/grpo_crafter_task_app.py +11 -30
  88. examples/warming_up_to_rl/task_app/synth_envs_hosted/__init__.py +1 -1
  89. examples/warming_up_to_rl/task_app/synth_envs_hosted/branching.py +9 -11
  90. examples/warming_up_to_rl/task_app/synth_envs_hosted/environment_routes.py +137 -182
  91. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/__init__.py +1 -1
  92. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/__init__.py +1 -1
  93. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/app.py +1 -1
  94. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/environment.py +150 -57
  95. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/policy.py +105 -69
  96. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/react_agent.py +19 -7
  97. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/shared.py +45 -42
  98. examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/tools.py +1 -1
  99. examples/warming_up_to_rl/task_app/synth_envs_hosted/hosted_app.py +47 -45
  100. examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/__init__.py +1 -1
  101. examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/openai_client.py +198 -92
  102. examples/warming_up_to_rl/task_app/synth_envs_hosted/main.py +0 -2
  103. examples/warming_up_to_rl/task_app/synth_envs_hosted/policy_routes.py +361 -263
  104. examples/warming_up_to_rl/task_app/synth_envs_hosted/registry.py +21 -23
  105. examples/warming_up_to_rl/task_app/synth_envs_hosted/rollout.py +394 -274
  106. examples/warming_up_to_rl/task_app/synth_envs_hosted/storage/__init__.py +1 -1
  107. examples/warming_up_to_rl/task_app/synth_envs_hosted/storage/volume.py +56 -62
  108. examples/warming_up_to_rl/task_app/synth_envs_hosted/test_agents.py +1 -0
  109. examples/warming_up_to_rl/task_app/synth_envs_hosted/test_service.py +6 -15
  110. examples/warming_up_to_rl/task_app/synth_envs_hosted/utils.py +4 -3
  111. synth/__init__.py +14 -0
  112. synth_ai/__init__.py +20 -4
  113. synth_ai/api/models/supported.py +376 -0
  114. synth_ai/api/train/builders.py +157 -26
  115. synth_ai/api/train/cli.py +213 -57
  116. synth_ai/api/train/config_finder.py +65 -5
  117. synth_ai/api/train/env_resolver.py +33 -15
  118. synth_ai/api/train/pollers.py +13 -4
  119. synth_ai/api/train/supported_algos.py +139 -0
  120. synth_ai/api/train/task_app.py +5 -3
  121. synth_ai/api/train/utils.py +33 -48
  122. synth_ai/cli/__init__.py +19 -4
  123. synth_ai/cli/_modal_wrapper.py +28 -0
  124. synth_ai/cli/_typer_patch.py +49 -0
  125. synth_ai/cli/balance.py +2 -3
  126. synth_ai/cli/calc.py +1 -1
  127. synth_ai/cli/demo.py +21 -6
  128. synth_ai/cli/recent.py +2 -2
  129. synth_ai/cli/rl_demo.py +77 -17
  130. synth_ai/cli/root.py +116 -39
  131. synth_ai/cli/status.py +2 -2
  132. synth_ai/cli/task_apps.py +1709 -243
  133. synth_ai/cli/traces.py +7 -4
  134. synth_ai/cli/turso.py +73 -0
  135. synth_ai/cli/watch.py +12 -18
  136. synth_ai/core/experiment.py +0 -2
  137. synth_ai/demo_registry.py +68 -31
  138. synth_ai/demos/core/cli.py +516 -194
  139. synth_ai/demos/demo_task_apps/__init__.py +3 -3
  140. synth_ai/demos/demo_task_apps/core.py +64 -28
  141. synth_ai/demos/demo_task_apps/crafter/configs/crafter_fft_4b.toml +2 -3
  142. synth_ai/demos/demo_task_apps/crafter/grpo_crafter_task_app.py +37 -30
  143. synth_ai/demos/demo_task_apps/math/_common.py +1 -2
  144. synth_ai/demos/demo_task_apps/math/app.py +2 -1
  145. synth_ai/demos/demo_task_apps/math/deploy_modal.py +3 -6
  146. synth_ai/demos/demo_task_apps/math/modal_task_app.py +183 -82
  147. synth_ai/demos/demo_task_apps/math/task_app_entry.py +0 -2
  148. synth_ai/environments/examples/bandit/engine.py +12 -4
  149. synth_ai/environments/examples/bandit/taskset.py +4 -4
  150. synth_ai/environments/examples/crafter_classic/environment.py +76 -1
  151. synth_ai/environments/reproducibility/tree.py +5 -6
  152. synth_ai/environments/service/app.py +11 -12
  153. synth_ai/environments/service/core_routes.py +10 -9
  154. synth_ai/environments/stateful/engine.py +1 -1
  155. synth_ai/environments/tasks/core.py +1 -0
  156. synth_ai/environments/tasks/filters.py +5 -6
  157. synth_ai/environments/tasks/utils.py +4 -5
  158. synth_ai/evals/base.py +0 -2
  159. synth_ai/handshake.py +11 -9
  160. synth_ai/http.py +1 -1
  161. synth_ai/http_client.py +43 -11
  162. synth_ai/inference/__init__.py +0 -2
  163. synth_ai/inference/client.py +20 -6
  164. synth_ai/jobs/client.py +103 -78
  165. synth_ai/learning/__init__.py +41 -6
  166. synth_ai/learning/algorithms.py +14 -0
  167. synth_ai/learning/client.py +121 -29
  168. synth_ai/learning/config.py +2 -40
  169. synth_ai/learning/constants.py +0 -2
  170. synth_ai/learning/ft_client.py +4 -56
  171. synth_ai/learning/health.py +13 -7
  172. synth_ai/learning/jobs.py +43 -47
  173. synth_ai/{rl → learning/rl}/__init__.py +14 -5
  174. synth_ai/learning/rl/client.py +267 -0
  175. synth_ai/learning/rl/config.py +31 -0
  176. synth_ai/{rl → learning/rl}/contracts.py +5 -10
  177. synth_ai/{rl → learning/rl}/env_keys.py +45 -16
  178. synth_ai/learning/rl/secrets.py +13 -0
  179. synth_ai/learning/rl_client.py +2 -253
  180. synth_ai/learning/sft/__init__.py +29 -0
  181. synth_ai/learning/sft/client.py +68 -0
  182. synth_ai/learning/sft/config.py +270 -0
  183. synth_ai/learning/sft/data.py +295 -0
  184. synth_ai/learning/sse.py +25 -26
  185. synth_ai/learning/validators.py +25 -24
  186. synth_ai/lm/__init__.py +21 -47
  187. synth_ai/task/__init__.py +26 -27
  188. synth_ai/task/apps/__init__.py +18 -19
  189. synth_ai/task/auth.py +35 -23
  190. synth_ai/task/client.py +15 -13
  191. synth_ai/task/contracts.py +37 -35
  192. synth_ai/task/datasets.py +9 -6
  193. synth_ai/task/errors.py +11 -10
  194. synth_ai/task/health.py +17 -11
  195. synth_ai/task/json.py +58 -24
  196. synth_ai/task/proxy.py +15 -14
  197. synth_ai/task/rubrics.py +22 -15
  198. synth_ai/task/server.py +43 -17
  199. synth_ai/task/tracing_utils.py +12 -7
  200. synth_ai/task/validators.py +0 -1
  201. synth_ai/task/vendors.py +5 -7
  202. synth_ai/tracing_v3/__init__.py +2 -0
  203. synth_ai/tracing_v3/abstractions.py +21 -4
  204. synth_ai/tracing_v3/db_config.py +26 -1
  205. synth_ai/tracing_v3/decorators.py +18 -15
  206. synth_ai/tracing_v3/examples/basic_usage.py +3 -2
  207. synth_ai/tracing_v3/hooks.py +6 -4
  208. synth_ai/tracing_v3/llm_call_record_helpers.py +6 -6
  209. synth_ai/tracing_v3/replica_sync.py +1 -0
  210. synth_ai/tracing_v3/session_tracer.py +63 -16
  211. synth_ai/tracing_v3/storage/base.py +89 -1
  212. synth_ai/tracing_v3/storage/config.py +21 -8
  213. synth_ai/tracing_v3/storage/factory.py +10 -8
  214. synth_ai/tracing_v3/storage/utils.py +4 -2
  215. synth_ai/tracing_v3/turso/daemon.py +7 -2
  216. synth_ai/tracing_v3/turso/models.py +5 -2
  217. synth_ai/tracing_v3/turso/native_manager.py +1173 -0
  218. synth_ai/tracing_v3/utils.py +4 -3
  219. synth_ai/v0/api/__init__.py +8 -0
  220. synth_ai/v0/api/models/__init__.py +8 -0
  221. synth_ai/v0/api/models/supported.py +8 -0
  222. synth_ai/v0/config/__init__.py +15 -0
  223. synth_ai/v0/config/base_url.py +12 -0
  224. synth_ai/v0/lm/__init__.py +51 -0
  225. synth_ai/{lm → v0/lm}/caching/ephemeral.py +3 -5
  226. synth_ai/{lm → v0/lm}/caching/handler.py +4 -4
  227. synth_ai/{lm → v0/lm}/caching/initialize.py +1 -1
  228. synth_ai/{lm → v0/lm}/caching/persistent.py +1 -1
  229. synth_ai/{lm → v0/lm}/config.py +6 -1
  230. synth_ai/{lm → v0/lm}/core/all.py +9 -9
  231. synth_ai/{lm → v0/lm}/core/exceptions.py +0 -2
  232. synth_ai/{lm → v0/lm}/core/main.py +19 -7
  233. synth_ai/{lm → v0/lm}/core/main_v3.py +10 -10
  234. synth_ai/{lm → v0/lm}/core/synth_models.py +2 -15
  235. synth_ai/{lm → v0/lm}/core/vendor_clients.py +6 -4
  236. synth_ai/{lm → v0/lm}/overrides.py +4 -4
  237. synth_ai/{lm → v0/lm}/provider_support/anthropic.py +4 -4
  238. synth_ai/{lm → v0/lm}/provider_support/openai.py +5 -5
  239. synth_ai/{lm → v0/lm}/structured_outputs/handler.py +5 -5
  240. synth_ai/{lm → v0/lm}/structured_outputs/rehabilitate.py +1 -1
  241. synth_ai/{lm → v0/lm}/vendors/core/anthropic_api.py +16 -16
  242. synth_ai/{lm → v0/lm}/vendors/core/gemini_api.py +5 -5
  243. synth_ai/{lm → v0/lm}/vendors/core/mistral_api.py +5 -5
  244. synth_ai/{lm → v0/lm}/vendors/core/openai_api.py +12 -10
  245. synth_ai/{lm → v0/lm}/vendors/openai_standard.py +11 -9
  246. synth_ai/{lm → v0/lm}/vendors/openai_standard_responses.py +8 -5
  247. synth_ai/{lm → v0/lm}/vendors/supported/custom_endpoint.py +4 -6
  248. synth_ai/{lm → v0/lm}/vendors/supported/deepseek.py +2 -2
  249. synth_ai/{lm → v0/lm}/vendors/supported/grok.py +2 -2
  250. synth_ai/{lm → v0/lm}/vendors/supported/groq.py +1 -1
  251. synth_ai/{lm → v0/lm}/vendors/supported/ollama.py +1 -1
  252. synth_ai/{lm → v0/lm}/vendors/supported/openrouter.py +3 -3
  253. synth_ai/{lm → v0/lm}/vendors/supported/together.py +1 -1
  254. synth_ai/{lm → v0/lm}/vendors/synth_client.py +38 -11
  255. synth_ai/v0/tracing/upload.py +32 -135
  256. synth_ai/v0/tracing_v3/__init__.py +10 -0
  257. synth_ai/v0/tracing_v3/abstractions.py +3 -0
  258. synth_ai/v0/tracing_v3/decorators.py +3 -0
  259. synth_ai/v0/tracing_v3/llm_call_record_helpers.py +3 -0
  260. synth_ai/v0/tracing_v3/session_tracer.py +3 -0
  261. synth_ai-0.2.9.dev6.dist-info/METADATA +191 -0
  262. {synth_ai-0.2.9.dev4.dist-info → synth_ai-0.2.9.dev6.dist-info}/RECORD +291 -264
  263. {synth_ai-0.2.9.dev4.dist-info → synth_ai-0.2.9.dev6.dist-info}/top_level.txt +1 -0
  264. examples/common_old/backend.py +0 -21
  265. examples/evals_old/README.md +0 -98
  266. examples/evals_old/__init__.py +0 -6
  267. examples/evals_old/compare_models.py +0 -1037
  268. examples/evals_old/example_log.md +0 -145
  269. examples/evals_old/run_demo.sh +0 -126
  270. examples/evals_old/trace_analysis.py +0 -270
  271. examples/finetuning_old/_backup_synth_qwen/config.toml +0 -29
  272. examples/finetuning_old/_backup_synth_qwen/example_log.md +0 -324
  273. examples/finetuning_old/_backup_synth_qwen/filter_traces.py +0 -60
  274. examples/finetuning_old/_backup_synth_qwen/filter_traces_achievements.py +0 -239
  275. examples/finetuning_old/_backup_synth_qwen/purge_v3_traces.py +0 -109
  276. examples/finetuning_old/_backup_synth_qwen/react_agent_lm.py +0 -1924
  277. examples/finetuning_old/_backup_synth_qwen/readme.md +0 -49
  278. examples/finetuning_old/_backup_synth_qwen/run_crafter_qwen4b.py +0 -114
  279. examples/finetuning_old/_backup_synth_qwen/run_demo.sh +0 -195
  280. examples/finetuning_old/_backup_synth_qwen/sft_kickoff.py +0 -118
  281. examples/finetuning_old/synth_qwen_v1/README.md +0 -68
  282. examples/finetuning_old/synth_qwen_v1/filter_traces.py +0 -60
  283. examples/finetuning_old/synth_qwen_v1/filter_traces_achievements.py +0 -239
  284. examples/finetuning_old/synth_qwen_v1/finetune.py +0 -46
  285. examples/finetuning_old/synth_qwen_v1/hello_ft_model.py +0 -71
  286. examples/finetuning_old/synth_qwen_v1/infer.py +0 -37
  287. examples/finetuning_old/synth_qwen_v1/poll.py +0 -44
  288. examples/finetuning_old/synth_qwen_v1/prepare_data.py +0 -35
  289. examples/finetuning_old/synth_qwen_v1/purge_v3_traces.py +0 -109
  290. examples/finetuning_old/synth_qwen_v1/react_agent_lm.py +0 -1932
  291. examples/finetuning_old/synth_qwen_v1/run_crafter_sft_job.py +0 -207
  292. examples/finetuning_old/synth_qwen_v1/run_ft_job.py +0 -232
  293. examples/finetuning_old/synth_qwen_v1/upload_data.py +0 -34
  294. examples/finetuning_old/synth_qwen_v1/util.py +0 -147
  295. examples/rl_old/task_app.py +0 -962
  296. examples/warming_up_to_rl/old/event_rewards.md +0 -234
  297. examples/warming_up_to_rl/old/notes.md +0 -73
  298. examples/warming_up_to_rl/task_app/synth_envs_hosted/test_stepwise_rewards.py +0 -58
  299. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/filter_traces_sft_turso.py +0 -738
  300. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/filter_traces_sft_turso.py +0 -580
  301. synth_ai/environments/examples/sokoban/units/astar_common.py +0 -95
  302. synth_ai/experimental/synth_oss.py +0 -446
  303. synth_ai/install_sqld.sh +0 -40
  304. synth_ai/learning/filtering.py +0 -0
  305. synth_ai/learning/offline/dpo.py +0 -0
  306. synth_ai/learning/offline/providers.py +0 -7
  307. synth_ai/learning/offline/sft.py +0 -0
  308. synth_ai/learning/offline/shared.py +0 -0
  309. synth_ai/learning/online/grpo.py +0 -0
  310. synth_ai/learning/online/irft.py +0 -0
  311. synth_ai/learning/prompts/banking77_injection_eval.py +0 -168
  312. synth_ai/learning/prompts/gepa.py +0 -0
  313. synth_ai/learning/prompts/hello_world_in_context_injection_ex.py +0 -213
  314. synth_ai/learning/prompts/mipro.py +0 -289
  315. synth_ai/learning/prompts/random_search.py +0 -246
  316. synth_ai/learning/prompts/run_mipro_banking77.py +0 -172
  317. synth_ai/learning/prompts/run_random_search_banking77.py +0 -324
  318. synth_ai/rl/secrets.py +0 -19
  319. synth_ai/scripts/verify_rewards.py +0 -100
  320. synth_ai/tracing/__init__.py +0 -30
  321. synth_ai/tracing_v1/__init__.py +0 -33
  322. synth_ai/tracing_v3/turso/__init__.py +0 -25
  323. synth_ai/tracing_v3/turso/manager.py +0 -774
  324. synth_ai/zyk/__init__.py +0 -30
  325. synth_ai-0.2.9.dev4.dist-info/METADATA +0 -131
  326. /synth_ai/{lm → v0/lm}/caching/__init__.py +0 -0
  327. /synth_ai/{lm → v0/lm}/caching/constants.py +0 -0
  328. /synth_ai/{lm → v0/lm}/caching/dbs.py +0 -0
  329. /synth_ai/{lm → v0/lm}/constants.py +0 -0
  330. /synth_ai/{lm → v0/lm}/core/__init__.py +0 -0
  331. /synth_ai/{lm → v0/lm}/cost/__init__.py +0 -0
  332. /synth_ai/{lm → v0/lm}/cost/monitor.py +0 -0
  333. /synth_ai/{lm → v0/lm}/cost/statefulness.py +0 -0
  334. /synth_ai/{lm → v0/lm}/injection.py +0 -0
  335. /synth_ai/{lm → v0/lm}/provider_support/__init__.py +0 -0
  336. /synth_ai/{lm → v0/lm}/provider_support/suppress_logging.py +0 -0
  337. /synth_ai/{lm → v0/lm}/structured_outputs/__init__.py +0 -0
  338. /synth_ai/{lm → v0/lm}/structured_outputs/inject.py +0 -0
  339. /synth_ai/{lm → v0/lm}/tools/__init__.py +0 -0
  340. /synth_ai/{lm → v0/lm}/tools/base.py +0 -0
  341. /synth_ai/{lm → v0/lm}/unified_interface.py +0 -0
  342. /synth_ai/{lm → v0/lm}/vendors/__init__.py +0 -0
  343. /synth_ai/{lm → v0/lm}/vendors/base.py +0 -0
  344. /synth_ai/{lm → v0/lm}/vendors/core/__init__.py +0 -0
  345. /synth_ai/{lm → v0/lm}/vendors/core/synth_dev_api.py +0 -0
  346. /synth_ai/{lm → v0/lm}/vendors/local/__init__.py +0 -0
  347. /synth_ai/{lm → v0/lm}/vendors/local/ollama.py +0 -0
  348. /synth_ai/{lm → v0/lm}/vendors/retries.py +0 -0
  349. /synth_ai/{lm → v0/lm}/vendors/supported/__init__.py +0 -0
  350. /synth_ai/{lm → v0/lm}/warmup.py +0 -0
  351. {synth_ai-0.2.9.dev4.dist-info → synth_ai-0.2.9.dev6.dist-info}/WHEEL +0 -0
  352. {synth_ai-0.2.9.dev4.dist-info → synth_ai-0.2.9.dev6.dist-info}/entry_points.txt +0 -0
  353. {synth_ai-0.2.9.dev4.dist-info → synth_ai-0.2.9.dev6.dist-info}/licenses/LICENSE +0 -0
@@ -0,0 +1,73 @@
1
+ #!/usr/bin/env python3
2
+ """Smoke test: Qwen3 Coder inference via the Synth prod proxy endpoint.
3
+
4
+ No CLI args. Reads SYNTH_API_KEY from env. Optional overrides via env:
5
+ - BACKEND_BASE_URL (defaults to https://agent-learning.onrender.com/api)
6
+ - MODEL (defaults to Qwen/Qwen3-Coder-30B-A3B-Instruct)
7
+ - PROMPT (defaults to a simple coding prompt)
8
+
9
+ Run:
10
+ SYNTH_API_KEY=sk_... uv run python examples/qwen_coder/infer_prod_proxy.py
11
+ """
12
+
13
+ from __future__ import annotations
14
+
15
+ import asyncio
16
+ import os
17
+ from typing import Any
18
+
19
+ import httpx
20
+
21
+
22
+ def _backend_root() -> str:
23
+ raw = os.getenv("BACKEND_BASE_URL", "https://agent-learning.onrender.com/api").strip()
24
+ if raw.endswith("/api"):
25
+ raw = raw[:-4]
26
+ return raw.rstrip("/")
27
+
28
+
29
+ async def main() -> None:
30
+ api_key = os.getenv("SYNTH_API_KEY", "").strip()
31
+ if not api_key:
32
+ raise SystemExit("SYNTH_API_KEY required in environment")
33
+
34
+ model = os.getenv("MODEL", "Qwen/Qwen3-Coder-30B-A3B-Instruct")
35
+ prompt = os.getenv(
36
+ "PROMPT",
37
+ "Write a Python function to reverse a string, then show an example call.",
38
+ )
39
+
40
+ # Prod proxy endpoint
41
+ url = f"{_backend_root()}/api/inference/v1/chat/completions"
42
+
43
+ payload: dict[str, Any] = {
44
+ "model": model,
45
+ "messages": [{"role": "user", "content": prompt}],
46
+ "temperature": 0.2,
47
+ "max_tokens": 256,
48
+ "thinking_budget": 256,
49
+ }
50
+
51
+ async with httpx.AsyncClient(timeout=60.0) as http:
52
+ resp = await http.post(
53
+ url,
54
+ headers={
55
+ "Authorization": f"Bearer {api_key}",
56
+ "Content-Type": "application/json",
57
+ },
58
+ json=payload,
59
+ )
60
+ resp.raise_for_status()
61
+ data = resp.json()
62
+ # Print assistant content (compact)
63
+ try:
64
+ msg = data.get("choices", [{}])[0].get("message", {})
65
+ print(msg.get("content") or data)
66
+ except Exception:
67
+ print(data)
68
+
69
+
70
+ if __name__ == "__main__":
71
+ asyncio.run(main())
72
+
73
+
@@ -0,0 +1,87 @@
1
+ #!/usr/bin/env python3
2
+ """One-shot inference for Qwen3 (and Coder) models via the Synth backend proxy.
3
+
4
+ Usage examples:
5
+
6
+ SYNTH_API_KEY=sk_... BACKEND_BASE_URL=https://agent-learning.onrender.com/api \
7
+ uv run python examples/qwen_coder/infer_via_synth.py \
8
+ --model Qwen/Qwen3-Coder-30B-A3B-Instruct \
9
+ --prompt "Write a Python function to reverse a string." \
10
+ --max-tokens 128 --temperature 0.2
11
+
12
+ Optionally you can point to a specific inference host (e.g., your vLLM or task-app proxy):
13
+
14
+ ... infer_via_synth.py --inference-url https://your-host/api/inference
15
+
16
+ The script defaults the backend base URL to the hosted service if BACKEND_BASE_URL is not set.
17
+ """
18
+
19
+ from __future__ import annotations
20
+
21
+ import argparse
22
+ import asyncio
23
+ import os
24
+ from typing import Any
25
+
26
+ from synth_ai.inference.client import InferenceClient
27
+
28
+
29
+ def _default_backend() -> str:
30
+ raw = os.getenv("BACKEND_BASE_URL", "https://agent-learning.onrender.com/api").strip()
31
+ return raw if raw.endswith("/api") else (raw + "/api")
32
+
33
+
34
+ async def main() -> None:
35
+ p = argparse.ArgumentParser(description=__doc__)
36
+ p.add_argument(
37
+ "--model",
38
+ default=os.getenv("MODEL", "Qwen/Qwen3-Coder-30B-A3B-Instruct"),
39
+ help="Base or ft:<id> model identifier",
40
+ )
41
+ p.add_argument(
42
+ "--prompt",
43
+ default="Write a Python function to reverse a string.",
44
+ help="User prompt text",
45
+ )
46
+ p.add_argument("--max-tokens", type=int, default=256)
47
+ p.add_argument("--temperature", type=float, default=0.2)
48
+ p.add_argument(
49
+ "--inference-url",
50
+ default=os.getenv("INFERENCE_URL"),
51
+ help="Optional backend inference base (e.g., https://host/api/inference)",
52
+ )
53
+ p.add_argument(
54
+ "--timeout", type=float, default=60.0, help="HTTP timeout seconds for backend calls"
55
+ )
56
+ args = p.parse_args()
57
+
58
+ backend = _default_backend()
59
+ api_key = os.getenv("SYNTH_API_KEY", "").strip()
60
+ if not api_key:
61
+ raise SystemExit("SYNTH_API_KEY required (export it or pass via env-file to uvx)")
62
+
63
+ client = InferenceClient(base_url=backend, api_key=api_key, timeout=args.timeout)
64
+
65
+ body: dict[str, Any] = {
66
+ "model": args.model,
67
+ "messages": [{"role": "user", "content": args.prompt}],
68
+ "max_tokens": int(args.max_tokens),
69
+ "temperature": float(args.temperature),
70
+ }
71
+ if args.inference_url:
72
+ # Backend supports forwarding to a specific host when provided
73
+ body["inference_url"] = str(args.inference_url)
74
+
75
+ resp = await client.create_chat_completion(**body)
76
+ try:
77
+ msg = resp.get("choices", [{}])[0].get("message", {})
78
+ content = msg.get("content")
79
+ print(content or resp)
80
+ except Exception:
81
+ print(resp)
82
+
83
+
84
+ if __name__ == "__main__":
85
+ asyncio.run(main())
86
+
87
+
@@ -0,0 +1,18 @@
1
+ #!/usr/bin/env bash
2
+ set -euo pipefail
3
+
4
+ # Optional: pass a .env path as first arg; otherwise relies on current env
5
+ ENV_FILE=${1:-}
6
+
7
+ if [[ -n "${ENV_FILE}" ]]; then
8
+ if [[ ! -f "${ENV_FILE}" ]]; then
9
+ echo "Env file not found: ${ENV_FILE}" >&2
10
+ exit 1
11
+ fi
12
+ set -a; source "${ENV_FILE}"; set +a
13
+ fi
14
+
15
+ # Use prod proxy smoke (base or ft:... via MODEL env)
16
+ uv run python examples/qwen_coder/infer_prod_proxy.py
17
+
18
+
@@ -0,0 +1,21 @@
1
+ #!/usr/bin/env bash
2
+ set -euo pipefail
3
+
4
+ # Optional: pass a .env path as first arg; otherwise relies on current env
5
+ ENV_FILE=${1:-}
6
+
7
+ if [[ -n "${ENV_FILE}" ]]; then
8
+ if [[ ! -f "${ENV_FILE}" ]]; then
9
+ echo "Env file not found: ${ENV_FILE}" >&2
10
+ exit 1
11
+ fi
12
+ set -a; source "${ENV_FILE}"; set +a
13
+ fi
14
+
15
+ uvx synth-ai train \
16
+ --type sft \
17
+ --config examples/qwen_coder/configs/coder_lora_30b.toml \
18
+ --dataset examples/qwen_coder/ft_data/coder_sft.small.jsonl \
19
+ --env-file "${ENV_FILE:-}"
20
+
21
+
@@ -0,0 +1,103 @@
1
+ #!/usr/bin/env python3
2
+ """Submit a full-parameter SFT job for Qwen/Qwen3-1.7B via Synth API."""
3
+
4
+ from __future__ import annotations
5
+
6
+ import asyncio
7
+ import os
8
+ from typing import Any
9
+
10
+ from examples.qwen_coder._shared import (
11
+ ensure_tiny_dataset,
12
+ optional_validation_dataset,
13
+ resolve_output_path,
14
+ )
15
+ from synth_ai.learning.client import LearningClient
16
+
17
+
18
+ def _backend() -> str:
19
+ raw = os.getenv("BACKEND_BASE_URL", "https://agent-learning.onrender.com/api").strip()
20
+ return raw if raw.endswith("/api") else (raw + "/api")
21
+
22
+
23
+ async def main() -> None:
24
+ api_key = os.getenv("SYNTH_API_KEY", "").strip()
25
+ if not api_key:
26
+ raise SystemExit("SYNTH_API_KEY required in env")
27
+
28
+ backend = _backend()
29
+ client = LearningClient(base_url=backend, api_key=api_key, timeout=60.0)
30
+
31
+ data_path = ensure_tiny_dataset()
32
+ file_id = await client.upload_training_file(str(data_path))
33
+
34
+ validation_file_id: str | None = None
35
+ val_path = optional_validation_dataset()
36
+ if val_path and val_path.exists():
37
+ validation_file_id = await client.upload_training_file(str(val_path))
38
+
39
+ hyper: dict[str, Any] = {
40
+ "n_epochs": int(os.getenv("QWEN_CODER_FULL_EPOCHS", "1")),
41
+ "per_device_batch": int(os.getenv("QWEN_CODER_FULL_PER_DEVICE", "1")),
42
+ "gradient_accumulation_steps": int(os.getenv("QWEN_CODER_FULL_ACCUM", "8")),
43
+ "sequence_length": int(os.getenv("QWEN_CODER_FULL_SEQ_LEN", "4096")),
44
+ "learning_rate": float(os.getenv("QWEN_CODER_FULL_LR", "2e-5")),
45
+ "warmup_ratio": float(os.getenv("QWEN_CODER_FULL_WARMUP", "0.05")),
46
+ "train_kind": os.getenv("QWEN_CODER_FULL_TRAIN_KIND", "full"),
47
+ }
48
+
49
+ metadata = {
50
+ "example": "qwen_coder_full_17b",
51
+ "effective_config": {
52
+ "compute": {
53
+ "gpu_type": os.getenv("SYNTH_GPU_TYPE", "H100"),
54
+ "gpu_count": int(os.getenv("SYNTH_GPU_COUNT", "4")),
55
+ "nodes": int(os.getenv("SYNTH_GPU_NODES", "1")),
56
+ }
57
+ },
58
+ }
59
+
60
+ job = await client.create_job(
61
+ training_type="sft_offline",
62
+ model=os.getenv("QWEN_CODER_FULL_MODEL", "Qwen/Qwen3-1.7B"),
63
+ training_file_id=file_id,
64
+ hyperparameters=hyper,
65
+ metadata=metadata,
66
+ validation_file=validation_file_id,
67
+ )
68
+ job_id = str(job.get("id") or job.get("job_id") or "").strip()
69
+ if not job_id:
70
+ raise SystemExit(f"Invalid create_job response: {job}")
71
+
72
+ await client.start_job(job_id)
73
+
74
+ timeout_seconds = float(os.getenv("SYNTH_TIMEOUT", "7200"))
75
+ poll_interval = float(os.getenv("QWEN_CODER_FULL_POLL_INTERVAL", "10"))
76
+
77
+ job_final = await client.poll_until_terminal(
78
+ job_id,
79
+ interval_seconds=poll_interval,
80
+ max_seconds=timeout_seconds,
81
+ )
82
+
83
+ status = str(job_final.get("status"))
84
+ print(f"Job status: {status}")
85
+ result_model = (
86
+ job_final.get("result", {}).get("model_id")
87
+ if isinstance(job_final.get("result"), dict)
88
+ else None
89
+ )
90
+ print(f"Model ID: {result_model}")
91
+ try:
92
+ out_file = resolve_output_path("ft_model_id_full.txt")
93
+ text = (result_model or "").strip()
94
+ if text:
95
+ out_file.write_text(text + "\n", encoding="utf-8")
96
+ print(f"Wrote {out_file} with ft model id")
97
+ except Exception as exc:
98
+ print(f"Warning: failed to write ft_model_id_full.txt: {exc}")
99
+
100
+
101
+ if __name__ == "__main__":
102
+ asyncio.run(main())
103
+
@@ -0,0 +1,110 @@
1
+ #!/usr/bin/env python3
2
+ """Submit a LoRA SFT job for Qwen/Qwen3-Coder-30B-A3B-Instruct via Synth API.
3
+
4
+ Steps:
5
+ - Generate a tiny coder dataset if missing
6
+ - Upload the JSONL
7
+ - Create the job with coder LoRA hyperparameters
8
+ - Start and poll until terminal, then print the resulting model id
9
+
10
+ Env:
11
+ SYNTH_API_KEY (required)
12
+ BACKEND_BASE_URL (defaults to https://agent-learning.onrender.com/api)
13
+ """
14
+
15
+ from __future__ import annotations
16
+
17
+ import asyncio
18
+ import os
19
+ from typing import Any
20
+
21
+ from examples.qwen_coder._shared import (
22
+ ensure_tiny_dataset,
23
+ optional_validation_dataset,
24
+ resolve_output_path,
25
+ )
26
+ from synth_ai.learning.client import LearningClient
27
+
28
+
29
+ def _backend() -> str:
30
+ raw = os.getenv("BACKEND_BASE_URL", "https://agent-learning.onrender.com/api").strip()
31
+ return raw if raw.endswith("/api") else (raw + "/api")
32
+
33
+
34
+ async def main() -> None:
35
+ api_key = os.getenv("SYNTH_API_KEY", "").strip()
36
+ if not api_key:
37
+ raise SystemExit("SYNTH_API_KEY required in env")
38
+
39
+ backend = _backend()
40
+ client = LearningClient(base_url=backend, api_key=api_key, timeout=60.0)
41
+
42
+ # Ensure dataset exists
43
+ data_path = ensure_tiny_dataset()
44
+
45
+ # Upload training file
46
+ file_id = await client.upload_training_file(str(data_path))
47
+
48
+ # Optional validation file if present alongside training set
49
+ val_path = optional_validation_dataset()
50
+ validation_file_id: str | None = None
51
+ if val_path and val_path.exists():
52
+ validation_file_id = await client.upload_training_file(str(val_path))
53
+
54
+ # Minimal hyperparameters for LoRA SFT (aligned with coder_lora_30b.toml)
55
+ hyper: dict[str, Any] = {
56
+ "n_epochs": 1,
57
+ "per_device_batch": 1,
58
+ "gradient_accumulation_steps": 64,
59
+ "sequence_length": 4096,
60
+ "learning_rate": 5e-6,
61
+ "warmup_ratio": 0.03,
62
+ "train_kind": "peft",
63
+ }
64
+
65
+ # Create job
66
+ job = await client.create_job(
67
+ training_type="sft_offline",
68
+ model="Qwen/Qwen3-Coder-30B-A3B-Instruct",
69
+ training_file_id=file_id,
70
+ hyperparameters=hyper,
71
+ metadata={
72
+ "example": "qwen_coder_lora_30b",
73
+ # Include effective compute hints for backend routing/validation
74
+ "effective_config": {
75
+ "compute": {"gpu_type": "H100", "gpu_count": 4, "nodes": 1}
76
+ },
77
+ },
78
+ validation_file=validation_file_id,
79
+ )
80
+ job_id = str(job.get("id"))
81
+ if not job_id:
82
+ raise SystemExit(f"Invalid create_job response: {job}")
83
+
84
+ # Start
85
+ await client.start_job(job_id)
86
+
87
+ # Poll until terminal
88
+ job_final = await client.poll_until_terminal(job_id, interval_seconds=5.0, max_seconds=7200)
89
+ status = str(job_final.get("status"))
90
+ print(f"Job status: {status}")
91
+ # Print resulting model id if available and write to ft_data/ft_model_id.txt
92
+ result_model = (
93
+ job_final.get("result", {}).get("model_id")
94
+ if isinstance(job_final.get("result"), dict)
95
+ else None
96
+ )
97
+ print(f"Model ID: {result_model}")
98
+ try:
99
+ out_file = resolve_output_path("ft_model_id.txt")
100
+ text = (result_model or "").strip()
101
+ if text:
102
+ out_file.write_text(text + "\n", encoding="utf-8")
103
+ print(f"Wrote {out_file} with ft model id")
104
+ except Exception as exc:
105
+ # Best-effort write; don't crash if filesystem issues
106
+ print(f"Warning: failed to write ft_model_id.txt: {exc}")
107
+
108
+
109
+ if __name__ == "__main__":
110
+ asyncio.run(main())
@@ -0,0 +1,38 @@
1
+ #!/usr/bin/env python3
2
+ """Create a capped subset of a JSONL dataset for quick runs."""
3
+
4
+ from __future__ import annotations
5
+
6
+ import argparse
7
+ from pathlib import Path
8
+
9
+
10
def main() -> None:
    """Stream at most --n non-empty lines from src into dst, creating parent dirs."""
    parser = argparse.ArgumentParser(description=__doc__)
    parser.add_argument("src", help="Source JSONL path")
    parser.add_argument("dst", help="Destination JSONL path")
    parser.add_argument("--n", type=int, default=200, help="Max examples to keep")
    args = parser.parse_args()

    src = Path(args.src)
    if not src.exists():
        raise SystemExit(f"No such file: {src}")
    dst = Path(args.dst)
    dst.parent.mkdir(parents=True, exist_ok=True)

    kept = 0
    with src.open("r", encoding="utf-8") as fin, dst.open("w", encoding="utf-8") as fout:
        # Blank lines are skipped and never count toward the cap.
        for line in filter(str.strip, fin):
            if kept >= args.n:
                break
            fout.write(line)
            kept += 1
    print(f"Wrote {dst} with {kept} lines")


if __name__ == "__main__":
    main()
37
+
38
+
@@ -0,0 +1,59 @@
1
+ #!/usr/bin/env python3
2
+ """Validate that a JSONL file parses and contains chat-like records.
3
+
4
+ Checks first N lines (default 50) for objects with `messages` including an
5
+ assistant response (role == "assistant").
6
+ """
7
+
8
+ from __future__ import annotations
9
+
10
+ import argparse
11
+ import json
12
+ from pathlib import Path
13
+
14
+
15
+ def main() -> None:
16
+ p = argparse.ArgumentParser(description=__doc__)
17
+ p.add_argument("path", help="Path to JSONL file")
18
+ p.add_argument("--n", type=int, default=50, help="Number of lines to sample")
19
+ args = p.parse_args()
20
+
21
+ src = Path(args.path)
22
+ if not src.exists():
23
+ raise SystemExit(f"No such file: {src}")
24
+
25
+ checked = 0
26
+ ok = 0
27
+ with src.open("r", encoding="utf-8") as f:
28
+ for i, line in enumerate(f, start=1):
29
+ if i > args.n:
30
+ break
31
+ line = line.strip()
32
+ if not line:
33
+ continue
34
+ checked += 1
35
+ try:
36
+ obj = json.loads(line)
37
+ except Exception as exc:
38
+ raise SystemExit(f"Line {i} is not valid JSON: {exc}")
39
+ msgs = obj.get("messages") if isinstance(obj, dict) else None
40
+ if not isinstance(msgs, list):
41
+ raise SystemExit(f"Line {i} missing 'messages' list")
42
+ has_assistant = any(
43
+ isinstance(m, dict) and m.get("role") == "assistant" and m.get("content")
44
+ for m in msgs
45
+ )
46
+ if has_assistant:
47
+ ok += 1
48
+
49
+ if checked == 0:
50
+ raise SystemExit("No lines checked; file empty?")
51
+ if ok == 0:
52
+ raise SystemExit("No assistant messages found in sampled lines")
53
+ print(f"Validated: {ok}/{checked} sampled lines contain assistant messages")
54
+
55
+
56
+ if __name__ == "__main__":
57
+ main()
58
+
59
+
@@ -6,7 +6,7 @@ num_episodes = 50
6
6
  seed_start = 0
7
7
 
8
8
  [policy]
9
- inference_url = "http://localhost:8000/api/inference"
9
+ inference_url = "https://agent-learning.onrender.com/api/inference"
10
10
  max_tokens = 128
11
11
  temperature = 0.0
12
12
 
@@ -11,7 +11,7 @@ base = "Qwen/Qwen3-1.7B"
11
11
 
12
12
  [policy]
13
13
  model = "Qwen/Qwen3-1.7B"
14
- inference_url = "http://localhost:8000/api/inference"
14
+ inference_url = "https://agent-learning.onrender.com/api/inference"
15
15
  max_tokens = 1028
16
16
  temperature = 0.2
17
17
 
@@ -20,10 +20,12 @@ def extract_examples(dataset: Any, *, limit: int | None) -> list[dict[str, str]]
20
20
  solution = item.get("solution") or ""
21
21
  if isinstance(solution, list):
22
22
  solution = "\n".join(str(part) for part in solution)
23
- examples.append({
24
- "problem": problem,
25
- "solution": solution,
26
- })
23
+ examples.append(
24
+ {
25
+ "problem": problem,
26
+ "solution": solution,
27
+ }
28
+ )
27
29
  return examples
28
30
 
29
31
 
@@ -35,12 +37,26 @@ def write_jsonl(path: Path, rows: list[dict[str, str]]) -> None:
35
37
 
36
38
 
37
39
  def main() -> None:
38
- parser = argparse.ArgumentParser(description="Download MATH dataset splits to JSONL for offline use")
39
- parser.add_argument("--output-dir", default="examples/rl/data", help="Directory to write <split>.jsonl files")
40
- parser.add_argument("--dataset", default="nlile/hendrycks-MATH-benchmark", help="Hugging Face dataset identifier")
41
- parser.add_argument("--config", default="algebra", help="Hugging Face dataset config (if required)")
42
- parser.add_argument("--splits", nargs="*", default=["train", "validation", "test"], help="Splits to download")
43
- parser.add_argument("--limit", type=int, default=None, help="Optional cap on examples per split")
40
+ parser = argparse.ArgumentParser(
41
+ description="Download MATH dataset splits to JSONL for offline use"
42
+ )
43
+ parser.add_argument(
44
+ "--output-dir", default="examples/rl/data", help="Directory to write <split>.jsonl files"
45
+ )
46
+ parser.add_argument(
47
+ "--dataset",
48
+ default="nlile/hendrycks-MATH-benchmark",
49
+ help="Hugging Face dataset identifier",
50
+ )
51
+ parser.add_argument(
52
+ "--config", default="algebra", help="Hugging Face dataset config (if required)"
53
+ )
54
+ parser.add_argument(
55
+ "--splits", nargs="*", default=["train", "validation", "test"], help="Splits to download"
56
+ )
57
+ parser.add_argument(
58
+ "--limit", type=int, default=None, help="Optional cap on examples per split"
59
+ )
44
60
  args = parser.parse_args()
45
61
 
46
62
  output_dir = Path(args.output_dir).expanduser()