PyPI - synth-ai - Versions diffs - 0.2.14__py3-none-any.whl → 0.2.17__py3-none-any.whl - Mend

synth-ai 0.2.14__py3-none-any.whl → 0.2.17__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of synth-ai might be problematic. Click here for more details.

Files changed (354) hide show

examples/README.md +1 -0
examples/analyze_semantic_words.sh +2 -2
examples/blog_posts/pokemon_vl/README.md +98 -0
examples/blog_posts/pokemon_vl/configs/eval_qwen3_vl.toml +25 -0
examples/blog_posts/pokemon_vl/configs/eval_rl_final.toml +24 -0
examples/blog_posts/pokemon_vl/configs/filter_high_reward.toml +10 -0
examples/blog_posts/pokemon_vl/configs/train_rl_from_sft.toml +42 -0
examples/blog_posts/pokemon_vl/configs/train_sft_qwen4b_vl.toml +40 -0
examples/blog_posts/warming_up_to_rl/README.md +158 -0
examples/blog_posts/warming_up_to_rl/configs/eval_ft_qwen4b.toml +25 -0
examples/blog_posts/warming_up_to_rl/configs/eval_groq_qwen32b.toml +25 -0
examples/blog_posts/warming_up_to_rl/configs/eval_openai_gpt_oss_120b.toml +29 -0
examples/blog_posts/warming_up_to_rl/configs/filter_high_reward_dataset.toml +10 -0
examples/blog_posts/warming_up_to_rl/configs/train_rl_from_sft.toml +41 -0
examples/blog_posts/warming_up_to_rl/configs/train_sft_qwen4b.toml +40 -0
examples/dev/qwen3_32b_qlora_4xh100.toml +5 -0
examples/multi_step/SFT_README.md +147 -0
examples/multi_step/configs/crafter_rl_outcome.toml +1 -1
examples/multi_step/configs/crafter_rl_stepwise_hosted_judge.toml +73 -115
examples/multi_step/configs/crafter_rl_stepwise_shaped.toml +1 -1
examples/multi_step/configs/crafter_rl_stepwise_simple.toml +1 -1
examples/multi_step/configs/crafter_rl_stepwise_simple_NEW_FORMAT.toml +105 -0
examples/multi_step/configs/crafter_sft_qwen30b_lora.toml +62 -0
examples/multi_step/configs/verilog_rl_lora.toml +80 -123
examples/multi_step/convert_traces_to_sft.py +84 -0
examples/multi_step/run_sft_qwen30b.sh +45 -0
examples/qwen_coder/configs/coder_lora_30b.toml +1 -2
examples/qwen_coder/configs/coder_lora_4b.toml +5 -1
examples/qwen_coder/configs/coder_lora_small.toml +1 -2
examples/qwen_vl/BUGS_AND_FIXES.md +232 -0
examples/qwen_vl/IMAGE_VALIDATION_COMPLETE.md +271 -0
examples/qwen_vl/IMAGE_VALIDATION_SUMMARY.md +260 -0
examples/qwen_vl/INFERENCE_SFT_TESTS.md +412 -0
examples/qwen_vl/NEXT_STEPS_2B.md +325 -0
examples/qwen_vl/QUICKSTART.md +327 -0
examples/qwen_vl/QUICKSTART_RL_VISION.md +110 -0
examples/qwen_vl/README.md +152 -0
examples/qwen_vl/RL_VISION_COMPLETE.md +475 -0
examples/qwen_vl/RL_VISION_TESTING.md +333 -0
examples/qwen_vl/SDK_VISION_INTEGRATION.md +328 -0
examples/qwen_vl/SETUP_COMPLETE.md +274 -0
examples/qwen_vl/VISION_TESTS_COMPLETE.md +489 -0
examples/qwen_vl/VLM_PIPELINE_COMPLETE.md +242 -0
examples/qwen_vl/__init__.py +2 -0
examples/qwen_vl/collect_data_via_cli.md +415 -0
examples/qwen_vl/collect_vision_traces.py +368 -0
examples/qwen_vl/configs/crafter_rl_vision_qwen3vl4b.toml +110 -0
examples/qwen_vl/configs/crafter_vlm_sft_example.toml +59 -0
examples/qwen_vl/configs/eval_gpt4o_mini_vision.toml +26 -0
examples/qwen_vl/configs/eval_gpt4o_vision_proper.toml +29 -0
examples/qwen_vl/configs/eval_gpt5nano_vision.toml +26 -0
examples/qwen_vl/configs/eval_qwen3vl_vision.toml +26 -0
examples/qwen_vl/configs/filter_qwen3vl_sft.toml +49 -0
examples/qwen_vl/configs/filter_vision_sft.toml +52 -0
examples/qwen_vl/configs/filter_vision_test.toml +8 -0
examples/qwen_vl/configs/sft_qwen3_vl_2b_test.toml +54 -0
examples/qwen_vl/crafter_gpt5nano_agent.py +308 -0
examples/qwen_vl/crafter_qwen_vl_agent.py +300 -0
examples/qwen_vl/run_vision_comparison.sh +61 -0
examples/qwen_vl/run_vision_sft_pipeline.sh +175 -0
examples/qwen_vl/test_image_validation.py +201 -0
examples/qwen_vl/test_sft_vision_data.py +110 -0
examples/rl/README.md +6 -6
examples/rl/configs/eval_base_qwen.toml +17 -0
examples/rl/configs/eval_rl_qwen.toml +13 -0
examples/rl/configs/rl_from_base_qwen.toml +62 -0
examples/rl/configs/rl_from_base_qwen17.toml +79 -0
examples/rl/configs/rl_from_ft_qwen.toml +37 -0
examples/rl/run_eval.py +436 -0
examples/rl/run_rl_and_save.py +111 -0
examples/rl/task_app/README.md +21 -0
examples/rl/task_app/math_single_step.py +990 -0
examples/rl/task_app/math_task_app.py +111 -0
examples/run_crafter_demo.sh +2 -2
examples/sft/README.md +6 -6
examples/sft/configs/crafter_fft_qwen0p6b.toml +7 -2
examples/sft/configs/crafter_lora_qwen0p6b.toml +7 -3
examples/sft/evaluate.py +2 -4
examples/sft/export_dataset.py +7 -4
examples/swe/task_app/README.md +33 -3
examples/swe/task_app/grpo_swe_mini.py +4 -1
examples/swe/task_app/grpo_swe_mini_task_app.py +0 -12
examples/swe/task_app/hosted/envs/crafter/react_agent.py +1 -1
examples/swe/task_app/hosted/envs/mini_swe/environment.py +50 -23
examples/swe/task_app/hosted/inference/openai_client.py +4 -4
examples/swe/task_app/hosted/policy_routes.py +0 -2
examples/swe/task_app/hosted/rollout.py +0 -8
examples/swe/task_app/morph_backend.py +178 -0
examples/task_apps/crafter/task_app/README.md +1 -1
examples/task_apps/crafter/task_app/grpo_crafter.py +70 -10
examples/task_apps/crafter/task_app/grpo_crafter_task_app.py +1 -1
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/crafter/policy.py +63 -27
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/crafter/react_agent.py +1 -2
examples/task_apps/crafter/task_app/synth_envs_hosted/inference/openai_client.py +48 -50
examples/task_apps/crafter/task_app/synth_envs_hosted/policy_routes.py +75 -36
examples/task_apps/crafter/task_app/synth_envs_hosted/rollout.py +31 -15
examples/task_apps/enron/__init__.py +1 -0
examples/task_apps/enron/task_app/grpo_enron_task_app.py +1 -1
examples/task_apps/math/README.md +1 -2
examples/task_apps/pokemon_red/README.md +3 -4
examples/task_apps/pokemon_red/eval_image_only_gpt4o.toml +6 -5
examples/task_apps/pokemon_red/eval_pokemon_red_policy.py +1 -2
examples/task_apps/pokemon_red/task_app.py +36 -5
examples/task_apps/sokoban/README.md +2 -3
examples/task_apps/verilog/eval_groq_qwen32b.toml +12 -14
examples/task_apps/verilog/task_app/grpo_verilog_task_app.py +1 -1
examples/vlm/README.md +3 -3
examples/vlm/configs/crafter_vlm_gpt4o.toml +5 -0
examples/vlm/crafter_openai_vlm_agent.py +3 -5
examples/vlm/filter_image_rows.py +1 -1
examples/vlm/run_crafter_vlm_benchmark.py +2 -2
examples/warming_up_to_rl/_utils.py +92 -0
examples/warming_up_to_rl/analyze_trace_db.py +1 -1
examples/warming_up_to_rl/configs/crafter_fft.toml +5 -0
examples/warming_up_to_rl/configs/eval_fft_qwen4b.toml +2 -0
examples/warming_up_to_rl/configs/eval_groq_qwen32b.toml +2 -0
examples/warming_up_to_rl/configs/eval_modal_qwen4b.toml +2 -1
examples/warming_up_to_rl/configs/rl_from_base_qwen4b.toml +2 -1
examples/warming_up_to_rl/configs/rl_from_ft.toml +2 -0
examples/warming_up_to_rl/export_trace_sft.py +174 -60
examples/warming_up_to_rl/readme.md +63 -132
examples/warming_up_to_rl/run_fft_and_save.py +1 -1
examples/warming_up_to_rl/run_local_rollout_traced.py +1 -1
examples/warming_up_to_rl/run_rl_and_save.py +1 -1
examples/warming_up_to_rl/task_app/README.md +42 -0
examples/warming_up_to_rl/task_app/grpo_crafter.py +827 -0
examples/warming_up_to_rl/task_app/grpo_crafter_task_app.py +135 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/README.md +173 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/__init__.py +5 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/branching.py +143 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/environment_routes.py +1226 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/__init__.py +1 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/__init__.py +6 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/app.py +1 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/environment.py +522 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/policy.py +454 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/react_agent.py +108 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/shared.py +305 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/tools.py +47 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/hosted_app.py +204 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/__init__.py +5 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/openai_client.py +618 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/main.py +100 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/policy_routes.py +1084 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/registry.py +195 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/rollout.py +1861 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/storage/__init__.py +5 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/storage/volume.py +211 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/test_agents.py +161 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/test_service.py +137 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/utils.py +62 -0
examples/workflows/math_rl/configs/rl_from_base_qwen.toml +27 -0
examples/workflows/math_rl/configs/rl_from_base_qwen17.toml +5 -0
synth_ai/__init__.py +44 -30
synth_ai/_utils/__init__.py +47 -0
synth_ai/_utils/base_url.py +10 -0
synth_ai/_utils/http.py +10 -0
synth_ai/_utils/prompts.py +10 -0
synth_ai/_utils/task_app_state.py +12 -0
synth_ai/_utils/user_config.py +10 -0
synth_ai/api/models/supported.py +144 -7
synth_ai/api/train/__init__.py +13 -1
synth_ai/api/train/builders.py +9 -3
synth_ai/api/train/cli.py +155 -17
synth_ai/api/train/config_finder.py +18 -11
synth_ai/api/train/configs/__init__.py +8 -1
synth_ai/api/train/configs/rl.py +32 -7
synth_ai/api/train/configs/sft.py +6 -2
synth_ai/api/train/configs/shared.py +59 -2
synth_ai/api/train/env_resolver.py +13 -10
synth_ai/auth/credentials.py +119 -0
synth_ai/cli/__init__.py +61 -69
synth_ai/cli/_modal_wrapper.py +7 -5
synth_ai/cli/_typer_patch.py +0 -2
synth_ai/cli/_validate_task_app.py +22 -4
synth_ai/cli/commands/__init__.py +17 -0
synth_ai/cli/commands/demo/__init__.py +6 -0
synth_ai/cli/commands/demo/core.py +163 -0
synth_ai/cli/commands/deploy/__init__.py +23 -0
synth_ai/cli/commands/deploy/core.py +614 -0
synth_ai/cli/commands/deploy/errors.py +72 -0
synth_ai/cli/commands/deploy/validation.py +11 -0
synth_ai/cli/commands/eval/__init__.py +19 -0
synth_ai/cli/commands/eval/core.py +1109 -0
synth_ai/cli/commands/eval/errors.py +81 -0
synth_ai/cli/commands/eval/validation.py +133 -0
synth_ai/cli/commands/filter/__init__.py +12 -0
synth_ai/cli/commands/filter/core.py +388 -0
synth_ai/cli/commands/filter/errors.py +55 -0
synth_ai/cli/commands/filter/validation.py +77 -0
synth_ai/cli/commands/help/__init__.py +177 -0
synth_ai/cli/commands/help/core.py +73 -0
synth_ai/cli/commands/status/__init__.py +64 -0
synth_ai/cli/commands/status/client.py +192 -0
synth_ai/cli/commands/status/config.py +92 -0
synth_ai/cli/commands/status/errors.py +20 -0
synth_ai/cli/commands/status/formatters.py +164 -0
synth_ai/cli/commands/status/subcommands/__init__.py +9 -0
synth_ai/cli/commands/status/subcommands/files.py +79 -0
synth_ai/cli/commands/status/subcommands/jobs.py +334 -0
synth_ai/cli/commands/status/subcommands/models.py +79 -0
synth_ai/cli/commands/status/subcommands/runs.py +81 -0
synth_ai/cli/commands/status/subcommands/summary.py +47 -0
synth_ai/cli/commands/status/utils.py +114 -0
synth_ai/cli/commands/train/__init__.py +53 -0
synth_ai/cli/commands/train/core.py +21 -0
synth_ai/cli/commands/train/errors.py +117 -0
synth_ai/cli/commands/train/judge_schemas.py +199 -0
synth_ai/cli/commands/train/judge_validation.py +304 -0
synth_ai/cli/commands/train/validation.py +443 -0
synth_ai/cli/demo.py +2 -162
synth_ai/cli/deploy/__init__.py +28 -0
synth_ai/cli/deploy/core.py +5 -0
synth_ai/cli/deploy/errors.py +23 -0
synth_ai/cli/deploy/validation.py +5 -0
synth_ai/cli/eval/__init__.py +36 -0
synth_ai/cli/eval/core.py +5 -0
synth_ai/cli/eval/errors.py +31 -0
synth_ai/cli/eval/validation.py +5 -0
synth_ai/cli/filter/__init__.py +28 -0
synth_ai/cli/filter/core.py +5 -0
synth_ai/cli/filter/errors.py +23 -0
synth_ai/cli/filter/validation.py +5 -0
synth_ai/cli/legacy_root_backup.py +3 -1
synth_ai/cli/lib/__init__.py +10 -0
synth_ai/cli/lib/task_app_discovery.py +7 -0
synth_ai/cli/lib/task_app_env.py +518 -0
synth_ai/cli/modal_serve/__init__.py +12 -0
synth_ai/cli/modal_serve/core.py +14 -0
synth_ai/cli/modal_serve/errors.py +8 -0
synth_ai/cli/modal_serve/validation.py +11 -0
synth_ai/cli/recent.py +2 -1
synth_ai/cli/serve/__init__.py +12 -0
synth_ai/cli/serve/core.py +14 -0
synth_ai/cli/serve/errors.py +8 -0
synth_ai/cli/serve/validation.py +11 -0
synth_ai/cli/setup.py +21 -0
synth_ai/cli/status.py +7 -126
synth_ai/cli/task_app_deploy.py +7 -0
synth_ai/cli/task_app_list.py +25 -0
synth_ai/cli/task_app_modal_serve.py +11 -0
synth_ai/cli/task_app_serve.py +11 -0
synth_ai/cli/task_apps.py +110 -1499
synth_ai/cli/traces.py +1 -1
synth_ai/cli/train/__init__.py +12 -0
synth_ai/cli/train/core.py +21 -0
synth_ai/cli/train/errors.py +8 -0
synth_ai/cli/train/validation.py +24 -0
synth_ai/cli/train.py +5 -0
synth_ai/cli/turso.py +1 -1
synth_ai/cli/watch.py +1 -1
synth_ai/demos/__init__.py +10 -0
synth_ai/demos/core/__init__.py +28 -1
synth_ai/demos/crafter/__init__.py +1 -0
synth_ai/demos/crafter/crafter_fft_4b.toml +55 -0
synth_ai/demos/crafter/grpo_crafter_task_app.py +185 -0
synth_ai/demos/crafter/rl_from_base_qwen4b.toml +74 -0
synth_ai/demos/demo_registry.py +176 -0
synth_ai/demos/demo_task_apps/crafter/grpo_crafter_task_app.py +1 -1
synth_ai/demos/math/__init__.py +1 -0
synth_ai/demos/math/_common.py +16 -0
synth_ai/demos/math/app.py +38 -0
synth_ai/demos/math/config.toml +76 -0
synth_ai/demos/math/deploy_modal.py +54 -0
synth_ai/demos/math/modal_task_app.py +702 -0
synth_ai/demos/math/task_app_entry.py +51 -0
synth_ai/environments/environment/core.py +7 -1
synth_ai/environments/examples/bandit/engine.py +0 -1
synth_ai/environments/examples/bandit/environment.py +0 -1
synth_ai/environments/examples/red/engine.py +33 -12
synth_ai/environments/examples/red/engine_helpers/reward_components.py +151 -179
synth_ai/environments/examples/red/environment.py +26 -0
synth_ai/environments/examples/red/trace_hooks_v3.py +168 -0
synth_ai/environments/examples/wordle/environment.py +0 -1
synth_ai/evals/base.py +16 -5
synth_ai/evals/client.py +1 -1
synth_ai/http.py +8 -22
synth_ai/inference/client.py +1 -1
synth_ai/judge_schemas.py +4 -5
synth_ai/learning/client.py +1 -1
synth_ai/learning/health.py +1 -1
synth_ai/learning/jobs.py +1 -1
synth_ai/learning/rl/client.py +4 -2
synth_ai/learning/rl/env_keys.py +1 -1
synth_ai/learning/rl/secrets.py +1 -1
synth_ai/learning/sft/client.py +1 -1
synth_ai/learning/sft/data.py +407 -4
synth_ai/learning/validators.py +4 -1
synth_ai/streaming/__init__.py +29 -0
synth_ai/streaming/config.py +94 -0
synth_ai/streaming/handlers.py +469 -0
synth_ai/streaming/streamer.py +301 -0
synth_ai/streaming/types.py +95 -0
synth_ai/task/apps/__init__.py +4 -2
synth_ai/task/config.py +6 -4
synth_ai/task/rubrics/__init__.py +1 -2
synth_ai/task/rubrics/loaders.py +14 -10
synth_ai/task/rubrics.py +219 -0
synth_ai/task/trace_correlation_helpers.py +24 -11
synth_ai/task/tracing_utils.py +14 -3
synth_ai/task/validators.py +0 -1
synth_ai/tracing_v3/abstractions.py +3 -3
synth_ai/tracing_v3/config.py +15 -13
synth_ai/tracing_v3/constants.py +21 -0
synth_ai/tracing_v3/db_config.py +3 -1
synth_ai/tracing_v3/decorators.py +10 -7
synth_ai/tracing_v3/llm_call_record_helpers.py +5 -5
synth_ai/tracing_v3/migration_helper.py +1 -2
synth_ai/tracing_v3/session_tracer.py +7 -7
synth_ai/tracing_v3/storage/base.py +29 -29
synth_ai/tracing_v3/storage/config.py +3 -3
synth_ai/tracing_v3/turso/daemon.py +8 -9
synth_ai/tracing_v3/turso/native_manager.py +80 -72
synth_ai/tracing_v3/utils.py +2 -2
synth_ai/utils/__init__.py +101 -0
synth_ai/utils/base_url.py +94 -0
synth_ai/utils/cli.py +131 -0
synth_ai/utils/env.py +294 -0
synth_ai/utils/http.py +172 -0
synth_ai/utils/modal.py +308 -0
synth_ai/utils/process.py +212 -0
synth_ai/utils/prompts.py +39 -0
synth_ai/utils/sqld.py +122 -0
synth_ai/utils/task_app_discovery.py +882 -0
synth_ai/utils/task_app_env.py +186 -0
synth_ai/utils/task_app_state.py +318 -0
synth_ai/utils/user_config.py +137 -0
synth_ai/v0/config/__init__.py +1 -5
synth_ai/v0/config/base_url.py +1 -7
synth_ai/v0/tracing/config.py +1 -1
synth_ai/v0/tracing/decorators.py +1 -1
synth_ai/v0/tracing/upload.py +1 -1
synth_ai/v0/tracing_v1/config.py +1 -1
synth_ai/v0/tracing_v1/decorators.py +1 -1
synth_ai/v0/tracing_v1/upload.py +1 -1
{synth_ai-0.2.14.dist-info → synth_ai-0.2.17.dist-info}/METADATA +91 -32
{synth_ai-0.2.14.dist-info → synth_ai-0.2.17.dist-info}/RECORD +341 -154
synth_ai/cli/man.py +0 -106
synth_ai/cli/tui.py +0 -57
synth_ai/compound/cais.py +0 -0
synth_ai/core/experiment.py +0 -13
synth_ai/core/system.py +0 -15
synth_ai/demo_registry.py +0 -295
synth_ai/handshake.py +0 -109
synth_ai/tui/__init__.py +0 -5
synth_ai/tui/__main__.py +0 -13
synth_ai/tui/cli/__init__.py +0 -1
synth_ai/tui/cli/query_experiments.py +0 -164
synth_ai/tui/cli/query_experiments_v3.py +0 -164
synth_ai/tui/dashboard.py +0 -906
{synth_ai-0.2.14.dist-info → synth_ai-0.2.17.dist-info}/WHEEL +0 -0
{synth_ai-0.2.14.dist-info → synth_ai-0.2.17.dist-info}/entry_points.txt +0 -0
{synth_ai-0.2.14.dist-info → synth_ai-0.2.17.dist-info}/licenses/LICENSE +0 -0
{synth_ai-0.2.14.dist-info → synth_ai-0.2.17.dist-info}/top_level.txt +0 -0

examples/rl/task_app/math_task_app.py ADDED Viewed

@@ -0,0 +1,111 @@
+"""Legacy entrypoint for the math single-step task app."""
+from __future__ import annotations
+import argparse
+from pathlib import Path
+from fastapi.exceptions import RequestValidationError
+from fastapi.responses import JSONResponse
+from starlette.requests import Request
+from synth_ai.task.auth import is_api_key_header_authorized, normalize_environment_api_key
+from synth_ai.task.server import create_task_app, run_task_app
+from .math_single_step import build_config
+def fastapi_app():
+    """Return a FastAPI application for hosting the math task app."""
+    app = create_task_app(build_config())
+    # Replace default health endpoints with auth-tolerant handlers.
+    filtered_routes = []
+    for route in app.router.routes:
+        path = getattr(route, "path", None)
+        methods = getattr(route, "methods", set()) or set()
+        if path in {"/health", "/health/rollout"} and "GET" in methods:
+            continue
+        filtered_routes.append(route)
+    app.router.routes = filtered_routes
+    def _log_env_key_prefix(source: str, env_key: str | None) -> str | None:
+        if not env_key:
+            return None
+        prefix = env_key[: max(1, len(env_key) // 2)]
+        print(f"[{source}] expected ENVIRONMENT_API_KEY prefix: {prefix}")
+        return prefix
+    @app.get("/health")
+    async def health(request: Request):
+        env_key = normalize_environment_api_key()
+        if not env_key:
+            return JSONResponse(
+                status_code=503,
+                content={"status": "unhealthy", "detail": "Missing ENVIRONMENT_API_KEY"},
+            )
+        if not is_api_key_header_authorized(request):
+            prefix = _log_env_key_prefix("health", env_key)
+            content = {"status": "healthy", "authorized": False}
+            if prefix:
+                content["expected_api_key_prefix"] = prefix
+            return JSONResponse(status_code=200, content=content)
+        return {"status": "healthy", "authorized": True}
+    @app.get("/health/rollout")
+    async def health_rollout(request: Request):
+        env_key = normalize_environment_api_key()
+        if not env_key:
+            return JSONResponse(
+                status_code=503,
+                content={"status": "unhealthy", "detail": "Missing ENVIRONMENT_API_KEY"},
+            )
+        if not is_api_key_header_authorized(request):
+            prefix = _log_env_key_prefix("health/rollout", env_key)
+            content = {"status": "healthy", "authorized": False}
+            if prefix:
+                content["expected_api_key_prefix"] = prefix
+            return JSONResponse(status_code=200, content=content)
+        return {"ok": True, "authorized": True}
+    @app.exception_handler(RequestValidationError)
+    async def _on_validation_error(request: Request, exc: RequestValidationError):
+        try:
+            hdr = request.headers
+            snapshot = {
+                "path": str(request.url.path),
+                "have_x_api_key": bool(hdr.get("x-api-key")),
+                "have_x_api_keys": bool(hdr.get("x-api-keys")),
+                "have_authorization": bool(hdr.get("authorization")),
+                "errors": exc.errors()[:5],
+            }
+            print("[422] validation", snapshot, flush=True)
+        except Exception:
+            pass
+        return JSONResponse(
+            status_code=422, content={"status": "invalid", "detail": exc.errors()[:5]}
+        )
+    return app
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser(description="Run the math single-step task app locally")
+    parser.add_argument("--host", default="0.0.0.0")
+    parser.add_argument("--port", type=int, default=8101)
+    parser.add_argument("--reload", action="store_true", help="Enable uvicorn autoreload")
+    parser.add_argument(
+        "--env-file",
+        action="append",
+        default=[],
+        help="Path to .env file to load (can be specified multiple times)",
+    )
+    args = parser.parse_args()
+    run_task_app(
+        build_config,
+        host=args.host,
+        port=args.port,
+        reload=args.reload,
+        env_files=args.env_file or [],
+    )

examples/run_crafter_demo.sh CHANGED Viewed

@@ -4,7 +4,7 @@
 # This script demonstrates a reactive agent in the Crafter environment
 echo "🚀 Starting Crafter agent demo with Gemini 1.5 Flash..."
-echo "Make sure the synth-ai service is running: uvx synth-ai serve"
+echo "Make sure the synth-ai service is running: uvx synth-ai deploy --runtime uvicorn"
 echo ""
-uv run python -m synth_ai.environments.examples.crafter_classic.agent_demos.test_crafter_react_agent --model gemini-1.5-flash
+uv run python -m synth_ai.environments.examples.crafter_classic.agent_demos.test_crafter_react_agent --model gemini-1.5-flash

examples/sft/README.md CHANGED Viewed

@@ -25,9 +25,9 @@ You can generate traces with the Crafter task app and then export them to SFT JS
 ```bash
 # Serve the task app locally with tracing enabled (example)
-uvx synth-ai serve grpo-crafter \
+uvx synth-ai deploy --runtime uvicorn grpo-crafter \
   --trace traces/v3 \
-  --trace-db traces/v3/synth_ai.db \
+  --trace-db traces/v3/task_app_traces_<timestamp>.db \
   --port 8001
 # Or run traced local rollouts to accumulate data
@@ -36,9 +36,9 @@ uv run python examples/warming_up_to_rl/run_local_rollout_traced.py \
 # Export SFT dataset from the trace DB
 uv run python examples/warming_up_to_rl/export_trace_sft.py \
-  --db traces/v3/synth_ai.db \
+  --db traces/v3/task_app_traces_<timestamp>.db \
   --min-unique 0 \
-  --output examples/sft/ft_data/crafter_traces.jsonl
+  --output examples/sft/ft_data/crafter_sft.jsonl
 ```
 Notes:
@@ -56,7 +56,7 @@ Use the standard CLI. Do not use a custom Python finetuning script. Point the CL
 uvx synth-ai train \
   --type sft \
   --config examples/sft/configs/crafter_lora_qwen0p6b.toml \
-  --dataset examples/sft/ft_data/crafter_traces.jsonl \
+  --dataset examples/sft/ft_data/crafter_sft.jsonl \
   --env-file /Users/joshpurtell/Documents/GitHub/monorepo/backend/.env.dev
 ```
@@ -76,7 +76,7 @@ Full finetuning updates all weights and uses a near-identical CLI flow with the
 uvx synth-ai train \
   --type sft \
   --config examples/sft/configs/crafter_fft_qwen0p6b.toml \
-  --dataset examples/sft/ft_data/crafter_traces.jsonl \
+  --dataset examples/sft/ft_data/crafter_sft.jsonl \
   --env-file /Users/joshpurtell/Documents/GitHub/monorepo/backend/.env.dev
 ```

examples/sft/configs/crafter_fft_qwen0p6b.toml CHANGED Viewed

@@ -1,7 +1,12 @@
+[algorithm]
+type = "offline"
+method = "sft"
+variety = "fft"
 [job]
 model = "Qwen/Qwen3-0.6B"
 # Prefer passing --dataset at runtime for repeatability
-# data = "examples/sft/ft_data/crafter_traces.jsonl"
+# data = "examples/sft/ft_data/crafter_sft.jsonl"
 [compute]
 gpu_type = "H100"
@@ -11,7 +16,7 @@ nodes = 1
 [data]
 topology = {}
 # Optional validation set if you have one locally
-# validation_path = "examples/sft/ft_data/crafter_traces.val.jsonl"
+# validation_path = "examples/sft/ft_data/crafter_sft.val.jsonl"
 [training]
 mode = "sft_offline"

examples/sft/configs/crafter_lora_qwen0p6b.toml CHANGED Viewed

@@ -1,7 +1,12 @@
+[algorithm]
+type = "offline"
+method = "sft"
+variety = "qlora"
 [job]
 model = "Qwen/Qwen3-0.6B"
 # Optionally set here, but prefer passing --dataset at runtime
-# data = "examples/sft/ft_data/crafter_traces.jsonl"
+# data = "examples/sft/ft_data/crafter_sft.jsonl"
 [compute]
 gpu_type = "H100"
@@ -12,7 +17,7 @@ nodes = 1
 # Forwarded into metadata.effective_config
 topology = {}
 # Optional validation set if you have one locally
-# validation_path = "examples/sft/ft_data/crafter_traces.val.jsonl"
+# validation_path = "examples/sft/ft_data/crafter_sft.val.jsonl"
 [training]
 mode = "lora"
@@ -42,4 +47,3 @@ fsdp = false
 bf16 = true
 fp16 = false
 activation_checkpointing = true

examples/sft/evaluate.py CHANGED Viewed

@@ -11,6 +11,7 @@ from __future__ import annotations
 import argparse
 import asyncio
 import os
+from contextlib import suppress
 from dataclasses import dataclass
 from typing import Any
@@ -104,10 +105,8 @@ async def main() -> None:
     for r in results:
         ers = r.get("episode_returns") or []
         if isinstance(ers, list) and ers:
-            try:
+            with suppress(Exception):
                 flat_returns.append(float(ers[0]))
-            except Exception:
-                pass
     if flat_returns:
         mean_ret = sum(flat_returns) / len(flat_returns)
         print(f"mean_return={mean_ret:.3f} over {len(flat_returns)} episodes")
@@ -116,4 +115,3 @@ async def main() -> None:
 if __name__ == "__main__":
     asyncio.run(main())

examples/sft/export_dataset.py CHANGED Viewed

@@ -20,12 +20,17 @@ from examples.warming_up_to_rl.export_trace_sft import (
     parse_event_filters,
     write_jsonl,
 )
+from synth_ai.tracing_v3.constants import TRACE_DB_DIR, canonical_trace_db_name
 def main() -> None:
     p = argparse.ArgumentParser(description=__doc__)
-    p.add_argument("--db", type=Path, default=Path("traces/v3/synth_ai.db"))
-    p.add_argument("--output", type=Path, default=Path("examples/sft/ft_data/crafter_traces.jsonl"))
+    p.add_argument(
+        "--db",
+        type=Path,
+        default=TRACE_DB_DIR / canonical_trace_db_name(),
+    )
+    p.add_argument("--output", type=Path, default=Path("examples/sft/ft_data/crafter_sft.jsonl"))
     p.add_argument("--model", action="append", dest="models")
     p.add_argument("--provider", action="append", dest="providers")
     p.add_argument("--min-unique", type=int, default=0)
@@ -113,5 +118,3 @@ def main() -> None:
 if __name__ == "__main__":
     main()

examples/swe/task_app/README.md CHANGED Viewed

@@ -28,17 +28,17 @@ endpoints.
 ## Using the task app
 ```
-uvx synth-ai serve swe-mini --port 8020
+uvx synth-ai deploy --runtime uvicorn swe-mini --port 8020
 ```
 ### Recommended: non-interactive serve + .env
 ```bash
-uvx synth-ai serve swe-mini \
+uvx synth-ai deploy --runtime uvicorn swe-mini \
   --port 8020 \
   --env-file .env \
   --trace traces/v3 \
-  --trace-db traces/v3/synth_ai.db
+  --trace-db traces/v3/task_app_traces_<timestamp>.db
 ```
 This avoids interactive prompts (useful for CI) and loads `ENVIRONMENT_API_KEY`, `OPENAI_API_KEY`, etc. from `.env`.
@@ -60,6 +60,36 @@ Execution is handled by mini-swe's environment classes. Configure execution via
 `SWE_MINI_ENVIRONMENT_CLASS` (`local`, `docker`, `singularity`, …) and pass
 additional keyword arguments with `SWE_MINI_ENVIRONMENT_KWARGS` (JSON).
+### Morph Cloud backend
+The task app now ships with a Morph-powered environment class so you can run
+mini-SWE rollouts in managed sandboxes. When `MORPH_API_KEY` is present the app
+defaults to this backend automatically unless you override
+`SWE_MINI_ENVIRONMENT_CLASS`.
+1. Install the optional dependencies: `pip install "synth-ai[swe]"`.
+2. Export your API key: `export MORPH_API_KEY=...`.
+3. Point the task app at Morph by setting:
+   ```bash
+   export SWE_MINI_ENVIRONMENT_CLASS=morph
+   export SWE_MINI_ENVIRONMENT_KWARGS='{
+     "snapshot_id": "snap_your_pre_baked_swebench_image",
+     "cwd": "/workspace/swebench",
+     "env": {"PIP_PROGRESS_BAR": "off"},
+     "metadata": {"project": "synth-ai", "task": "swe-mini"}
+   }'
+   ```
+   If you do not have a pre-built snapshot, provide `"image_id"` (defaults to
+   `morphvm-minimal`) along with resource hints (`"vcpus"`, `"memory_mb"`,
+   `"disk_mb"`). You can also set `SWE_MINI_MORPH_SNAPSHOT_ID` globally.
+During cleanup the backend deletes the remote workspace and stops the Morph
+instance automatically. All shell commands (including submissions) now execute
+inside the Morph sandbox, enabling RL workflows that require persistent remote
+compute.
 ### Tracing & SFT
 Tracing works the same as Crafter; pass `--trace` / `--trace-db` to the CLI or

examples/swe/task_app/grpo_swe_mini.py CHANGED Viewed

@@ -404,6 +404,10 @@ def _ensure_env_has_task(
         if not instance_id:
             raise ValueError("mini-swe rollout request requires env.config.instance_id")
         config["task"] = dataset.get(instance_id)
+    env_cfg = dict(config.get("environment") or {})
+    if "environment_class" not in env_cfg and os.getenv("MORPH_API_KEY"):
+        env_cfg["environment_class"] = "morph"
+    config["environment"] = env_cfg
     return env_spec.model_copy(update={"config": config})
@@ -556,7 +560,6 @@ register_task_app(
         description="mini-swe-agent task app with rollout + proxy endpoints",
         config_factory=build_config,
         aliases=("mini-swe", "swe-mini-task"),
-        env_files=(str(REPO_ROOT / "backend" / ".env.dev"),),
         modal=ModalDeploymentConfig(
             app_name="swe-mini-task-app",
             python_version="3.11",

examples/swe/task_app/grpo_swe_mini_task_app.py CHANGED Viewed

@@ -114,23 +114,11 @@ if __name__ == "__main__":
     parser.add_argument("--host", default="0.0.0.0")
     parser.add_argument("--port", type=int, default=8020)
     parser.add_argument("--reload", action="store_true", help="Enable uvicorn autoreload")
-    parser.add_argument(
-        "--env-file",
-        action="append",
-        default=[],
-        help="Additional .env files to load before startup",
-    )
     args = parser.parse_args()
-    default_env = Path(__file__).resolve().parents[4] / "backend" / ".env.dev"
-    env_files = [str(default_env)] if default_env.exists() else []
-    env_files.extend(args.env_file or [])
     run_task_app(
         build_task_app_config,
         host=args.host,
         port=args.port,
         reload=args.reload,
-        env_files=env_files,
     )

examples/swe/task_app/hosted/envs/crafter/react_agent.py CHANGED Viewed

@@ -46,7 +46,7 @@ class CrafterReActAgent:
             "- Always return a single tool call: interact_many({actions: [...]})\n"
             "- Use 2–5 actions per call; prefer long movement sequences to explore.\n"
             "- Mix in 'do' only when it makes sense (tree, stone, animal, enemy nearby).\n"
-            "- Do not spam the same exact sequence twice in a row—explore in varied directions.\n\n"
+            "\n"
             "Available actions: noop, move_up, move_down, move_left, move_right, do (interact), sleep, "
             "place_stone, place_table, place_furnace, place_plant, make_wood_pickaxe, make_stone_pickaxe, "
             "make_iron_pickaxe, make_wood_sword, make_stone_sword, make_iron_sword\n"

examples/swe/task_app/hosted/envs/mini_swe/environment.py CHANGED Viewed

@@ -18,6 +18,7 @@ from typing import Any
 from minisweagent.environments import get_environment
 from synth_ai.environments.environment.tools import EnvToolCall
+from examples.swe.task_app.morph_backend import MorphSandboxBackend
 from .shared import summarise_history
 from .tools import TOOLS_SCHEMA
@@ -25,8 +26,9 @@ logger = logging.getLogger(__name__)
 def _environment_type_from_config(config: dict[str, Any]) -> str:
+    default = "morph" if os.getenv("MORPH_API_KEY") else "local"
     value = (config or {}).get("environment_class") or os.getenv(
-        "SWE_MINI_ENVIRONMENT_CLASS", "local"
+        "SWE_MINI_ENVIRONMENT_CLASS", default
     )
     return str(value).strip() or "local"
@@ -91,6 +93,7 @@ class MiniSweEnvironmentWrapper:
         self._local_workspace_dir: Path | None = None
         self._remote_workspace: str | None = None
         self._cleanup_workspace = False
+        self._using_morph_backend = False
         if self.environment_type == "local":
             workspace = self._prepare_local_workspace(kwargs)
@@ -117,11 +120,11 @@ class MiniSweEnvironmentWrapper:
             timeout = self.env_config.get("timeout")
             if timeout and "timeout" not in kwargs:
                 kwargs["timeout"] = int(timeout)
-            if self.repo_url and "image" not in kwargs:
+            if self.environment_type in {"docker", "bubblewrap"} and self.repo_url and "image" not in kwargs:
                 image = self.metadata.get("image_name") or os.getenv("SWE_MINI_DOCKER_IMAGE")
                 if image:
                     kwargs["image"] = image
-            if self.environment_type in {"docker", "bubblewrap"}:
+            if self.environment_type in {"docker", "bubblewrap", "morph"}:
                 remote_env = dict(kwargs.get("env") or {})
                 remote_env.setdefault("GIT_TERMINAL_PROMPT", "0")
                 kwargs["env"] = remote_env
@@ -131,13 +134,34 @@ class MiniSweEnvironmentWrapper:
             self.environment_type,
             kwargs,
         )
-        self.env = get_environment(
-            {
-                "environment_class": self.environment_type,
-                **kwargs,
-            },
-            default_type="local",
-        )
+        if self.environment_type == "morph":
+            morph_kwargs = dict(kwargs)
+            image_value = morph_kwargs.pop("image", None)
+            if image_value and "image_id" not in morph_kwargs:
+                morph_kwargs["image_id"] = image_value
+            timeout_value = morph_kwargs.pop("timeout", None)
+            if timeout_value is not None and "startup_timeout" not in morph_kwargs:
+                try:
+                    morph_kwargs["startup_timeout"] = int(timeout_value)
+                except Exception:
+                    logger.warning("Invalid timeout value for morph backend: %r", timeout_value)
+            metadata_override = morph_kwargs.pop("metadata", {}) or {}
+            metadata_payload = {
+                "app": "swe-mini",
+                "instance_id": self.instance_id,
+            }
+            metadata_payload.update({str(k): str(v) for k, v in dict(metadata_override).items()})
+            morph_kwargs["metadata"] = metadata_payload
+            self.env = MorphSandboxBackend(**morph_kwargs)
+            self._using_morph_backend = True
+        else:
+            self.env = get_environment(
+                {
+                    "environment_class": self.environment_type,
+                    **kwargs,
+                },
+                default_type="local",
+            )
         if self.environment_type != "local":
             self._bootstrap_remote_workspace()
@@ -181,6 +205,9 @@ class MiniSweEnvironmentWrapper:
             with contextlib.suppress(Exception):
                 self.env.execute(f"rm -rf {shlex.quote(self._remote_workspace)}")
         self._remote_workspace = None
+        if self._using_morph_backend and hasattr(self.env, "close"):
+            with contextlib.suppress(Exception):
+                self.env.close()
     def _resolve_repo_url(self, metadata: dict[str, Any]) -> str | None:
         candidates = [
@@ -776,7 +803,7 @@ class MiniSweEnvironmentWrapper:
             or os.getenv("SWE_REX_MODAL_SANDBOX_KWARGS")
         )
         modal_kwargs: dict[str, Any] = {}
-        if isinstance(modal_kwargs_raw, (dict, list)):
+        if isinstance(modal_kwargs_raw, dict | list):
             modal_kwargs = dict(modal_kwargs_raw or {})
         elif isinstance(modal_kwargs_raw, str) and modal_kwargs_raw.strip():
             try:
@@ -841,9 +868,9 @@ class MiniSweEnvironmentWrapper:
             instance_image_tag=instance_image_tag,
             env_image_tag=env_image_tag,
             model_name=model_name,
-            Command=Command,
-            WriteFileRequest=WriteFileRequest,
-            ReadFileRequest=ReadFileRequest,
+            command_cls=Command,
+            write_file_request_cls=WriteFileRequest,
+            read_file_request_cls=ReadFileRequest,
         )
         try:
             return self._run_coroutine_blocking(coro)
@@ -867,9 +894,9 @@ class MiniSweEnvironmentWrapper:
         instance_image_tag: str,
         env_image_tag: str,
         model_name: str,
-        Command,
-        WriteFileRequest,
-        ReadFileRequest,
+        command_cls,
+        write_file_request_cls,
+        read_file_request_cls,
     ) -> dict[str, Any]:
         deployment = deployment_config.get_deployment()
         await deployment.start()
@@ -880,7 +907,7 @@ class MiniSweEnvironmentWrapper:
             # Ensure working directory exists.
             mkdir_resp = await runtime.execute(
-                Command(command=["mkdir", "-p", remote_root], timeout=60, shell=False)
+                command_cls(command=["mkdir", "-p", remote_root], timeout=60, shell=False)
             )
             if mkdir_resp.exit_code not in (0, None):
                 logger.warning("Failed to ensure remote directory %s (exit=%s)", remote_root, mkdir_resp.exit_code)
@@ -888,8 +915,8 @@ class MiniSweEnvironmentWrapper:
             # Upload dataset & predictions.
             dataset_blob = json.dumps([instance], ensure_ascii=False)
             predictions_blob = json.dumps({instance_id: prediction}, ensure_ascii=False)
-            await runtime.write_file(WriteFileRequest(path=dataset_remote_path, content=dataset_blob))
-            await runtime.write_file(WriteFileRequest(path=predictions_remote_path, content=predictions_blob))
+            await runtime.write_file(write_file_request_cls(path=dataset_remote_path, content=dataset_blob))
+            await runtime.write_file(write_file_request_cls(path=predictions_remote_path, content=predictions_blob))
             eval_cmd = [
                 "python",
@@ -921,7 +948,7 @@ class MiniSweEnvironmentWrapper:
             command_timeout = max(eval_timeout + 900, 1200)
             response = await runtime.execute(
-                Command(
+                command_cls(
                     command=eval_cmd,
                     timeout=command_timeout,
                     cwd=remote_root,
@@ -945,7 +972,7 @@ class MiniSweEnvironmentWrapper:
                 for filename in ("report.json", "test_output.txt", "run_instance.log", "patch.diff"):
                     remote_path = f"{remote_log_dir}/{filename}"
                     try:
-                        content = await runtime.read_file(ReadFileRequest(path=remote_path))
+                        content = await runtime.read_file(read_file_request_cls(path=remote_path))
                     except Exception:
                         continue
                     if getattr(content, "content", None):
@@ -1073,7 +1100,7 @@ class MiniSweEnvironmentWrapper:
             return value
         if isinstance(value, str):
             return value.strip().lower() in {"1", "true", "yes", "on"}
-        if isinstance(value, (int, float)):
+        if isinstance(value, int | float):
             return bool(value)
         return False  # pragma: no cover - defensive default

examples/swe/task_app/hosted/inference/openai_client.py CHANGED Viewed

@@ -156,13 +156,13 @@ class OpenAIClient:
             keys_preview = sorted(processed_request.keys())
             logger.info(f"Request keys: {keys_preview}")
-        # Final hard-guard for OpenAI: ensure unsupported field is not present
+        # Final hard-guard for OpenAI/Groq: ensure unsupported field is not present
         try:
-            if "openai" in url.lower() and "stop_after_tool_calls" in processed_request:
+            low_url = url.lower()
+            if ("openai" in low_url or "groq.com" in low_url or "/proxy/groq" in low_url) and "stop_after_tool_calls" in processed_request:
                 processed_request.pop("stop_after_tool_calls", None)
-                logger.info("Removed stop_after_tool_calls for OpenAI request")
+                logger.info("Removed stop_after_tool_calls for Groq/OpenAI request")
             # Groq-specific requirement: when using JSON mode, one of the messages must contain the word 'json'
-            low_url = url.lower()
             if ("groq.com" in low_url or "/openai" in low_url) and isinstance(
                 processed_request, dict
             ):

examples/swe/task_app/hosted/policy_routes.py CHANGED Viewed

@@ -343,8 +343,6 @@ async def step_policy(
             inf_req = meta["inference_request"]
             msgs = inf_req["messages"]
             model_name = inf_req.get("model") or getattr(policy, "model", None) or ""
-            system_messages: list[str] = []
-            user_messages: list[str] = []
             if msgs and len(msgs) > 0 and msgs[0]["role"] == "system":
                 sys_text = msgs[0]["content"]
                 policy_name = getattr(policy, "name", "") or type(policy).__name__.lower()

examples/swe/task_app/hosted/rollout.py CHANGED Viewed

@@ -888,14 +888,6 @@ async def execute_rollout(
             logger.debug(f"TRACER_FACTORY_FAIL: {exc}")
     tracing_context = RolloutTracingContext(tracer_instance, request, req)
     await tracing_context.start_session()
-    # Print whether tracing is active for this rollout
-    try:
-        print(
-            f"[rollout] tracing enabled={bool(tracing_context.enabled)} run_id={request.run_id}",
-            flush=True,
-        )
-    except Exception:
-        pass
     # Register run
     registry.register_run(request.run_id)

synth-ai 0.2.14__py3-none-any.whl → 0.2.17__py3-none-any.whl

Potentially problematic release.

synth-ai 0.2.14__py3-none-any.whl → 0.2.17__py3-none-any.whl