PyPI - synth-ai - Versions diffs - 0.2.8.dev4__py3-none-any.whl → 0.2.23.dev3__py3-none-any.whl - Mend

synth-ai 0.2.8.dev4__py3-none-any.whl → 0.2.23.dev3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (889) hide show

examples/README.md +1 -0
examples/__init__.py +16 -0
examples/analyze_semantic_words.sh +17 -0
examples/baseline/banking77_baseline.py +243 -0
examples/baseline/banking77_pipeline_baseline.py +294 -0
examples/baseline/crafter_baseline.py +407 -0
examples/baseline/pokemon_red_baseline.py +326 -0
examples/baseline/simple_baseline.py +56 -0
examples/baseline/warming_up_to_rl_baseline.py +239 -0
examples/blog_posts/gepa/README.md +355 -0
examples/blog_posts/gepa/configs/banking77_gepa_local.toml +95 -0
examples/blog_posts/gepa/configs/banking77_gepa_test.toml +80 -0
examples/blog_posts/gepa/configs/banking77_mipro_local.toml +50 -0
examples/blog_posts/gepa/configs/banking77_pipeline_gepa_local.toml +101 -0
examples/blog_posts/gepa/configs/banking77_pipeline_gepa_test.toml +96 -0
examples/blog_posts/gepa/configs/hotpotqa_gepa_local.toml +57 -0
examples/blog_posts/gepa/configs/hotpotqa_gepa_qwen.toml +35 -0
examples/blog_posts/gepa/configs/hotpotqa_mipro_local.toml +51 -0
examples/blog_posts/gepa/configs/hover_gepa_local.toml +57 -0
examples/blog_posts/gepa/configs/hover_gepa_qwen.toml +35 -0
examples/blog_posts/gepa/configs/hover_mipro_local.toml +51 -0
examples/blog_posts/gepa/configs/ifbench_gepa_local.toml +57 -0
examples/blog_posts/gepa/configs/ifbench_gepa_qwen.toml +35 -0
examples/blog_posts/gepa/configs/ifbench_mipro_local.toml +51 -0
examples/blog_posts/gepa/configs/pupa_gepa_local.toml +58 -0
examples/blog_posts/gepa/configs/pupa_mipro_local.toml +52 -0
examples/blog_posts/gepa/deploy_banking77_task_app.sh +54 -0
examples/blog_posts/gepa/gepa_baseline.py +204 -0
examples/blog_posts/gepa/query_prompts_example.py +97 -0
examples/blog_posts/gepa/run_gepa_banking77.sh +112 -0
examples/blog_posts/gepa/run_gepa_banking77_pipeline.sh +163 -0
examples/blog_posts/gepa/task_apps.py +105 -0
examples/blog_posts/gepa/test_gepa_local.sh +67 -0
examples/blog_posts/gepa/verify_banking77_setup.sh +123 -0
examples/blog_posts/mipro/README.md +415 -0
examples/blog_posts/mipro/configs/banking77_mipro_local.toml +91 -0
examples/blog_posts/mipro/configs/banking77_mipro_test.toml +87 -0
examples/blog_posts/mipro/configs/banking77_pipeline_mipro_gemini_flash_lite_local.toml +98 -0
examples/blog_posts/mipro/configs/banking77_pipeline_mipro_gpt41mini_local.toml +96 -0
examples/blog_posts/mipro/configs/banking77_pipeline_mipro_local.toml +94 -0
examples/blog_posts/mipro/configs/banking77_pipeline_mipro_test.toml +170 -0
examples/blog_posts/mipro/deploy_banking77_pipeline_task_app.sh +59 -0
examples/blog_posts/mipro/deploy_banking77_task_app.sh +41 -0
examples/blog_posts/mipro/multi_step.md +79 -0
examples/blog_posts/mipro/run_mipro_banking77.sh +191 -0
examples/blog_posts/mipro/run_mipro_banking77_pipeline.sh +171 -0
examples/blog_posts/mipro/run_mipro_banking77_pipeline_gemini_flash_lite.sh +177 -0
examples/blog_posts/mipro/run_mipro_banking77_pipeline_gpt41mini.sh +173 -0
examples/blog_posts/mipro/verify_banking77_setup.sh +117 -0
examples/blog_posts/pokemon_vl/README.md +98 -0
examples/blog_posts/pokemon_vl/configs/eval_gpt5nano.toml +26 -0
examples/blog_posts/pokemon_vl/configs/eval_qwen3_vl.toml +27 -0
examples/blog_posts/pokemon_vl/configs/eval_rl_final.toml +24 -0
examples/blog_posts/pokemon_vl/configs/filter_high_reward.toml +10 -0
examples/blog_posts/pokemon_vl/configs/train_rl_from_sft.toml +43 -0
examples/blog_posts/pokemon_vl/configs/train_sft_qwen4b_vl.toml +40 -0
examples/blog_posts/pokemon_vl/extract_images.py +239 -0
examples/blog_posts/pokemon_vl/pokemon_vl_baseline.py +326 -0
examples/blog_posts/pokemon_vl/run_eval_extract_images.py +209 -0
examples/blog_posts/pokemon_vl/run_qwen_eval_extract_images.py +212 -0
examples/blog_posts/pokemon_vl/text_box_analysis.md +106 -0
examples/blog_posts/warming_up_to_rl/ARCHITECTURE.md +195 -0
examples/blog_posts/warming_up_to_rl/FINAL_TEST_RESULTS.md +127 -0
examples/blog_posts/warming_up_to_rl/INFERENCE_SUCCESS.md +132 -0
examples/blog_posts/warming_up_to_rl/README.md +158 -0
examples/blog_posts/warming_up_to_rl/SMOKE_TESTING.md +164 -0
examples/blog_posts/warming_up_to_rl/SMOKE_TEST_COMPLETE.md +253 -0
examples/blog_posts/warming_up_to_rl/configs/eval_baseline_qwen32b_10x20.toml +25 -0
examples/blog_posts/warming_up_to_rl/configs/eval_ft_qwen4b.toml +25 -0
examples/blog_posts/warming_up_to_rl/configs/eval_ft_qwen4b_10x20.toml +26 -0
examples/blog_posts/warming_up_to_rl/configs/eval_groq_qwen32b.toml +25 -0
examples/blog_posts/warming_up_to_rl/configs/eval_openai_gpt_oss_120b.toml +29 -0
examples/blog_posts/warming_up_to_rl/configs/filter_high_reward_dataset.toml +10 -0
examples/blog_posts/warming_up_to_rl/configs/smoke_test.toml +75 -0
examples/blog_posts/warming_up_to_rl/configs/train_rl_from_sft.toml +91 -0
examples/blog_posts/warming_up_to_rl/configs/train_sft_qwen4b.toml +40 -0
examples/blog_posts/warming_up_to_rl/warming_up_to_rl_baseline.py +187 -0
examples/crafter_debug_render.py +186 -0
examples/dev/qwen3_32b_qlora_4xh100.toml +45 -0
examples/gepa/banking77_pipeline_gepa.toml +96 -0
examples/gepa/multi_stage_gepa_example.toml +84 -0
examples/gepa/run_gepa_banking77_pipeline.sh +157 -0
examples/multi_step/SFT_README.md +147 -0
examples/multi_step/configs/README_verilog_rl.md +77 -0
examples/multi_step/configs/VERILOG_REWARDS.md +103 -0
examples/multi_step/configs/VERILOG_RL_CHECKLIST.md +196 -0
examples/multi_step/configs/crafter_eval_synth_qwen4b.toml +35 -0
examples/multi_step/configs/crafter_eval_text_only_groq_qwen32b.toml +36 -0
examples/multi_step/configs/crafter_rl_outcome.toml +75 -0
examples/multi_step/configs/crafter_rl_stepwise_hosted_judge.toml +145 -0
examples/multi_step/configs/crafter_rl_stepwise_shaped.toml +84 -0
examples/multi_step/configs/crafter_rl_stepwise_simple.toml +79 -0
examples/multi_step/configs/crafter_rl_stepwise_simple_NEW_FORMAT.toml +105 -0
examples/multi_step/configs/crafter_sft_qwen30b_lora.toml +62 -0
examples/multi_step/configs/crafter_synth_backend.md +40 -0
examples/multi_step/configs/verilog_eval_groq_qwen32b.toml +31 -0
examples/multi_step/configs/verilog_eval_synth_qwen8b.toml +33 -0
examples/multi_step/configs/verilog_rl_lora.toml +147 -0
examples/multi_step/convert_traces_to_sft.py +84 -0
examples/multi_step/crafter_rl_lora.md +70 -0
examples/multi_step/judges/crafter_backend_judge.py +220 -0
examples/multi_step/judges/verilog_backend_judge.py +234 -0
examples/multi_step/readme.md +48 -0
examples/multi_step/run_sft_qwen30b.sh +45 -0
examples/multi_step/sse_metrics_streaming_notes.md +357 -0
examples/multi_step/task_app_config_notes.md +494 -0
examples/multi_step/verilog_rl_lora.md +218 -0
examples/qwen_coder/README.md +102 -0
examples/qwen_coder/_shared.py +113 -0
examples/qwen_coder/configs/coder_lora_30b.toml +60 -0
examples/qwen_coder/configs/coder_lora_4b.toml +61 -0
examples/qwen_coder/configs/coder_lora_small.toml +57 -0
examples/qwen_coder/generate_dataset.py +98 -0
examples/qwen_coder/infer_ft_smoke.py +65 -0
examples/qwen_coder/infer_prod_proxy.py +73 -0
examples/qwen_coder/infer_via_synth.py +87 -0
examples/qwen_coder/scripts/infer_coder.sh +19 -0
examples/qwen_coder/scripts/train_coder_30b.sh +22 -0
examples/qwen_coder/sft_full_17b.py +103 -0
examples/qwen_coder/sft_lora_30b.py +110 -0
examples/qwen_coder/subset_jsonl.py +39 -0
examples/qwen_coder/todos.md +38 -0
examples/qwen_coder/validate_jsonl.py +60 -0
examples/qwen_vl/BUGS_AND_FIXES.md +232 -0
examples/qwen_vl/IMAGE_VALIDATION_COMPLETE.md +271 -0
examples/qwen_vl/IMAGE_VALIDATION_SUMMARY.md +260 -0
examples/qwen_vl/INFERENCE_SFT_TESTS.md +412 -0
examples/qwen_vl/NEXT_STEPS_2B.md +325 -0
examples/qwen_vl/QUICKSTART.md +327 -0
examples/qwen_vl/QUICKSTART_RL_VISION.md +110 -0
examples/qwen_vl/README.md +152 -0
examples/qwen_vl/RL_VISION_COMPLETE.md +475 -0
examples/qwen_vl/RL_VISION_TESTING.md +333 -0
examples/qwen_vl/SDK_VISION_INTEGRATION.md +328 -0
examples/qwen_vl/SETUP_COMPLETE.md +274 -0
examples/qwen_vl/VISION_TESTS_COMPLETE.md +489 -0
examples/qwen_vl/VLM_PIPELINE_COMPLETE.md +242 -0
examples/qwen_vl/__init__.py +2 -0
examples/qwen_vl/collect_data_via_cli.md +415 -0
examples/qwen_vl/collect_vision_traces.py +368 -0
examples/qwen_vl/configs/crafter_rl_vision_qwen3vl4b.toml +110 -0
examples/qwen_vl/configs/crafter_vlm_sft_example.toml +59 -0
examples/qwen_vl/configs/eval_gpt4o_mini_vision.toml +26 -0
examples/qwen_vl/configs/eval_gpt4o_vision_proper.toml +29 -0
examples/qwen_vl/configs/eval_gpt5nano_vision.toml +26 -0
examples/qwen_vl/configs/eval_qwen3vl_vision.toml +26 -0
examples/qwen_vl/configs/filter_qwen3vl_sft.toml +49 -0
examples/qwen_vl/configs/filter_vision_sft.toml +52 -0
examples/qwen_vl/configs/filter_vision_test.toml +8 -0
examples/qwen_vl/configs/sft_qwen3_vl_2b_test.toml +54 -0
examples/qwen_vl/crafter_gpt5nano_agent.py +308 -0
examples/qwen_vl/crafter_qwen_vl_agent.py +300 -0
examples/qwen_vl/run_vision_comparison.sh +61 -0
examples/qwen_vl/run_vision_sft_pipeline.sh +175 -0
examples/qwen_vl/test_image_validation.py +201 -0
examples/qwen_vl/test_sft_vision_data.py +110 -0
examples/rl/README.md +169 -0
examples/rl/configs/eval_base_qwen.toml +17 -0
examples/rl/configs/eval_rl_qwen.toml +13 -0
examples/rl/configs/rl_from_base_qwen.toml +62 -0
examples/rl/configs/rl_from_base_qwen17.toml +80 -0
examples/rl/configs/rl_from_ft_qwen.toml +37 -0
examples/rl/download_dataset.py +80 -0
examples/rl/run_eval.py +436 -0
examples/rl/run_rl_and_save.py +111 -0
examples/rl/task_app/README.md +21 -0
examples/rl/task_app/math_single_step.py +990 -0
examples/rl/task_app/math_task_app.py +111 -0
examples/run_crafter_demo.sh +10 -0
examples/sdk_prompt_learning_example.py +55 -0
examples/sft/README.md +139 -0
examples/sft/configs/crafter_fft_qwen0p6b.toml +49 -0
examples/sft/configs/crafter_lora_qwen0p6b.toml +49 -0
examples/sft/evaluate.py +117 -0
examples/sft/export_dataset.py +120 -0
examples/sft/generate_traces.py +164 -0
examples/swe/__init__.py +12 -0
examples/swe/task_app/README.md +135 -0
examples/swe/task_app/__init__.py +2 -0
examples/swe/task_app/grpo_swe_mini.py +604 -0
examples/swe/task_app/grpo_swe_mini_task_app.py +124 -0
examples/swe/task_app/hosted/README.md +173 -0
examples/swe/task_app/hosted/__init__.py +5 -0
examples/swe/task_app/hosted/branching.py +143 -0
examples/swe/task_app/hosted/environment_routes.py +1289 -0
examples/swe/task_app/hosted/envs/__init__.py +1 -0
examples/swe/task_app/hosted/envs/crafter/__init__.py +6 -0
examples/swe/task_app/hosted/envs/crafter/app.py +1 -0
examples/swe/task_app/hosted/envs/crafter/environment.py +522 -0
examples/swe/task_app/hosted/envs/crafter/policy.py +478 -0
examples/swe/task_app/hosted/envs/crafter/react_agent.py +108 -0
examples/swe/task_app/hosted/envs/crafter/shared.py +305 -0
examples/swe/task_app/hosted/envs/crafter/tools.py +47 -0
examples/swe/task_app/hosted/envs/mini_swe/__init__.py +8 -0
examples/swe/task_app/hosted/envs/mini_swe/environment.py +1191 -0
examples/swe/task_app/hosted/envs/mini_swe/policy.py +355 -0
examples/swe/task_app/hosted/envs/mini_swe/shared.py +83 -0
examples/swe/task_app/hosted/envs/mini_swe/tools.py +96 -0
examples/swe/task_app/hosted/hosted_app.py +204 -0
examples/swe/task_app/hosted/inference/__init__.py +5 -0
examples/swe/task_app/hosted/inference/openai_client.py +584 -0
examples/swe/task_app/hosted/main.py +100 -0
examples/swe/task_app/hosted/policy_routes.py +1094 -0
examples/swe/task_app/hosted/registry.py +195 -0
examples/swe/task_app/hosted/rollout.py +1905 -0
examples/swe/task_app/hosted/storage/__init__.py +5 -0
examples/swe/task_app/hosted/storage/volume.py +211 -0
examples/swe/task_app/hosted/test_agents.py +161 -0
examples/swe/task_app/hosted/test_service.py +136 -0
examples/swe/task_app/hosted/utils.py +62 -0
examples/swe/task_app/morph_backend.py +178 -0
examples/task_apps/IMAGE_ONLY_EVAL_QUICKSTART.md +258 -0
examples/task_apps/TESTING.md +275 -0
examples/task_apps/banking77/__init__.py +6 -0
examples/task_apps/banking77/banking77_task_app.py +912 -0
examples/task_apps/banking77/deploy_wrapper.py +46 -0
examples/task_apps/banking77_pipeline/__init__.py +6 -0
examples/task_apps/banking77_pipeline/banking77_pipeline_task_app.py +489 -0
examples/task_apps/banking77_pipeline/deploy_wrapper.py +50 -0
examples/task_apps/crafter/CREATE_SFT_DATASET.md +286 -0
examples/task_apps/crafter/EVAL_IMAGE_ONLY_RESULTS.md +152 -0
examples/task_apps/crafter/FILTER_COMMAND_STATUS.md +187 -0
examples/task_apps/crafter/FILTER_COMMAND_SUCCESS.md +281 -0
examples/task_apps/crafter/QUERY_EXAMPLES.md +203 -0
examples/task_apps/crafter/README_IMAGE_ONLY_EVAL.md +316 -0
examples/task_apps/crafter/eval_image_only_gpt4o.toml +28 -0
examples/task_apps/crafter/eval_text_only_groq_llama.toml +36 -0
examples/task_apps/crafter/filter_sft_dataset.toml +16 -0
examples/task_apps/crafter/task_app/README.md +42 -0
examples/task_apps/crafter/task_app/__init__.py +5 -0
examples/task_apps/crafter/task_app/grpo_crafter.py +1055 -0
examples/task_apps/crafter/task_app/grpo_crafter_task_app.py +146 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/README.md +173 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/__init__.py +5 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/branching.py +143 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/environment_routes.py +1226 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/__init__.py +1 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/crafter/__init__.py +6 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/crafter/app.py +1 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/crafter/environment.py +532 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/crafter/policy.py +583 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/crafter/react_agent.py +122 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/crafter/shared.py +305 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/crafter/tools.py +47 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/hosted_app.py +253 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/inference/__init__.py +5 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/inference/openai_client.py +999 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/main.py +100 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/policy_routes.py +1252 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/registry.py +195 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/rollout.py +2233 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/storage/__init__.py +5 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/storage/volume.py +211 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/test_agents.py +161 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/test_service.py +136 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/utils.py +411 -0
examples/task_apps/dev/pokemon_emerald/__init__.py +2 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/README.md +811 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/agent/__init__.py +120 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/agent/action.py +160 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/agent/memory.py +155 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/agent/perception.py +69 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/agent/planning.py +96 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/agent/simple.py +1502 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/agent/system_prompt.py +4 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/grab_map.py +68 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/manual.py +216 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/pokemon_env/__init__.py +35 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/pokemon_env/emerald_utils.py +631 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/pokemon_env/emulator.py +1544 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/pokemon_env/enums.py +1428 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/pokemon_env/memory_reader.py +4848 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/pokemon_env/types.py +41 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/pokemon_env/utils.py +298 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/pyproject.toml +95 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/run.py +204 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/server/app.py +2152 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/server/client.py +429 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/server/frame_server.py +155 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/README.md +78 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/run_tests.py +122 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_agent_direct.py +76 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_agent_prompts.py +413 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_battle_state_formatting.py +204 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_dialogue_detection.py +133 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_dialogue_detection_comprehensive.py +229 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_direct_agent_emulator.py +300 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_fps_adjustment_pytest.py +205 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_house_to_outside_direct.py +200 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_house_to_outside_transition.py +284 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_map_ground_truth_comparison.py +468 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_memory_map.py +575 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_server_map_validation.py +311 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_torchic_state.py +259 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/anticheat.py +372 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/checkpoint.py +296 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/error_handler.py +275 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/get_local_ip.py +22 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/helpers.py +44 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/llm_logger.py +514 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/map_formatter.py +415 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/map_stitcher.py +1763 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/map_stitcher_singleton.py +33 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/map_trimmer.py +106 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/map_visualizer.py +334 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/ocr_dialogue.py +1020 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/recording.py +188 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/state_formatter.py +1481 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/vlm.py +862 -0
examples/task_apps/dev/pokemon_emerald/modal_app.py +114 -0
examples/task_apps/dev/pokemon_emerald/task_app/README.md +81 -0
examples/task_apps/dev/pokemon_emerald/task_app/__init__.py +6 -0
examples/task_apps/dev/pokemon_emerald/task_app/pokemon_emerald.py +685 -0
examples/task_apps/enron/__init__.py +2 -0
examples/task_apps/enron/eval_groq_qwen32.toml +16 -0
examples/task_apps/enron/filter_sft.toml +5 -0
examples/task_apps/enron/task_app/README.md +14 -0
examples/task_apps/enron/task_app/__init__.py +1 -0
examples/task_apps/enron/task_app/grpo_enron.py +906 -0
examples/task_apps/enron/task_app/grpo_enron_task_app.py +146 -0
examples/task_apps/enron/tests/__init__.py +4 -0
examples/task_apps/enron/tests/conftest.py +115 -0
examples/task_apps/enron/tests/integration/__init__.py +4 -0
examples/task_apps/enron/tests/integration/test_enron_eval.py +179 -0
examples/task_apps/enron/tests/integration/test_enron_rollout.py +135 -0
examples/task_apps/enron/tests/unit/__init__.py +4 -0
examples/task_apps/enron/tests/unit/test_enron_environment.py +126 -0
examples/task_apps/gepa_benchmarks/__init__.py +7 -0
examples/task_apps/gepa_benchmarks/common.py +260 -0
examples/task_apps/gepa_benchmarks/hotpotqa_task_app.py +507 -0
examples/task_apps/gepa_benchmarks/hover_task_app.py +436 -0
examples/task_apps/gepa_benchmarks/ifbench_task_app.py +563 -0
examples/task_apps/gepa_benchmarks/pupa_task_app.py +460 -0
examples/task_apps/math/README.md +21 -0
examples/task_apps/math/math_single_step.py +1000 -0
examples/task_apps/math/math_task_app.py +115 -0
examples/task_apps/pokemon_battle/__init__.py +2 -0
examples/task_apps/pokemon_battle/modal_app.py +104 -0
examples/task_apps/pokemon_battle/task_app/README.md +68 -0
examples/task_apps/pokemon_battle/task_app/__init__.py +6 -0
examples/task_apps/pokemon_battle/task_app/pokemon_showdown.py +932 -0
examples/task_apps/pokemon_red/EVAL_IMAGE_ONLY_COMPLETE.md +283 -0
examples/task_apps/pokemon_red/EVAL_IMAGE_ONLY_STATUS.md +155 -0
examples/task_apps/pokemon_red/README.md +356 -0
examples/task_apps/pokemon_red/README_IMAGE_ONLY_EVAL.md +428 -0
examples/task_apps/pokemon_red/__init__.py +3 -0
examples/task_apps/pokemon_red/eval_image_only_gpt4o.toml +30 -0
examples/task_apps/pokemon_red/eval_pokemon_red_policy.py +224 -0
examples/task_apps/pokemon_red/pallet_town_rl_config.toml +75 -0
examples/task_apps/pokemon_red/task_app.py +1048 -0
examples/task_apps/pokemon_red/test_pallet_town_rewards.py +193 -0
examples/task_apps/sokoban/README.md +306 -0
examples/task_apps/sokoban/__init__.py +3 -0
examples/task_apps/sokoban/eval_groq_qwen32.toml +16 -0
examples/task_apps/sokoban/eval_openai_gpt5.toml +16 -0
examples/task_apps/sokoban/filter_sft.toml +5 -0
examples/task_apps/sokoban/task_app.py +1058 -0
examples/task_apps/sokoban/tests/__init__.py +4 -0
examples/task_apps/sokoban/tests/conftest.py +113 -0
examples/task_apps/sokoban/tests/integration/__init__.py +4 -0
examples/task_apps/sokoban/tests/integration/test_sokoban_eval.py +57 -0
examples/task_apps/sokoban/tests/integration/test_sokoban_rollout.py +198 -0
examples/task_apps/sokoban/tests/unit/__init__.py +4 -0
examples/task_apps/sokoban/tests/unit/test_sokoban_environment.py +114 -0
examples/task_apps/verilog/__init__.py +1 -0
examples/task_apps/verilog/eval_groq_qwen32b.toml +22 -0
examples/task_apps/verilog/filter_sft.toml +5 -0
examples/task_apps/verilog/task_app/README.md +12 -0
examples/task_apps/verilog/task_app/__init__.py +1 -0
examples/task_apps/verilog/task_app/grpo_verilog.py +1166 -0
examples/task_apps/verilog/task_app/grpo_verilog_task_app.py +145 -0
examples/task_apps/verilog/tests/__init__.py +4 -0
examples/task_apps/verilog/tests/conftest.py +115 -0
examples/task_apps/verilog/tests/integration/__init__.py +4 -0
examples/task_apps/verilog/tests/integration/test_verilog_eval.py +181 -0
examples/task_apps/verilog/tests/integration/test_verilog_rollout.py +55 -0
examples/task_apps/verilog/tests/unit/__init__.py +4 -0
examples/task_apps/verilog/tests/unit/test_verilog_scoring.py +118 -0
examples/tunnel_gepa_banking77/README.md +106 -0
examples/tunnel_gepa_banking77/banking77_gepa_tunnel.toml +95 -0
examples/tunnel_gepa_banking77/keep_tunnel_running.py +60 -0
examples/tunnel_gepa_banking77/run_gepa_with_tunnel.sh +226 -0
examples/vlm/PROPOSAL.md +53 -0
examples/vlm/README.md +68 -0
examples/vlm/configs/crafter_vlm_gpt4o.toml +49 -0
examples/vlm/crafter_image_only_agent.py +207 -0
examples/vlm/crafter_openai_vlm_agent.py +275 -0
examples/vlm/filter_image_rows.py +63 -0
examples/vlm/run_crafter_vlm_benchmark.py +316 -0
examples/warming_up_to_rl/_utils.py +92 -0
examples/warming_up_to_rl/analyze_trace_db.py +422 -0
examples/warming_up_to_rl/configs/crafter_fft.toml +53 -0
examples/warming_up_to_rl/configs/crafter_fft_4b.toml +54 -0
examples/warming_up_to_rl/configs/eval_fft_qwen4b.toml +22 -0
examples/warming_up_to_rl/configs/eval_groq_qwen32b.toml +15 -0
examples/warming_up_to_rl/configs/eval_modal_qwen4b.toml +24 -0
examples/warming_up_to_rl/configs/eval_stepwise_complex.toml +35 -0
examples/warming_up_to_rl/configs/eval_stepwise_consistent.toml +26 -0
examples/warming_up_to_rl/configs/eval_stepwise_per_achievement.toml +36 -0
examples/warming_up_to_rl/configs/eval_stepwise_simple.toml +32 -0
examples/warming_up_to_rl/configs/rl_from_base_qwen4b.toml +85 -0
examples/warming_up_to_rl/configs/rl_from_ft.toml +58 -0
examples/warming_up_to_rl/export_trace_sft.py +837 -0
examples/warming_up_to_rl/groq_test.py +97 -0
examples/warming_up_to_rl/manage_secrets.py +131 -0
examples/warming_up_to_rl/old/event_rewards.md +234 -0
examples/warming_up_to_rl/old/notes.md +73 -0
examples/warming_up_to_rl/readme.md +110 -0
examples/warming_up_to_rl/run_eval.py +736 -0
examples/warming_up_to_rl/run_fft_and_save.py +380 -0
examples/warming_up_to_rl/run_local_rollout.py +239 -0
examples/warming_up_to_rl/run_local_rollout_modal.py +248 -0
examples/warming_up_to_rl/run_local_rollout_parallel.py +405 -0
examples/warming_up_to_rl/run_local_rollout_traced.py +477 -0
examples/warming_up_to_rl/run_rl_and_save.py +124 -0
examples/warming_up_to_rl/run_rollout_remote.py +156 -0
examples/warming_up_to_rl/task_app/README.md +42 -0
examples/warming_up_to_rl/task_app/grpo_crafter.py +876 -0
examples/warming_up_to_rl/task_app/grpo_crafter_task_app.py +135 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/README.md +173 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/__init__.py +5 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/branching.py +143 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/environment_routes.py +1226 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/__init__.py +1 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/__init__.py +6 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/app.py +1 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/environment.py +522 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/policy.py +454 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/react_agent.py +108 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/shared.py +305 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/tools.py +47 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/hosted_app.py +253 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/__init__.py +5 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/openai_client.py +729 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/main.py +100 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/policy_routes.py +1114 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/registry.py +195 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/rollout.py +1891 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/storage/__init__.py +5 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/storage/volume.py +211 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/test_agents.py +161 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/test_service.py +137 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/utils.py +129 -0
examples/workflows/math_rl/configs/eval_base_qwen.toml +15 -0
examples/workflows/math_rl/configs/eval_rl_qwen.toml +11 -0
examples/workflows/math_rl/configs/rl_from_base_qwen.toml +62 -0
examples/workflows/math_rl/configs/rl_from_base_qwen17.toml +80 -0
examples/workflows/math_rl/configs/rl_from_ft_qwen.toml +35 -0
examples/workflows/math_rl/download_dataset.py +80 -0
examples/workflows/math_rl/run_eval.py +436 -0
examples/workflows/math_rl/run_rl_and_save.py +111 -0
synth_ai/__init__.py +47 -23
synth_ai/_utils/__init__.py +47 -0
synth_ai/_utils/base_url.py +10 -0
synth_ai/_utils/http.py +10 -0
synth_ai/_utils/prompts.py +10 -0
synth_ai/_utils/task_app_state.py +12 -0
synth_ai/_utils/user_config.py +10 -0
synth_ai/api/models/supported.py +514 -0
synth_ai/api/train/__init__.py +63 -0
synth_ai/api/train/builders.py +473 -0
synth_ai/api/train/cli.py +1185 -0
synth_ai/api/train/config_finder.py +246 -0
synth_ai/api/train/configs/__init__.py +65 -0
synth_ai/api/train/configs/prompt_learning.py +496 -0
synth_ai/api/train/configs/rl.py +188 -0
synth_ai/api/train/configs/sft.py +99 -0
synth_ai/api/train/configs/shared.py +81 -0
synth_ai/api/train/env_resolver.py +352 -0
synth_ai/api/train/pollers.py +91 -0
synth_ai/api/train/prompt_learning.py +425 -0
synth_ai/api/train/sft.py +390 -0
synth_ai/api/train/supported_algos.py +147 -0
synth_ai/api/train/task_app.py +195 -0
synth_ai/api/train/utils.py +244 -0
synth_ai/api/train/validators.py +1117 -0
synth_ai/api/tunnel.py +49 -0
synth_ai/auth/credentials.py +94 -0
synth_ai/baseline/__init__.py +25 -0
synth_ai/baseline/config.py +209 -0
synth_ai/baseline/discovery.py +214 -0
synth_ai/baseline/execution.py +146 -0
synth_ai/cfgs.py +227 -0
synth_ai/cli/__init__.py +90 -45
synth_ai/cli/_modal_wrapper.py +31 -0
synth_ai/cli/_storage.py +20 -0
synth_ai/cli/_typer_patch.py +47 -0
synth_ai/cli/_validate_task_app.py +29 -0
synth_ai/cli/balance.py +16 -4
synth_ai/cli/calc.py +36 -21
synth_ai/cli/claude.py +70 -0
synth_ai/cli/codex.py +267 -0
synth_ai/cli/commands/__init__.py +18 -0
synth_ai/cli/commands/baseline/__init__.py +12 -0
synth_ai/cli/commands/baseline/core.py +637 -0
synth_ai/cli/commands/baseline/list.py +93 -0
synth_ai/cli/commands/demo/__init__.py +6 -0
synth_ai/cli/commands/demo/core.py +163 -0
synth_ai/cli/commands/eval/__init__.py +19 -0
synth_ai/cli/commands/eval/core.py +1112 -0
synth_ai/cli/commands/eval/errors.py +81 -0
synth_ai/cli/commands/eval/validation.py +133 -0
synth_ai/cli/commands/filter/__init__.py +12 -0
synth_ai/cli/commands/filter/core.py +424 -0
synth_ai/cli/commands/filter/errors.py +55 -0
synth_ai/cli/commands/filter/validation.py +77 -0
synth_ai/cli/commands/help/__init__.py +185 -0
synth_ai/cli/commands/help/core.py +72 -0
synth_ai/cli/commands/smoke/__init__.py +7 -0
synth_ai/cli/commands/smoke/core.py +1437 -0
synth_ai/cli/commands/status/__init__.py +66 -0
synth_ai/cli/commands/status/client.py +192 -0
synth_ai/cli/commands/status/config.py +92 -0
synth_ai/cli/commands/status/errors.py +20 -0
synth_ai/cli/commands/status/formatters.py +164 -0
synth_ai/cli/commands/status/subcommands/__init__.py +9 -0
synth_ai/cli/commands/status/subcommands/files.py +79 -0
synth_ai/cli/commands/status/subcommands/jobs.py +334 -0
synth_ai/cli/commands/status/subcommands/models.py +79 -0
synth_ai/cli/commands/status/subcommands/pricing.py +22 -0
synth_ai/cli/commands/status/subcommands/runs.py +81 -0
synth_ai/cli/commands/status/subcommands/session.py +183 -0
synth_ai/cli/commands/status/subcommands/summary.py +47 -0
synth_ai/cli/commands/status/subcommands/usage.py +203 -0
synth_ai/cli/commands/status/utils.py +114 -0
synth_ai/cli/commands/train/__init__.py +53 -0
synth_ai/cli/commands/train/core.py +21 -0
synth_ai/cli/commands/train/errors.py +117 -0
synth_ai/cli/commands/train/judge_schemas.py +200 -0
synth_ai/cli/commands/train/judge_validation.py +305 -0
synth_ai/cli/commands/train/validation.py +386 -0
synth_ai/cli/demo.py +32 -140
synth_ai/cli/deploy.py +233 -0
synth_ai/cli/eval/__init__.py +36 -0
synth_ai/cli/eval/core.py +5 -0
synth_ai/cli/eval/errors.py +31 -0
synth_ai/cli/eval/validation.py +5 -0
synth_ai/cli/filter/__init__.py +28 -0
synth_ai/cli/filter/core.py +5 -0
synth_ai/cli/filter/errors.py +23 -0
synth_ai/cli/filter/validation.py +5 -0
synth_ai/cli/legacy_root_backup.py +28 -22
synth_ai/cli/lib/__init__.py +10 -0
synth_ai/cli/lib/task_app_discovery.py +7 -0
synth_ai/cli/lib/task_app_env.py +518 -0
synth_ai/cli/mcp.py +34 -0
synth_ai/cli/modal_serve/__init__.py +12 -0
synth_ai/cli/modal_serve/core.py +14 -0
synth_ai/cli/modal_serve/errors.py +8 -0
synth_ai/cli/modal_serve/validation.py +11 -0
synth_ai/cli/opencode.py +256 -0
synth_ai/cli/recent.py +13 -7
synth_ai/cli/rl_demo.py +166 -114
synth_ai/cli/root.py +143 -112
synth_ai/cli/serve/__init__.py +12 -0
synth_ai/cli/serve/core.py +14 -0
synth_ai/cli/serve/errors.py +8 -0
synth_ai/cli/serve/validation.py +11 -0
synth_ai/cli/setup.py +49 -0
synth_ai/cli/status.py +7 -125
synth_ai/cli/task_app_deploy.py +7 -0
synth_ai/cli/task_app_list.py +25 -0
synth_ai/cli/task_app_modal_serve.py +11 -0
synth_ai/cli/task_app_serve.py +11 -0
synth_ai/cli/task_apps.py +3134 -0
synth_ai/cli/traces.py +9 -5
synth_ai/cli/train/__init__.py +12 -0
synth_ai/cli/train/core.py +21 -0
synth_ai/cli/train/errors.py +8 -0
synth_ai/cli/train/validation.py +24 -0
synth_ai/cli/train.py +5 -0
synth_ai/cli/turso.py +73 -0
synth_ai/cli/watch.py +13 -18
synth_ai/demos/__init__.py +10 -0
synth_ai/demos/core/__init__.py +28 -1
synth_ai/demos/core/cli.py +745 -416
synth_ai/demos/crafter/__init__.py +1 -0
synth_ai/demos/crafter/crafter_fft_4b.toml +55 -0
synth_ai/demos/crafter/grpo_crafter_task_app.py +185 -0
synth_ai/demos/crafter/rl_from_base_qwen4b.toml +74 -0
synth_ai/demos/demo_registry.py +176 -0
synth_ai/demos/demo_task_apps/__init__.py +7 -1
synth_ai/demos/demo_task_apps/core.py +75 -37
synth_ai/demos/demo_task_apps/crafter/__init__.py +1 -0
synth_ai/demos/demo_task_apps/crafter/configs/crafter_fft_4b.toml +53 -0
synth_ai/demos/demo_task_apps/crafter/configs/rl_from_base_qwen4b.toml +73 -0
synth_ai/demos/demo_task_apps/crafter/grpo_crafter_task_app.py +184 -0
synth_ai/demos/demo_task_apps/math/_common.py +1 -2
synth_ai/demos/demo_task_apps/math/app.py +2 -1
synth_ai/demos/demo_task_apps/math/config.toml +55 -110
synth_ai/demos/demo_task_apps/math/deploy_modal.py +3 -6
synth_ai/demos/demo_task_apps/math/modal_task_app.py +491 -166
synth_ai/demos/demo_task_apps/math/task_app_entry.py +37 -0
synth_ai/demos/math/__init__.py +1 -0
synth_ai/demos/math/_common.py +16 -0
synth_ai/demos/math/app.py +38 -0
synth_ai/demos/math/config.toml +76 -0
synth_ai/demos/math/deploy_modal.py +54 -0
synth_ai/demos/math/modal_task_app.py +703 -0
synth_ai/demos/math/task_app_entry.py +51 -0
synth_ai/environments/environment/core.py +7 -1
synth_ai/environments/examples/bandit/engine.py +12 -5
synth_ai/environments/examples/bandit/environment.py +0 -1
synth_ai/environments/examples/bandit/taskset.py +4 -4
synth_ai/environments/examples/crafter_classic/engine_deterministic_patch.py +7 -4
synth_ai/environments/examples/crafter_classic/engine_serialization_patch_v3.py +9 -5
synth_ai/environments/examples/crafter_classic/environment.py +93 -2
synth_ai/environments/examples/crafter_classic/world_config_patch_simple.py +4 -3
synth_ai/environments/examples/enron/engine.py +7 -2
synth_ai/environments/examples/enron/environment.py +68 -0
synth_ai/environments/examples/red/engine.py +60 -12
synth_ai/environments/examples/red/engine_helpers/memory_map.py +7 -0
synth_ai/environments/examples/red/engine_helpers/reward_components.py +151 -179
synth_ai/environments/examples/red/engine_helpers/reward_library/pallet_town_progression.py +477 -0
synth_ai/environments/examples/red/engine_helpers/state_extraction.py +32 -0
synth_ai/environments/examples/red/environment.py +86 -0
synth_ai/environments/examples/red/trace_hooks_v3.py +168 -0
synth_ai/environments/examples/sokoban/taskset.py +116 -0
synth_ai/environments/examples/verilog/engine.py +104 -12
synth_ai/environments/examples/wordle/environment.py +0 -1
synth_ai/environments/reproducibility/tree.py +5 -6
synth_ai/environments/service/app.py +11 -12
synth_ai/environments/service/core_routes.py +10 -9
synth_ai/environments/stateful/engine.py +1 -1
synth_ai/environments/tasks/core.py +1 -0
synth_ai/environments/tasks/filters.py +5 -6
synth_ai/environments/tasks/utils.py +4 -5
synth_ai/evals/__init__.py +15 -0
synth_ai/evals/base.py +14 -5
synth_ai/evals/client.py +82 -0
synth_ai/evals/types.py +42 -0
synth_ai/http.py +8 -22
synth_ai/http_client.py +45 -12
synth_ai/inference/__init__.py +0 -2
synth_ai/inference/client.py +21 -7
synth_ai/jobs/client.py +129 -80
synth_ai/judge_schemas.py +127 -0
synth_ai/learning/__init__.py +51 -6
synth_ai/learning/algorithms.py +14 -0
synth_ai/learning/client.py +122 -30
synth_ai/learning/config.py +2 -40
synth_ai/learning/constants.py +0 -2
synth_ai/learning/ft_client.py +4 -56
synth_ai/learning/health.py +14 -8
synth_ai/learning/jobs.py +43 -47
synth_ai/learning/prompt_learning_client.py +276 -0
synth_ai/learning/prompt_learning_types.py +185 -0
synth_ai/{rl → learning/rl}/__init__.py +14 -5
synth_ai/learning/rl/client.py +269 -0
synth_ai/learning/rl/config.py +31 -0
synth_ai/{rl → learning/rl}/contracts.py +5 -10
synth_ai/{rl → learning/rl}/env_keys.py +45 -16
synth_ai/learning/rl/secrets.py +13 -0
synth_ai/learning/rl_client.py +2 -253
synth_ai/learning/sft/__init__.py +29 -0
synth_ai/learning/sft/client.py +68 -0
synth_ai/learning/sft/config.py +270 -0
synth_ai/learning/sft/data.py +698 -0
synth_ai/learning/sse.py +25 -26
synth_ai/learning/validators.py +29 -25
synth_ai/mcp/__init__.py +5 -0
synth_ai/mcp/__main__.py +8 -0
synth_ai/mcp/main.py +254 -0
synth_ai/mcp/setup.py +100 -0
synth_ai/modal.py +257 -0
synth_ai/pricing/__init__.py +3 -0
synth_ai/pricing/model_pricing.py +64 -0
synth_ai/session/__init__.py +75 -0
synth_ai/session/client.py +383 -0
synth_ai/session/constants.py +63 -0
synth_ai/session/exceptions.py +105 -0
synth_ai/session/manager.py +139 -0
synth_ai/session/models.py +89 -0
synth_ai/session/query.py +110 -0
synth_ai/spec/__init__.py +46 -0
synth_ai/spec/dataclasses.py +149 -0
synth_ai/spec/loader.py +144 -0
synth_ai/spec/serializer.py +199 -0
synth_ai/spec/validation.py +250 -0
synth_ai/streaming/__init__.py +29 -0
synth_ai/streaming/config.py +94 -0
synth_ai/streaming/handlers.py +589 -0
synth_ai/streaming/streamer.py +320 -0
synth_ai/streaming/types.py +95 -0
synth_ai/task/__init__.py +116 -3
synth_ai/task/apps/__init__.py +132 -0
synth_ai/task/auth.py +165 -0
synth_ai/task/client.py +167 -0
synth_ai/task/config.py +261 -0
synth_ai/task/contracts.py +173 -57
synth_ai/task/datasets.py +108 -0
synth_ai/task/errors.py +50 -0
synth_ai/task/health.py +17 -11
synth_ai/task/inference_api.py +101 -0
synth_ai/task/json.py +111 -0
synth_ai/task/proxy.py +251 -0
synth_ai/task/rubrics/__init__.py +55 -0
synth_ai/task/rubrics/loaders.py +156 -0
synth_ai/task/rubrics/models.py +57 -0
synth_ai/task/rubrics/scoring.py +116 -0
synth_ai/task/rubrics/strict.py +149 -0
synth_ai/task/rubrics.py +219 -0
synth_ai/task/server.py +432 -0
synth_ai/task/trace_correlation_helpers.py +328 -0
synth_ai/task/tracing_utils.py +95 -0
synth_ai/task/validators.py +449 -6
synth_ai/task/vendors.py +59 -0
synth_ai/tracing_v3/__init__.py +4 -0
synth_ai/tracing_v3/abstractions.py +21 -4
synth_ai/tracing_v3/config.py +167 -22
synth_ai/tracing_v3/constants.py +21 -0
synth_ai/tracing_v3/db_config.py +42 -29
synth_ai/tracing_v3/decorators.py +80 -45
synth_ai/tracing_v3/examples/basic_usage.py +15 -9
synth_ai/tracing_v3/hooks.py +6 -4
synth_ai/tracing_v3/llm_call_record_helpers.py +161 -61
synth_ai/tracing_v3/migration_helper.py +1 -2
synth_ai/tracing_v3/replica_sync.py +12 -7
synth_ai/tracing_v3/serialization.py +130 -0
synth_ai/tracing_v3/session_tracer.py +86 -21
synth_ai/tracing_v3/storage/base.py +98 -12
synth_ai/tracing_v3/storage/config.py +63 -16
synth_ai/tracing_v3/storage/factory.py +11 -9
synth_ai/tracing_v3/storage/utils.py +15 -11
synth_ai/tracing_v3/trace_utils.py +317 -0
synth_ai/tracing_v3/turso/__init__.py +8 -21
synth_ai/tracing_v3/turso/daemon.py +123 -15
synth_ai/tracing_v3/turso/models.py +5 -2
synth_ai/tracing_v3/turso/native_manager.py +1293 -0
synth_ai/tracing_v3/utils.py +5 -4
synth_ai/tunnel.py +143 -0
synth_ai/tunnel_deploy.py +278 -0
synth_ai/types.py +8 -0
synth_ai/urls.py +11 -0
synth_ai/utils/__init__.py +166 -0
synth_ai/utils/agents.py +74 -0
synth_ai/utils/apps.py +152 -0
synth_ai/utils/base_url.py +94 -0
synth_ai/utils/bin.py +39 -0
synth_ai/utils/claude.py +36 -0
synth_ai/utils/cli.py +284 -0
synth_ai/utils/config.py +81 -0
synth_ai/utils/env.py +346 -0
synth_ai/utils/errors.py +85 -0
synth_ai/utils/http.py +172 -0
synth_ai/utils/json.py +72 -0
synth_ai/utils/log_filter.py +99 -0
synth_ai/utils/logging.py +198 -0
synth_ai/utils/modal.py +299 -0
synth_ai/utils/paths.py +95 -0
synth_ai/utils/process.py +233 -0
synth_ai/utils/prompts.py +39 -0
synth_ai/utils/sqld.py +122 -0
synth_ai/utils/ssl.py +25 -0
synth_ai/utils/task_app_discovery.py +882 -0
synth_ai/utils/task_app_env.py +186 -0
synth_ai/utils/task_app_state.py +318 -0
synth_ai/utils/tunnel/__init__.py +12 -0
synth_ai/utils/tunnel/config.py +55 -0
synth_ai/utils/user_config.py +137 -0
synth_ai/uvicorn.py +77 -0
synth_ai-0.2.23.dev3.dist-info/METADATA +357 -0
synth_ai-0.2.23.dev3.dist-info/RECORD +983 -0
{synth_ai-0.2.8.dev4.dist-info → synth_ai-0.2.23.dev3.dist-info}/entry_points.txt +0 -1
{synth_ai-0.2.8.dev4.dist-info → synth_ai-0.2.23.dev3.dist-info}/top_level.txt +1 -0
synth_ai/cli/man.py +0 -106
synth_ai/core/experiment.py +0 -15
synth_ai/core/system.py +0 -15
synth_ai/environments/examples/sokoban/units/astar_common.py +0 -95
synth_ai/experimental/synth_oss.py +0 -446
synth_ai/handshake.py +0 -63
synth_ai/install_sqld.sh +0 -40
synth_ai/learning/offline/dpo.py +0 -0
synth_ai/learning/offline/providers.py +0 -7
synth_ai/learning/offline/sft.py +0 -0
synth_ai/learning/offline/shared.py +0 -0
synth_ai/learning/online/grpo.py +0 -0
synth_ai/learning/online/irft.py +0 -0
synth_ai/learning/prompts/banking77_injection_eval.py +0 -168
synth_ai/learning/prompts/gepa.py +0 -0
synth_ai/learning/prompts/hello_world_in_context_injection_ex.py +0 -213
synth_ai/learning/prompts/mipro.py +0 -289
synth_ai/learning/prompts/random_search.py +0 -246
synth_ai/learning/prompts/run_mipro_banking77.py +0 -172
synth_ai/learning/prompts/run_random_search_banking77.py +0 -324
synth_ai/lm/__init__.py +0 -51
synth_ai/lm/caching/constants.py +0 -6
synth_ai/lm/caching/dbs.py +0 -0
synth_ai/lm/caching/ephemeral.py +0 -102
synth_ai/lm/caching/handler.py +0 -137
synth_ai/lm/caching/initialize.py +0 -11
synth_ai/lm/caching/persistent.py +0 -114
synth_ai/lm/config.py +0 -110
synth_ai/lm/constants.py +0 -32
synth_ai/lm/core/__init__.py +0 -8
synth_ai/lm/core/all.py +0 -73
synth_ai/lm/core/exceptions.py +0 -7
synth_ai/lm/core/main.py +0 -319
synth_ai/lm/core/main_v3.py +0 -594
synth_ai/lm/core/synth_models.py +0 -48
synth_ai/lm/core/vendor_clients.py +0 -188
synth_ai/lm/cost/monitor.py +0 -1
synth_ai/lm/cost/statefulness.py +0 -1
synth_ai/lm/injection.py +0 -80
synth_ai/lm/overrides.py +0 -206
synth_ai/lm/provider_support/__init__.py +0 -8
synth_ai/lm/provider_support/anthropic.py +0 -972
synth_ai/lm/provider_support/openai.py +0 -1139
synth_ai/lm/provider_support/suppress_logging.py +0 -31
synth_ai/lm/structured_outputs/handler.py +0 -440
synth_ai/lm/structured_outputs/inject.py +0 -297
synth_ai/lm/structured_outputs/rehabilitate.py +0 -185
synth_ai/lm/tools/__init__.py +0 -3
synth_ai/lm/tools/base.py +0 -172
synth_ai/lm/unified_interface.py +0 -202
synth_ai/lm/vendors/base.py +0 -81
synth_ai/lm/vendors/core/anthropic_api.py +0 -387
synth_ai/lm/vendors/core/gemini_api.py +0 -292
synth_ai/lm/vendors/core/mistral_api.py +0 -322
synth_ai/lm/vendors/core/openai_api.py +0 -225
synth_ai/lm/vendors/core/synth_dev_api.py +0 -0
synth_ai/lm/vendors/local/ollama.py +0 -0
synth_ai/lm/vendors/openai_standard.py +0 -780
synth_ai/lm/vendors/openai_standard_responses.py +0 -256
synth_ai/lm/vendors/retries.py +0 -22
synth_ai/lm/vendors/supported/custom_endpoint.py +0 -417
synth_ai/lm/vendors/supported/deepseek.py +0 -69
synth_ai/lm/vendors/supported/grok.py +0 -75
synth_ai/lm/vendors/supported/groq.py +0 -16
synth_ai/lm/vendors/supported/ollama.py +0 -15
synth_ai/lm/vendors/supported/openrouter.py +0 -74
synth_ai/lm/vendors/supported/together.py +0 -11
synth_ai/lm/vendors/synth_client.py +0 -808
synth_ai/lm/warmup.py +0 -186
synth_ai/rl/secrets.py +0 -19
synth_ai/scripts/verify_rewards.py +0 -100
synth_ai/tracing/__init__.py +0 -30
synth_ai/tracing_v1/__init__.py +0 -33
synth_ai/tracing_v3/turso/manager.py +0 -760
synth_ai/v0/tracing/abstractions.py +0 -224
synth_ai/v0/tracing/base_client.py +0 -91
synth_ai/v0/tracing/client_manager.py +0 -131
synth_ai/v0/tracing/config.py +0 -142
synth_ai/v0/tracing/context.py +0 -146
synth_ai/v0/tracing/decorators.py +0 -682
synth_ai/v0/tracing/events/__init__.py +0 -0
synth_ai/v0/tracing/events/manage.py +0 -147
synth_ai/v0/tracing/events/scope.py +0 -86
synth_ai/v0/tracing/events/store.py +0 -228
synth_ai/v0/tracing/immediate_client.py +0 -151
synth_ai/v0/tracing/local.py +0 -18
synth_ai/v0/tracing/log_client_base.py +0 -73
synth_ai/v0/tracing/retry_queue.py +0 -186
synth_ai/v0/tracing/trackers.py +0 -515
synth_ai/v0/tracing/upload.py +0 -512
synth_ai/v0/tracing/utils.py +0 -9
synth_ai/v0/tracing_v1/__init__.py +0 -16
synth_ai/v0/tracing_v1/abstractions.py +0 -224
synth_ai/v0/tracing_v1/base_client.py +0 -91
synth_ai/v0/tracing_v1/client_manager.py +0 -131
synth_ai/v0/tracing_v1/config.py +0 -142
synth_ai/v0/tracing_v1/context.py +0 -146
synth_ai/v0/tracing_v1/decorators.py +0 -703
synth_ai/v0/tracing_v1/events/__init__.py +0 -0
synth_ai/v0/tracing_v1/events/manage.py +0 -147
synth_ai/v0/tracing_v1/events/scope.py +0 -86
synth_ai/v0/tracing_v1/events/store.py +0 -228
synth_ai/v0/tracing_v1/immediate_client.py +0 -151
synth_ai/v0/tracing_v1/local.py +0 -18
synth_ai/v0/tracing_v1/log_client_base.py +0 -73
synth_ai/v0/tracing_v1/retry_queue.py +0 -186
synth_ai/v0/tracing_v1/trackers.py +0 -515
synth_ai/v0/tracing_v1/upload.py +0 -527
synth_ai/v0/tracing_v1/utils.py +0 -9
synth_ai/zyk/__init__.py +0 -30
synth_ai-0.2.8.dev4.dist-info/METADATA +0 -129
synth_ai-0.2.8.dev4.dist-info/RECORD +0 -420
{synth_ai/lm/caching → examples/task_apps}/__init__.py +0 -0
{synth_ai/lm/cost → examples/task_apps/crafter}/__init__.py +0 -0
{synth_ai/lm/structured_outputs → examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/server}/__init__.py +0 -0
{synth_ai/lm/vendors → examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests}/__init__.py +0 -0
{synth_ai/lm/vendors/core → examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils}/__init__.py +0 -0
{synth_ai/lm/vendors/local → examples/task_apps/math}/__init__.py +0 -0
{synth_ai/lm/vendors/supported → examples/workflows}/__init__.py +0 -0
{synth_ai/v0/tracing → examples/workflows/math_rl}/__init__.py +0 -0
/synth_ai/{compound/cais.py → cli/__main__.py} +0 -0
/synth_ai/{learning/filtering.py → py.typed} +0 -0
{synth_ai-0.2.8.dev4.dist-info → synth_ai-0.2.23.dev3.dist-info}/WHEEL +0 -0
{synth_ai-0.2.8.dev4.dist-info → synth_ai-0.2.23.dev3.dist-info}/licenses/LICENSE +0 -0

synth_ai/demos/core/cli.py CHANGED Viewed

@@ -1,19 +1,38 @@
 from __future__ import annotations
-import argparse
+import contextlib
 import json
 import os
-import sys
-import time
-from pathlib import Path
-from typing import Any, Dict, Callable
 import shutil
 import stat
+import sys
 import textwrap
+import time
+from collections.abc import Callable
+from pathlib import Path
+from typing import Any
+from synth_ai.demo_registry import (
+    DemoTemplate,
+    get_demo_template,
+    list_demo_templates,
+)
 from synth_ai.demos.demo_task_apps import core as demo_core
-from synth_ai.handshake import run_handshake, HandshakeError
-from synth_ai.demos.demo_task_apps.core import DemoEnv
+from synth_ai.demos.demo_task_apps.core import DEFAULT_TASK_APP_SECRET_NAME, DemoEnv
+from synth_ai.handshake import HandshakeError, run_handshake
+from synth_ai.utils.process import get_subprocess_env, should_filter_log_line
+def _key_preview(value: str, label: str) -> str:
+    """Return a short descriptor for a secret without leaking the full value."""
+    try:
+        text = value or ""
+        length = len(text)
+        prefix = text[:6] if length >= 6 else text
+        suffix = text[-5:] if length >= 5 else text
+        return f"{label} len={length} prefix={prefix} last5={suffix}"
+    except Exception:
+        return f"{label} len=0"
 def _is_modal_public_url(u: str) -> bool:
@@ -26,35 +45,71 @@ def _is_modal_public_url(u: str) -> bool:
         return False
-def cmd_setup(_args: argparse.Namespace) -> int:
-    # 1) Always perform SDK handshake and overwrite .env with returned keys
+def setup() -> int:
+    # Change to demo directory if stored
+    demo_dir = demo_core.load_demo_dir()
+    if demo_dir and os.path.isdir(demo_dir):
+        os.chdir(demo_dir)
+        print(f"Using demo directory: {demo_dir}")
+    # 1) Try to fetch keys from frontend; fall back to manual input if fetch fails
+    synth_key = ""
+    rl_env_key = ""
+    org_name = "this organization"
     try:
         print("\n⏳ Connecting SDK to your browser session…")
         res = run_handshake()
-        user = res.get("user") or {}
         org = res.get("org") or {}
         keys = res.get("keys") or {}
         synth_key = str(keys.get("synth") or "").strip()
         rl_env_key = str(keys.get("rl_env") or "").strip()
-        if not synth_key or not rl_env_key:
-            raise HandshakeError("handshake returned missing keys")
-        # Overwrite .env with the latest values from the account/org
-        demo_core.persist_dotenv_values({
+        org_name = org.get("name") or "this organization"
+        print(f"✅ Connected to {org_name}!")
+    except (HandshakeError, Exception) as e:
+        print(f"⚠️  Failed to fetch keys from frontend: {e}")
+        print("Falling back to manual entry...")
+    # Prompt for manual input if any key is missing
+    if not synth_key:
+        try:
+            synth_key = input(
+                "Failed to fetch your Synth API key. Please enter your Synth API key here:\n> "
+            ).strip()
+        except (EOFError, KeyboardInterrupt):
+            print("\nSetup cancelled.")
+            return 1
+        if not synth_key:
+            print("Synth API key is required.")
+            return 1
+    if not rl_env_key:
+        try:
+            rl_env_key = input(
+                "Failed to fetch your RL Environment API key. Please enter your RL Environment API key here:\n> "
+            ).strip()
+        except (EOFError, KeyboardInterrupt):
+            print("\nSetup cancelled.")
+            return 1
+        if not rl_env_key:
+            print("RL Environment API key is required.")
+            return 1
+    # Persist both keys to .env
+    dotenv_path = demo_core.persist_dotenv_values(
+        {
             "SYNTH_API_KEY": synth_key,
             "ENVIRONMENT_API_KEY": rl_env_key,
-        })
-        org_name = (org.get("name") or "this organization")
-        print(f"✅ Connected to {org_name}!")
-    except HandshakeError as e:
-        print(f"Handshake failed: {e}")
-        return 1
-    except Exception as e:
-        print(f"Unexpected handshake error: {e}")
-        return 1
+        }
+    )
+    # Store .env path for subsequent commands
+    demo_core.persist_env_file_path(dotenv_path)
     # 2) Reload env after handshake to pick up values from .env (suppress env prints)
-    import io
     import contextlib
+    import io
     _buf = io.StringIO()
     with contextlib.redirect_stdout(_buf):
         env = demo_core.load_env()
@@ -71,22 +126,22 @@ def cmd_setup(_args: argparse.Namespace) -> int:
             return
         current = env.task_app_base_url
         needs_lookup = False
-        if not current:
-            needs_lookup = True
-        elif not _is_modal_public_url(current):
+        if not current or not _is_modal_public_url(current):
             needs_lookup = True
         if not needs_lookup:
             return
-        code, out = _popen_capture([
-            "uv",
-            "run",
-            "python",
-            "-m",
-            "modal",
-            "app",
-            "url",
-            env.task_app_name,
-        ])
+        code, out = _popen_capture(
+            [
+                "uv",
+                "run",
+                "python",
+                "-m",
+                "modal",
+                "app",
+                "url",
+                env.task_app_name,
+            ]
+        )
         if code != 0 or not out:
             return
         new_url = ""
@@ -100,7 +155,6 @@ def cmd_setup(_args: argparse.Namespace) -> int:
             dotenv_values = {
                 "TASK_APP_BASE_URL": new_url,
                 "TASK_APP_NAME": env.task_app_name,
-                "TASK_APP_SECRET_NAME": env.task_app_secret_name or f"{env.task_app_name}-secret",
             }
             demo_core.persist_dotenv_values(dotenv_values)
             os.environ["TASK_APP_BASE_URL"] = new_url
@@ -117,15 +171,16 @@ def cmd_setup(_args: argparse.Namespace) -> int:
     _maybe_fix_task_url()
-    ok_backend = False
-    ok_task = False
     if env.dev_backend_url:
-        api = env.dev_backend_url.rstrip("/") + ("" if env.dev_backend_url.endswith("/api") else "/api")
-        ok_backend = demo_core.assert_http_ok(api + "/health", method="GET")
+        api = env.dev_backend_url.rstrip("/") + (
+            "" if env.dev_backend_url.endswith("/api") else "/api"
+        )
+        demo_core.assert_http_ok(api + "/health", method="GET")
         # Intentionally suppress backend health print for concise output
     if env.task_app_base_url:
-        ok_task = demo_core.assert_http_ok(env.task_app_base_url.rstrip("/") + "/health", method="GET") or \
-                  demo_core.assert_http_ok(env.task_app_base_url.rstrip("/"), method="GET")
+        demo_core.assert_http_ok(
+            env.task_app_base_url.rstrip("/") + "/health", method="GET"
+        ) or demo_core.assert_http_ok(env.task_app_base_url.rstrip("/"), method="GET")
         # Intentionally suppress task app health print
     else:
         print("\nSet your task app URL by running:\nuvx synth-ai rl_demo deploy\n")
@@ -133,13 +188,19 @@ def cmd_setup(_args: argparse.Namespace) -> int:
     # Omit uv version print to keep output concise
     # Keep exit code neutral; not all checks are critical for pairing
+    print(f"\nKeys saved to: {dotenv_path}")
     return 0
-def _popen_capture(cmd: list[str], cwd: str | None = None, env: dict | None = None) -> tuple[int, str]:
+def _popen_capture(
+    cmd: list[str], cwd: str | None = None, env: dict | None = None
+) -> tuple[int, str]:
     import subprocess
     try:
-        proc = subprocess.Popen(cmd, cwd=cwd, env=env, stdout=subprocess.PIPE, stderr=subprocess.STDOUT, text=True)
+        proc = subprocess.Popen(
+            cmd, cwd=cwd, env=get_subprocess_env(env), stdout=subprocess.PIPE, stderr=subprocess.STDOUT, text=True
+        )
         out, _ = proc.communicate()
         return int(proc.returncode or 0), out or ""
     except Exception as e:
@@ -156,7 +217,7 @@ def _popen_stream(cmd: list[str], cwd: str | None = None, env: dict | None = Non
         proc = subprocess.Popen(
             cmd,
             cwd=cwd,
-            env=env,
+            env=get_subprocess_env(env),
             stdout=subprocess.PIPE,
             stderr=subprocess.STDOUT,
             text=True,
@@ -169,7 +230,8 @@ def _popen_stream(cmd: list[str], cwd: str | None = None, env: dict | None = Non
     def _pump(stdout) -> None:
         try:
             for line in stdout:
-                print(line.rstrip())
+                if not should_filter_log_line(line):
+                    print(line.rstrip())
         except Exception:
             pass
@@ -183,7 +245,9 @@ def _popen_stream(cmd: list[str], cwd: str | None = None, env: dict | None = Non
     return int(proc.returncode or 0)
-def _popen_stream_capture(cmd: list[str], cwd: str | None = None, env: dict | None = None) -> tuple[int, str]:
+def _popen_stream_capture(
+    cmd: list[str], cwd: str | None = None, env: dict | None = None
+) -> tuple[int, str]:
     """Stream subprocess output to stdout and also capture it into a buffer."""
     import subprocess
     import threading
@@ -193,7 +257,7 @@ def _popen_stream_capture(cmd: list[str], cwd: str | None = None, env: dict | No
         proc = subprocess.Popen(
             cmd,
             cwd=cwd,
-            env=env,
+            env=get_subprocess_env(env),
             stdout=subprocess.PIPE,
             stderr=subprocess.STDOUT,
             text=True,
@@ -207,8 +271,9 @@ def _popen_stream_capture(cmd: list[str], cwd: str | None = None, env: dict | No
         try:
             for line in stdout:
                 line = line.rstrip()
-                print(line)
-                buf_lines.append(line)
+                if not should_filter_log_line(line):
+                    print(line)
+                    buf_lines.append(line)
         except Exception:
             pass
@@ -222,55 +287,6 @@ def _popen_stream_capture(cmd: list[str], cwd: str | None = None, env: dict | No
     return int(proc.returncode or 0), "\n".join(buf_lines)
-def _mask_secret_args(args: list[str]) -> list[str]:
-    masked: list[str] = []
-    for a in args:
-        if "=" in a and any(a.startswith(prefix) for prefix in ("ENVIRONMENT_API_KEY=", "OPENAI_API_KEY=", "SYNTH_API_KEY=")):
-            try:
-                key, value = a.split("=", 1)
-                tail = value[-5:] if len(value) >= 5 else value
-                masked.append(f"{key}=***{tail}")
-            except Exception:
-                masked.append("<masked>")
-        else:
-            masked.append(a)
-    return masked
-def _ensure_modal_secret(
-    secret_name: str,
-    *,
-    values: dict[str, str],
-    label: str = "deploy",
-    replace: bool = False,
-) -> bool:
-    prefix = f"[{label}]"
-    if not secret_name.strip():
-        raise RuntimeError("Secret name is required")
-    if not values:
-        raise RuntimeError("No values provided to create Modal secret")
-    create_args = [f"{k}={v}" for k, v in values.items()]
-    create_cmd = ["uv", "run", "modal", "secret", "create", secret_name, *create_args]
-    if replace:
-        print(f"{prefix} Removing Modal secret '{secret_name}' (if present)…")
-        delete_cmd = ["bash", "-lc", f"printf 'y\\n' | uv run modal secret delete {secret_name}"]
-        print(f"{prefix} Command:", " ".join(delete_cmd))
-        delete_code = _popen_stream(delete_cmd)
-        if delete_code != 0:
-            print(f"{prefix} Warning: delete command exited with {delete_code}; continuing to create")
-    print(f"\n{prefix} Creating Modal secret '{secret_name}'…")
-    print(f"{prefix} Command:", " ".join(_mask_secret_args(create_cmd)))
-    code = _popen_stream(create_cmd)
-    if code != 0:
-        raise RuntimeError("Failed to provision Modal secret (see logs above)")
-    return True
 def _fmt_float(value: float) -> str:
     return f"{value:.10g}"
@@ -283,7 +299,19 @@ def _find_asgi_apps(root: Path) -> list[Path]:
       - "@modal.asgi_app()"
     """
     results: list[Path] = []
-    skip_dirs = {".git", ".hg", ".svn", "node_modules", "dist", "build", "__pycache__", ".ruff_cache", ".mypy_cache", "venv", ".venv"}
+    skip_dirs = {
+        ".git",
+        ".hg",
+        ".svn",
+        "node_modules",
+        "dist",
+        "build",
+        "__pycache__",
+        ".ruff_cache",
+        ".mypy_cache",
+        "venv",
+        ".venv",
+    }
     for dirpath, dirnames, filenames in os.walk(root):
         dirnames[:] = [d for d in dirnames if d not in skip_dirs]
         for name in filenames:
@@ -297,16 +325,20 @@ def _find_asgi_apps(root: Path) -> list[Path]:
                     results.append(path)
             except Exception:
                 continue
     # Stable order: prioritize files under synth_demo/ first, then alphabetical
     def _priority(p: Path) -> tuple[int, str]:
         rel = str(p.resolve())
         in_demo = "/synth_demo/" in rel or rel.endswith("/synth_demo/task_app.py")
         return (0 if in_demo else 1, rel)
     results.sort(key=_priority)
     return results
-def _prompt_value(label: str, default: str | int | float, cast: Callable[[str], Any] | None = None) -> Any:
+def _prompt_value(
+    label: str, default: str | int | float, cast: Callable[[str], Any] | None = None
+) -> Any:
     prompt = f"{label} [{default}]: "
     try:
         raw = input(prompt).strip()
@@ -325,7 +357,19 @@ def _prompt_value(label: str, default: str | int | float, cast: Callable[[str],
 def _find_vllm_tomls(root: Path) -> list[Path]:
     results: list[Path] = []
-    skip_dirs = {".git", ".hg", ".svn", "node_modules", "dist", "build", "__pycache__", ".ruff_cache", ".mypy_cache", "venv", ".venv"}
+    skip_dirs = {
+        ".git",
+        ".hg",
+        ".svn",
+        "node_modules",
+        "dist",
+        "build",
+        "__pycache__",
+        ".ruff_cache",
+        ".mypy_cache",
+        "venv",
+        ".venv",
+    }
     for dirpath, dirnames, filenames in os.walk(root):
         dirnames[:] = [d for d in dirnames if d not in skip_dirs]
         for name in filenames:
@@ -345,7 +389,9 @@ def _create_new_config(env: DemoEnv) -> str:
     default_path = os.path.join(os.getcwd(), "demo_config.toml")
     while True:
         try:
-            destination = input(f"Path to save new config [{default_path}]: ").strip() or default_path
+            destination = (
+                input(f"Path to save new config [{default_path}]: ").strip() or default_path
+            )
         except Exception:
             destination = default_path
         destination = os.path.abspath(destination)
@@ -354,7 +400,9 @@ def _create_new_config(env: DemoEnv) -> str:
             continue
         if os.path.exists(destination):
             try:
-                overwrite = input(f"{destination} exists. Overwrite? [y/N]: ").strip().lower() or "n"
+                overwrite = (
+                    input(f"{destination} exists. Overwrite? [y/N]: ").strip().lower() or "n"
+                )
             except Exception:
                 overwrite = "n"
             if not overwrite.startswith("y"):
@@ -366,7 +414,9 @@ def _create_new_config(env: DemoEnv) -> str:
     model_name = _prompt_value("Model name", "Qwen/Qwen3-0.6B")
     compute_gpu_type = _prompt_value("Compute GPU type", "H100")
     compute_gpu_count = _prompt_value("Compute GPU count", 4, int)
-    topology_gpu_type = _prompt_value("Topology GPU type", f"{compute_gpu_type}:{compute_gpu_count}")
+    topology_gpu_type = _prompt_value(
+        "Topology GPU type", f"{compute_gpu_type}:{compute_gpu_count}"
+    )
     gpus_for_vllm = _prompt_value("Topology gpus_for_vllm", 2, int)
     gpus_for_training = _prompt_value("Topology gpus_for_training", 1, int)
     tensor_parallel = _prompt_value("Topology tensor_parallel", 2, int)
@@ -384,8 +434,9 @@ def _create_new_config(env: DemoEnv) -> str:
     task_url_default = env.task_app_base_url or ""
     services_task_url = _prompt_value("services.task_url", task_url_default)
-    template = textwrap.dedent(
-        f"""\
+    template = (
+        textwrap.dedent(
+            f"""\
         # Crafter online RL training configuration (research local copy)
         [model]
@@ -527,7 +578,9 @@ def _create_new_config(env: DemoEnv) -> str:
         [services]
         task_url = \"{services_task_url}\"
         """
-    ).strip() + "\n"
+        ).strip()
+        + "\n"
+    )
     with open(destination, "w", encoding="utf-8") as fh:
         fh.write(template)
@@ -546,7 +599,11 @@ def _select_or_create_config(explicit: str | None, env: DemoEnv) -> str:
     discovered = _find_vllm_tomls(search_root)
     extras: list[Path] = []
-    packaged = Path(os.path.abspath(os.path.join(os.path.dirname(__file__), "..", "demo_task_apps", "math", "config.toml")))
+    packaged = Path(
+        os.path.abspath(
+            os.path.join(os.path.dirname(__file__), "..", "demo_task_apps", "math", "config.toml")
+        )
+    )
     extras.append(packaged)
     home_cfg = Path(os.path.expanduser("~/.synth-ai/demo_config.toml"))
     extras.append(home_cfg)
@@ -592,29 +649,36 @@ def _ensure_task_app_ready(env: DemoEnv, synth_key: str, *, label: str) -> DemoE
     env_key = (env.env_api_key or "").strip()
     if not env_key:
-        raise RuntimeError(f"[{label}] ENVIRONMENT_API_KEY missing. Run `uvx synth-ai rl_demo deploy` first.")
+        raise RuntimeError(
+            f"[{label}] ENVIRONMENT_API_KEY missing. Run `uvx synth-ai rl_demo deploy` first."
+        )
     task_url = env.task_app_base_url
     if not task_url or not _is_modal_public_url(task_url):
         resolved = ""
         if env.task_app_name:
             try:
-                choice = input(
-                    f"Resolve URL from Modal for app '{env.task_app_name}'? [Y/n]: "
-                ).strip().lower() or "y"
+                choice = (
+                    input(f"Resolve URL from Modal for app '{env.task_app_name}'? [Y/n]: ")
+                    .strip()
+                    .lower()
+                    or "y"
+                )
             except Exception:
                 choice = "y"
             if choice.startswith("y"):
-                code, out = _popen_capture([
-                    "uv",
-                    "run",
-                    "python",
-                    "-m",
-                    "modal",
-                    "app",
-                    "url",
-                    env.task_app_name,
-                ])
+                code, out = _popen_capture(
+                    [
+                        "uv",
+                        "run",
+                        "python",
+                        "-m",
+                        "modal",
+                        "app",
+                        "url",
+                        env.task_app_name,
+                    ]
+                )
                 if code == 0 and out:
                     for tok in out.split():
                         if _is_modal_public_url(tok):
@@ -623,7 +687,9 @@ def _ensure_task_app_ready(env: DemoEnv, synth_key: str, *, label: str) -> DemoE
         if not resolved:
             print(f"[{label}] Task app URL not configured or not a valid Modal public URL.")
             print("Examples: https://<app-name>-fastapi-app.modal.run")
-            entered = input("Enter Task App base URL (must contain '.modal.run'), or press Enter to abort: ").strip()
+            entered = input(
+                "Enter Task App base URL (must contain '.modal.run'), or press Enter to abort: "
+            ).strip()
             if not entered or not _is_modal_public_url(entered):
                 raise RuntimeError(f"[{label}] Valid Task App URL is required.")
             task_url = entered.rstrip("/")
@@ -639,30 +705,26 @@ def _ensure_task_app_ready(env: DemoEnv, synth_key: str, *, label: str) -> DemoE
         app_name = fallback
         demo_core.persist_task_url(task_url, name=app_name)
-    secret_name = env.task_app_secret_name.strip() or f"{app_name}-secret"
     demo_core.persist_task_url(task_url, name=app_name)
-    demo_core.persist_dotenv_values({
-        "TASK_APP_BASE_URL": task_url,
-        "TASK_APP_NAME": app_name,
-        "TASK_APP_SECRET_NAME": secret_name,
-    })
+    demo_core.persist_dotenv_values(
+        {
+            "TASK_APP_BASE_URL": task_url,
+            "TASK_APP_NAME": app_name,
+            "TASK_APP_SECRET_NAME": DEFAULT_TASK_APP_SECRET_NAME,
+        }
+    )
-    openai_key = (os.environ.get("OPENAI_API_KEY") or local_env.get("OPENAI_API_KEY") or "").strip()
-    secret_values: dict[str, str] = {"ENVIRONMENT_API_KEY": env_key}
-    if openai_key:
-        secret_values["OPENAI_API_KEY"] = openai_key
     if synth_key:
-        secret_values["SYNTH_API_KEY"] = synth_key
+        os.environ["SYNTH_API_KEY"] = synth_key
-    _ensure_modal_secret(secret_name, values=secret_values, label=label, replace=True)
+    openai_key = (os.environ.get("OPENAI_API_KEY") or local_env.get("OPENAI_API_KEY") or "").strip()
+    if openai_key:
+        os.environ["OPENAI_API_KEY"] = openai_key
-    rollout_url = task_url.rstrip("/") + "/health/rollout"
     print(f"[{label}] Verifying rollout health:")
     try:
         ek = (env_key or "").strip()
-        ek_len = len(ek)
-        ek_tail = ek[-5:] if ek_len >= 5 else ek
-        print(f"[{label}] Using ENVIRONMENT_API_KEY len={ek_len} last5={ek_tail}")
+        print(f"[{label}] {_key_preview(ek, 'ENVIRONMENT_API_KEY')}")
     except Exception:
         pass
     health_base = task_url.rstrip("/")
@@ -673,7 +735,6 @@ def _ensure_task_app_ready(env: DemoEnv, synth_key: str, *, label: str) -> DemoE
         print(f"[{label}] GET", h)
         rc, body = _http("GET", h, headers={"X-API-Key": env_key})
         if rc == 200:
-            rollout_url = h
             break
     print(f"[{label}] status: {rc}")
     try:
@@ -685,41 +746,64 @@ def _ensure_task_app_ready(env: DemoEnv, synth_key: str, *, label: str) -> DemoE
     print(f"[{label}] body:", preview)
     if rc != 200:
         print(f"[{label}] Warning: rollout health check failed ({rc}). Response: {body}")
+        with contextlib.suppress(Exception):
+            print(f"[{label}] Sent header X-API-Key → {_key_preview(env_key, 'X-API-Key')}")
     else:
         print(f"[{label}] Task app rollout health check OK.")
     os.environ["TASK_APP_BASE_URL"] = task_url
     os.environ["ENVIRONMENT_API_KEY"] = env_key
+    os.environ["TASK_APP_SECRET_NAME"] = DEFAULT_TASK_APP_SECRET_NAME
     updated_env = demo_core.load_env()
     updated_env.env_api_key = env_key
     updated_env.task_app_base_url = task_url
     updated_env.task_app_name = app_name
-    updated_env.task_app_secret_name = secret_name
+    updated_env.task_app_secret_name = DEFAULT_TASK_APP_SECRET_NAME
     return updated_env
-def cmd_deploy(args: argparse.Namespace) -> int:
+def deploy(
+    local: bool = False, app: str | None = None, name: str | None = None, script: str | None = None
+) -> int:
+    # Change to demo directory if stored
+    demo_dir = demo_core.load_demo_dir()
+    if demo_dir and os.path.isdir(demo_dir):
+        os.chdir(demo_dir)
+        print(f"Using demo directory: {demo_dir}")
     env = demo_core.load_env()
+    os.environ["TASK_APP_SECRET_NAME"] = DEFAULT_TASK_APP_SECRET_NAME
     cwd_env_path = os.path.join(os.getcwd(), ".env")
     local_env = demo_core.load_dotenv_file(cwd_env_path)
     url = ""
     app_name = env.task_app_name or ""
     try:
-        if args.local:
+        if local:
             print("Starting local Task App…")
             import subprocess
-            subprocess.Popen([sys.executable, "-c", "from synth_ai.demos.demo_task_apps.math.app import run; run()"],
-                             stdout=sys.stdout, stderr=sys.stderr)
+            subprocess.Popen(
+                [
+                    sys.executable,
+                    "-c",
+                    "from synth_ai.demos.demo_task_apps.math.app import run; run()",
+                ],
+                env=get_subprocess_env(),
+                stdout=sys.stdout,
+                stderr=sys.stderr,
+            )
             target = "http://127.0.0.1:8080"
             app_name = ""
             for _ in range(30):
-                if demo_core.assert_http_ok(target + "/health", method="GET") or demo_core.assert_http_ok(target, method="GET"):
+                if demo_core.assert_http_ok(
+                    target + "/health", method="GET"
+                ) or demo_core.assert_http_ok(target, method="GET"):
                     url = target
                     break
                 time.sleep(1)
         else:
             # Auto-detect app path if not supplied; prompt interactively from discovered ASGI apps
-            app_path = os.path.abspath(args.app) if args.app else None
+            app_path = os.path.abspath(app) if app else None
             if not app_path or not os.path.isfile(app_path):
                 # First pass: look for known common filenames
                 candidates = [
@@ -738,7 +822,9 @@ def cmd_deploy(args: argparse.Namespace) -> int:
                             rel = os.path.relpath(str(pth), os.getcwd())
                             print(f"  [{idx}] {rel}")
                         try:
-                            sel = input(f"Enter choice [1-{len(found)}] (default 1): ").strip() or "1"
+                            sel = (
+                                input(f"Enter choice [1-{len(found)}] (default 1): ").strip() or "1"
+                            )
                         except Exception:
                             sel = "1"
                         try:
@@ -747,12 +833,13 @@ def cmd_deploy(args: argparse.Namespace) -> int:
                             choice = 1
                         choice = max(1, min(choice, len(found)))
                         app_path = str(found[choice - 1].resolve())
-            if not app_path and args.script:
+            if not app_path and script:
                 # Legacy script fallback if user supplied --script explicitly
                 from synth_ai.demos.demo_task_apps.math.deploy_modal import deploy as modal_deploy
-                url = modal_deploy(script_path=args.script, env_api_key=env.env_api_key)
-                if args.name:
-                    app_name = args.name
+                url = modal_deploy(script_path=script, env_api_key=env.env_api_key)
+                if name:
+                    app_name = name
             else:
                 if not app_path:
                     entered = input("Path to Modal app.py (e.g., ./task_app.py): ").strip()
@@ -763,7 +850,10 @@ def cmd_deploy(args: argparse.Namespace) -> int:
                     raise FileNotFoundError(f"App file not found: {app_path}")
                 # Surface the app path before asking for the name
                 print(f"Using task app: {app_path}")
-                suggested_name = args.name or f"synth-{os.path.splitext(os.path.basename(app_path))[0]}"
+                existing_name = (name or env.task_app_name or "").strip()
+                if not existing_name:
+                    existing_name = f"synth-{os.path.splitext(os.path.basename(app_path))[0]}"
+                suggested_name = existing_name
                 name_in = input(f"Modal app name [{suggested_name}]: ").strip() or suggested_name
                 app_name = name_in
                 print("\nAbout to deploy with:")
@@ -774,21 +864,23 @@ def cmd_deploy(args: argparse.Namespace) -> int:
                     print("Aborted by user.")
                     return 1
-                secret_name = (env.task_app_secret_name or "").strip() or f"{name_in}-secret"
                 existing_env_key = (env.env_api_key or "").strip()
                 env_key: str | None = existing_env_key or None
                 if existing_env_key:
                     try:
-                        reuse_choice = input(
-                            "Use existing ENVIRONMENT_API_KEY from state/.env? [Y/n]: "
-                        ).strip().lower() or "y"
+                        reuse_choice = (
+                            input("Use existing ENVIRONMENT_API_KEY from state/.env? [Y/n]: ")
+                            .strip()
+                            .lower()
+                            or "y"
+                        )
                     except Exception:
                         reuse_choice = "y"
                     if not reuse_choice.startswith("y"):
                         env_key = None
                 if env_key is None:
-                    from synth_ai.rl.secrets import mint_environment_api_key
+                    from synth_ai.learning.rl.secrets import mint_environment_api_key
                     env_key = mint_environment_api_key()
                     demo_core.persist_env_api_key(env_key)
@@ -797,69 +889,90 @@ def cmd_deploy(args: argparse.Namespace) -> int:
                     env.env_api_key = env_key
                     local_env["ENVIRONMENT_API_KEY"] = env_key
                     print("[deploy] Minted new ENVIRONMENT_API_KEY")
+                elif env_key:
+                    os.environ["ENVIRONMENT_API_KEY"] = env_key
                 # Optionally upload the new key to the backend using sealed box helper
-                backend_base = env.dev_backend_url or ""
-                synth_key = (env.synth_api_key or os.environ.get("SYNTH_API_KEY") or local_env.get("SYNTH_API_KEY") or "").strip()
+                backend_base = (env.dev_backend_url or "").rstrip("/")
+                synth_key = (
+                    env.synth_api_key
+                    or os.environ.get("SYNTH_API_KEY")
+                    or local_env.get("SYNTH_API_KEY")
+                    or ""
+                ).strip()
                 if backend_base and synth_key:
-                        backend_base = backend_base.rstrip("/")
-                        if not backend_base.endswith("/api"):
-                            backend_base = f"{backend_base}/api"
+                    # Pass a base WITHOUT trailing /api to setup_environment_api_key,
+                    # since it appends /api/v1/... internally.
+                    non_api_base = (
+                        backend_base[:-4] if backend_base.endswith("/api") else backend_base
+                    )
+                    try:
+                        choice = (
+                            input(f"Upload ENVIRONMENT_API_KEY to backend {non_api_base}? [Y/n]: ")
+                            .strip()
+                            .lower()
+                            or "y"
+                        )
+                    except Exception:
+                        choice = "y"
+                    if choice.startswith("y"):
                         try:
-                            choice = input(
-                                f"Upload ENVIRONMENT_API_KEY to backend {backend_base}? [Y/n]: "
-                            ).strip().lower() or "y"
-                        except Exception:
-                            choice = "y"
-                        if choice.startswith("y"):
-                            try:
-                                print(f"[deploy] Uploading ENVIRONMENT_API_KEY to {backend_base} …")
-                                from synth_ai.rl.env_keys import setup_environment_api_key
-                                setup_environment_api_key(backend_base.rstrip("/"), synth_key, token=env_key)
-                                print("[deploy] Backend sealed-box upload complete.")
-                            except Exception as upload_err:
-                                print(f"[deploy] Failed to upload ENVIRONMENT_API_KEY: {upload_err}")
-                                print(
-                                    "Hint: run `uvx python -c \"from synth_ai.rl.env_keys import setup_environment_api_key as s;"
-                                    " s('<backend>', '<synth_api_key>')\"` once the backend is reachable."
-                                )
-                synth_key = (env.synth_api_key or os.environ.get("SYNTH_API_KEY") or local_env.get("SYNTH_API_KEY") or "").strip()
+                            print(f"[deploy] Uploading ENVIRONMENT_API_KEY to {non_api_base} …")
+                            from synth_ai.learning.rl.env_keys import setup_environment_api_key
+                            setup_environment_api_key(non_api_base, synth_key, token=env_key)
+                            print("[deploy] Backend sealed-box upload complete.")
+                        except Exception as upload_err:
+                            print(f"[deploy] Failed to upload ENVIRONMENT_API_KEY: {upload_err}")
+                            print(
+                                'Hint: run `uvx python -c "from synth_ai.learning.rl.env_keys import setup_environment_api_key as s;'
+                                " s('<backend>', '<synth_api_key>')\"` once the backend is reachable."
+                            )
+                synth_key = (
+                    env.synth_api_key
+                    or os.environ.get("SYNTH_API_KEY")
+                    or local_env.get("SYNTH_API_KEY")
+                    or ""
+                ).strip()
                 if not synth_key:
-                    synth_key = input("Enter SYNTH_API_KEY for Modal secret (required): ").strip()
+                    synth_key = input("Enter SYNTH_API_KEY for deployment (required): ").strip()
                     if not synth_key:
-                        print("SYNTH_API_KEY is required to create the Modal secret.")
+                        print("SYNTH_API_KEY is required for deployment.")
                         return 1
                     demo_core.persist_api_key(synth_key)
                     demo_core.persist_dotenv_values({"SYNTH_API_KEY": synth_key})
                     env.synth_api_key = synth_key
+                os.environ["SYNTH_API_KEY"] = synth_key
-                openai_key = (os.environ.get("OPENAI_API_KEY") or local_env.get("OPENAI_API_KEY") or "").strip()
+                openai_key = (
+                    os.environ.get("OPENAI_API_KEY") or local_env.get("OPENAI_API_KEY") or ""
+                ).strip()
                 if not openai_key:
                     openai_key = input(
                         "Enter your OpenAI API key, found at https://platform.openai.com/api-keys\n> "
                     ).strip()
                     if not openai_key:
-                        print("OPENAI_API_KEY is required to create the Modal secret.")
+                        print("OPENAI_API_KEY is required for deployment.")
                         return 1
                     demo_core.persist_dotenv_values({"OPENAI_API_KEY": openai_key})
                     local_env["OPENAI_API_KEY"] = openai_key
+                os.environ["OPENAI_API_KEY"] = openai_key
-                values = {"SYNTH_API_KEY": synth_key, "OPENAI_API_KEY": openai_key}
-                if env_key:
-                    values["ENVIRONMENT_API_KEY"] = env_key
-                try:
-                    created = _ensure_modal_secret(secret_name, values=values, label="deploy", replace=True)
-                except RuntimeError as secret_err:
-                    print(f"Failed to prepare Modal secret '{secret_name}': {secret_err}")
-                    return 2
-                if created:
-                    print(f"[deploy] Modal secret '{secret_name}' provisioned.")
-                deploy_cmd = ["uv", "run", "python", "-m", "modal", "deploy", "--name", name_in, app_path]
-                print("\nStreaming Modal build/deploy logs (this can take several minutes on first run)…\n")
+                deploy_cmd = [
+                    "uv",
+                    "run",
+                    "python",
+                    "-m",
+                    "modal",
+                    "deploy",
+                    "--name",
+                    name_in,
+                    app_path,
+                ]
+                print(
+                    "\nStreaming Modal build/deploy logs (this can take several minutes on first run)…\n"
+                )
                 code, deploy_logs = _popen_stream_capture(deploy_cmd)
                 if code != 0:
                     raise RuntimeError(f"modal deploy failed (exit {code})")
@@ -867,6 +980,7 @@ def cmd_deploy(args: argparse.Namespace) -> int:
                 if not url:
                     try:
                         import re as _re
                         m_all = _re.findall(r"https?://[^\s]+\.modal\.run", deploy_logs or "")
                         if m_all:
                             url = m_all[-1].strip().rstrip("/")
@@ -881,7 +995,9 @@ def cmd_deploy(args: argparse.Namespace) -> int:
                             break
                 # Fallback: try reading recent Modal logs for the app to find a URL line
                 if not url:
-                    code3, out3 = _popen_capture(["uv", "run", "python", "-m", "modal", "app", "list"])
+                    code3, out3 = _popen_capture(
+                        ["uv", "run", "python", "-m", "modal", "app", "list"]
+                    )
                     if code3 == 0 and out3:
                         for line in out3.splitlines():
                             if name_in in line:
@@ -894,7 +1010,9 @@ def cmd_deploy(args: argparse.Namespace) -> int:
                 # Prompt user if still no valid URL
                 if not url:
                     print("\nCould not auto-detect a public Modal URL for the app.")
-                    entered = input("Enter the Modal public URL (must contain '.modal.run'), or press Enter to abort: ").strip()
+                    entered = input(
+                        "Enter the Modal public URL (must contain '.modal.run'), or press Enter to abort: "
+                    ).strip()
                     if entered and _is_modal_public_url(entered):
                         url = entered.rstrip("/")
                 if not url:
@@ -906,7 +1024,7 @@ def cmd_deploy(args: argparse.Namespace) -> int:
         dotenv_values = {"TASK_APP_BASE_URL": url}
         if app_name:
             dotenv_values["TASK_APP_NAME"] = app_name
-            dotenv_values["TASK_APP_SECRET_NAME"] = f"{app_name}-secret"
+        dotenv_values["TASK_APP_SECRET_NAME"] = DEFAULT_TASK_APP_SECRET_NAME
         dotenv_path = demo_core.persist_dotenv_values(dotenv_values)
         print(f"TASK_APP_BASE_URL={url}")
         if app_name:
@@ -915,16 +1033,16 @@ def cmd_deploy(args: argparse.Namespace) -> int:
         print(f"  export TASK_APP_BASE_URL={url}")
         if app_name:
             print(f"  export TASK_APP_NAME={app_name}")
-            print(f"  export TASK_APP_SECRET_NAME={app_name}-secret")
         print(f"Persisted to {dotenv_path}")
-        print("Next: uvx synth-ai run")
+        print("\nNext step:\n$ uvx synth-ai run")
         return 0
     except Exception as e:
         print(f"Deploy error: {e}")
         return 2
-    print("`rl_demo configure` prepares environment and secrets; `synth-ai run` now handles launches.")
+    print(
+        "`rl_demo configure` prepares environment and secrets; `synth-ai run` now handles launches."
+    )
     env = demo_core.load_env()
     synth_key = (env.synth_api_key or "").strip()
     if not synth_key:
@@ -956,133 +1074,314 @@ def cmd_deploy(args: argparse.Namespace) -> int:
     return 0
-def cmd_init(args: argparse.Namespace) -> int:
-    """Initialize a Modal-ready Math Task App in the current directory.
+def _ensure_modal_installed() -> None:
+    """Install the modal package if it is not already available and check authentication."""
-    Copies `examples/rl/task_app.py` and `examples/rl/deploy_task_app.sh` into CWD.
-    Creates a `.env` with placeholders if it does not exist.
-    """
+    # Check if modal is installed
+    modal_installed = False
     try:
-        # Ensure `modal` is installed for deployment flows
-        def _has_modal() -> bool:
-            try:
-                import importlib.util as _iu
-                return _iu.find_spec("modal") is not None
-            except Exception:
-                return False
+        import importlib.util as _iu
-        if not _has_modal():
-            print("modal not found; installing…")
-            # Prefer uv if available; otherwise fallback to pip
-            try:
-                if shutil.which("uv"):
-                    code, out = _popen_capture(["uv", "pip", "install", "modal>=1.1.4"])
-                else:
-                    code, out = _popen_capture([sys.executable, "-m", "pip", "install", "modal>=1.1.4"])
-                if code != 0:
-                    print(out)
-                    print("Failed to install modal; continuing may fail.")
-                else:
-                    print("modal installed successfully.")
-            except Exception as e:
-                print(f"modal install error: {e}")
-            # Re-check
-            if not _has_modal():
-                print("Warning: modal is still not importable after install attempt.")
-        else:
-            print("modal found")
-        here = os.getcwd()
-        demo_dir = os.path.join(here, "synth_demo")
-        os.makedirs(demo_dir, exist_ok=True)
-        # Paths inside synth_demo/
-        dst_task_py = os.path.join(demo_dir, "task_app.py")
-        dst_deploy = os.path.join(demo_dir, "deploy_task_app.sh")
-        env_path = os.path.join(demo_dir, ".env")
-        dst_cfg = os.path.join(demo_dir, "demo_config.toml")
-        # Copy packaged math modal task app into synth_demo/task_app.py
-        src_modal = os.path.abspath(os.path.join(os.path.dirname(__file__), "..", "demo_task_apps", "math", "modal_task_app.py"))
-        if not os.path.isfile(src_modal):
-            print("Init failed: packaged math modal task app not found.")
-            print(f"Looked for: {src_modal}")
-            return 1
-        if os.path.exists(dst_task_py) and not getattr(args, "force", False):
-            print(f"Refusing to overwrite existing file: {dst_task_py} (use --force)")
-            return 1
-        shutil.copy2(src_modal, dst_task_py)
-        # Create deploy script in synth_demo/
-        deploy_text = r"""#!/usr/bin/env bash
-set -euo pipefail
-HERE=$(cd "$(dirname "$0")" && pwd)
-APP="$HERE/task_app.py"
-if [ -f "$HERE/.env" ]; then
-  # shellcheck disable=SC2046
-  export $(grep -v '^#' "$HERE/.env" | xargs -I{} echo {})
-fi
-uv run modal deploy "$APP" | tee "$HERE/.last_deploy.log"
-URL=$(grep -Eo 'https://[^ ]+\.modal\.run' "$HERE/.last_deploy.log" | tail -1 || true)
-if [ -n "$URL" ]; then
-  if grep -q '^TASK_APP_BASE_URL=' "$HERE/.env" 2>/dev/null; then
-    sed -i.bak "s#^TASK_APP_BASE_URL=.*#TASK_APP_BASE_URL=$URL#" "$HERE/.env" || true
-  else
-    echo "TASK_APP_BASE_URL=$URL" >> "$HERE/.env"
-  fi
-  echo "Saved TASK_APP_BASE_URL to $HERE/.env"
-fi
-"""
-        _write_text(dst_deploy, deploy_text)
+        if _iu.find_spec("modal") is not None:
+            modal_installed = True
+    except Exception:
+        pass
+    # Install modal if needed
+    if not modal_installed:
+        print("modal not found; installing…")
+        try:
+            if shutil.which("uv"):
+                code, out = _popen_capture(["uv", "pip", "install", "modal>=1.1.4"])
+            else:
+                code, out = _popen_capture([sys.executable, "-m", "pip", "install", "modal>=1.1.4"])
+            if code != 0:
+                print(out)
+                print("Failed to install modal; continuing may fail.")
+                return
+            else:
+                print("✓ modal installed successfully")
+                modal_installed = True
+        except Exception as exc:
+            print(f"modal install error: {exc}")
+            return
+    # Verify modal is importable
+    if modal_installed:
         try:
-            st = os.stat(dst_deploy)
-            os.chmod(dst_deploy, st.st_mode | stat.S_IXUSR | stat.S_IXGRP | stat.S_IXOTH)
+            import importlib.util as _iu
+            if _iu.find_spec("modal") is None:
+                print("Warning: modal is still not importable after install attempt.")
+                return
         except Exception:
-            pass
+            print("Warning: unable to verify modal installation.")
+            return
+    # Check modal authentication status
+    auth_ok, auth_msg = demo_core.modal_auth_status()
+    if auth_ok:
+        print(f"✓ Modal authenticated: {auth_msg}")
+    else:
+        print("\n⚠️  Modal authentication required")
+        print(f"   Status: {auth_msg}")
+        print("\n   To authenticate Modal, run:")
+        print("     modal setup")
+        print("\n   Or set environment variables:")
+        print("     export MODAL_TOKEN_ID=your-token-id")
+        print("     export MODAL_TOKEN_SECRET=your-token-secret")
+        print("\n   You can deploy later after authenticating.\n")
+def init(template: str | None = None, dest: str | None = None, force: bool = False) -> int:
+    """Materialise a demo task app template into the current directory."""
+    templates = list(list_demo_templates())
+    if not templates:
+        print("No demo templates registered. Update synth_ai/demo_registry.py to add entries.")
+        return 1
+    selected: DemoTemplate | None = None
+    if template:
+        selected = get_demo_template(template)
+        if selected is None:
+            available = ", ".join(t.template_id for t in templates)
+            print(f"Unknown template '{template}'. Available: {available}")
+            return 1
+    else:
+        if force:
+            selected = templates[0]
+            print(
+                f"Using default template: {selected.name} ({selected.template_id}) "
+                f"(pass --template to choose another)"
+            )
+        else:
+            print("Select a demo template:" + "\n")
+            for idx, tpl in enumerate(templates, start=1):
+                print(f"  [{idx}] {tpl.name} ({tpl.template_id})")
+                print(f"      {tpl.description}")
+            try:
+                choice_raw = input(f"Enter choice [1-{len(templates)}] (default 1): ").strip() or "1"
+            except Exception:
+                choice_raw = "1"
+            if not choice_raw.isdigit():
+                print("Selection must be a number.")
+                return 1
+            choice_idx = int(choice_raw)
+            if not 1 <= choice_idx <= len(templates):
+                print("Selection out of range.")
+                return 1
+            selected = templates[choice_idx - 1]
+    assert selected is not None
+    default_subdir = selected.default_subdir or selected.template_id
+    # Check if default destination is already occupied and switch to local_demos/ if needed
+    if dest:
+        default_dest = Path(dest).expanduser().resolve()
+    else:
+        primary_dest = Path.cwd() / default_subdir
+        if primary_dest.exists() and any(primary_dest.iterdir()):
+            # Switch to local_demos/ automatically if primary location is occupied
+            default_dest = (Path.cwd() / "local_demos" / default_subdir).resolve()
+        else:
+            default_dest = primary_dest.resolve()
-        # Seed .env if not present
-        if not os.path.exists(env_path):
-            _write_text(env_path, "\n".join([
-                "# Required for task app auth to environment service",
-                "ENVIRONMENT_API_KEY=",
-                "",
-                "# Optional: for CLI job submission and proxying OpenAI models",
-                "SYNTH_API_KEY=",
-                "OPENAI_API_KEY=",
-                "",
-                "# Optional: set to 'prod' to use production names",
-                "ENVIRONMENT=",
-            ]) + "\n")
-        # Seed demo_config.toml from packaged default if not present (or overwrite with --force)
-        packaged_cfg = os.path.abspath(os.path.join(os.path.dirname(__file__), "..", "demo_task_apps", "math", "config.toml"))
+    if force:
+        dest_input = ""
+    else:
         try:
-            if os.path.isfile(packaged_cfg):
-                if not os.path.exists(dst_cfg) or getattr(args, "force", False):
-                    shutil.copy2(packaged_cfg, dst_cfg)
+            dest_input = input(f"Destination directory [{default_dest}]: ").strip()
         except Exception:
-            pass
+            dest_input = ""
+    destination = Path(dest_input).expanduser().resolve() if dest_input else default_dest
+    # Track whether we should skip individual file prompts (if we already cleared the directory)
+    directory_cleared = False
+    if destination.exists():
+        if destination.is_file():
+            print(f"Destination {destination} is a file. Provide a directory path.")
+            return 1
+        if any(destination.iterdir()):
+            if force:
+                response = "y"
+            else:
+                try:
+                    response = (
+                        input(f"Destination {destination} is not empty. Overwrite? [y/N]: ")
+                        .strip()
+                        .lower()
+                    )
+                except (EOFError, KeyboardInterrupt):
+                    print("\nCancelled.")
+                    return 1
+            if response not in ("y", "yes"):
+                print("Cancelled. Choose another directory or delete the existing one.")
+                return 1
+            # User agreed to overwrite - clear the entire directory including hidden files
+            print(f"Clearing {destination}...")
+            try:
+                # Remove all contents including hidden files (.env, .git, etc.)
+                shutil.rmtree(destination)
+            except Exception as e:
+                print(f"Error clearing directory: {e}")
+                print("Please manually remove the directory and try again.")
+                return 1
+            # Recreate empty directory
+            destination.mkdir(parents=True, exist_ok=True)
+            # Verify it's actually empty
+            if any(destination.iterdir()):
+                print(f"Warning: Directory {destination} still contains files after clearing.")
+                print("Some files may not have been removed. Please check manually.")
+                return 1
+            directory_cleared = True
+    else:
+        destination.mkdir(parents=True, exist_ok=True)
+    if selected.requires_modal:
+        _ensure_modal_installed()
+    try:
+        for spec in selected.iter_copy_specs():
+            src_path = spec.absolute_source()
+            if not src_path.exists():
+                print(f"Template source missing: {src_path}")
+                return 1
+            dest_path = (destination / spec.destination).resolve()
+            # Handle directory copying
+            if src_path.is_dir():
+                if dest_path.exists() and not directory_cleared:
+                    if force:
+                        response = "y"
+                    else:
+                        try:
+                            response = (
+                                input(f"Directory {dest_path.name} exists. Overwrite? [y/N]: ")
+                                .strip()
+                                .lower()
+                            )
+                        except (EOFError, KeyboardInterrupt):
+                            print("\nCancelled.")
+                            return 1
+                    if response not in ("y", "yes"):
+                        print(f"Skipping {dest_path.name}")
+                        continue
+                    shutil.rmtree(dest_path)
+                elif dest_path.exists() and directory_cleared:
+                    shutil.rmtree(dest_path)
+                shutil.copytree(src_path, dest_path)
+            else:
+                # Handle file copying
+                dest_path.parent.mkdir(parents=True, exist_ok=True)
+                if dest_path.exists() and not directory_cleared:
+                    if force:
+                        response = "y"
+                    else:
+                        try:
+                            response = (
+                                input(f"File {dest_path.name} exists. Overwrite? [y/N]: ")
+                                .strip()
+                                .lower()
+                            )
+                        except (EOFError, KeyboardInterrupt):
+                            print("\nCancelled.")
+                            return 1
+                    if response not in ("y", "yes"):
+                        print(f"Skipping {dest_path.name}")
+                        continue
+                shutil.copy2(src_path, dest_path)
+                if spec.make_executable:
+                    try:
+                        st = os.stat(dest_path)
+                        os.chmod(dest_path, st.st_mode | stat.S_IXUSR | stat.S_IXGRP | stat.S_IXOTH)
+                    except Exception:
+                        pass
-        print("Initialized Math Task App in synth_demo/:")
-        print(f"  - {dst_task_py}")
-        print(f"  - {dst_deploy}")
-        print(f"  - {env_path} (created if missing)")
-        if os.path.exists(dst_cfg):
-            print(f"  - {dst_cfg} (seeded)")
-        print("")
-        print("Next steps:")
-        print("  1) cd synth_demo && put your ENVIRONMENT_API_KEY in ./.env")
-        print("  2) Deploy to Modal:")
-        print("     uvx bash ./deploy_task_app.sh")
-        print("  3) From project root, run: uvx synth-ai run")
+        if selected.env_lines:
+            env_path = destination / ".env"
+            should_write = True
+            if env_path.exists() and not directory_cleared:
+                if force:
+                    response = "y"
+                else:
+                    try:
+                        response = input("File .env exists. Overwrite? [y/N]: ").strip().lower()
+                    except (EOFError, KeyboardInterrupt):
+                        print("\nCancelled.")
+                        return 1
+                should_write = response in ("y", "yes")
+            if should_write:
+                _write_text(env_path, "\n".join(selected.env_lines) + "\n")
+            elif not directory_cleared:
+                print("Skipping .env")
+        config_src = selected.config_source_path()
+        if config_src and config_src.exists():
+            cfg_dst = (destination / selected.config_destination).resolve()
+            should_copy = True
+            if cfg_dst.exists() and not directory_cleared:
+                if force:
+                    response = "y"
+                else:
+                    try:
+                        response = (
+                            input(f"File {cfg_dst.name} exists. Overwrite? [y/N]: ").strip().lower()
+                        )
+                    except (EOFError, KeyboardInterrupt):
+                        print("\nCancelled.")
+                        return 1
+                should_copy = response in ("y", "yes")
+            if should_copy:
+                cfg_dst.parent.mkdir(parents=True, exist_ok=True)
+                shutil.copy2(config_src, cfg_dst)
+            elif not directory_cleared:
+                print(f"Skipping {cfg_dst.name}")
+        if selected.post_copy is not None:
+            try:
+                selected.post_copy(destination)
+            except Exception as post_exc:
+                print(f"Post-processing failed: {post_exc}")
+                return 1
+        # Store demo directory for subsequent commands
+        demo_core.persist_demo_dir(str(destination))
+        # Store .env path if it was created
+        env_file = destination / ".env"
+        if env_file.exists():
+            demo_core.persist_env_file_path(str(env_file))
+        print(f"Demo template '{selected.name}' materialised at {destination}.")
+        print("Files created:")
+        for spec in selected.iter_copy_specs():
+            print(f"  - {spec.destination}")
+        if selected.env_lines:
+            print("  - .env")
+        if selected.config_source_path():
+            print(f"  - {selected.config_destination}")
+        print("\nDemo directory stored. Subsequent commands will use this directory automatically.")
+        print("Review the files, edit .env, and run any provided deploy scripts when ready.")
         return 0
-    except Exception as e:
-        print(f"Init error: {e}")
-        return 2
+    except KeyboardInterrupt:
+        print("Aborted")
+        return 1
+    except Exception as exc:
+        print(f"Init failed: {exc}")
+        return 1
-def _http(method: str, url: str, headers: Dict[str, str] | None = None, body: Dict[str, Any] | None = None) -> tuple[int, Dict[str, Any] | str]:
-    import urllib.request, urllib.error, json as _json, ssl
+def _http(
+    method: str, url: str, headers: dict[str, str] | None = None, body: dict[str, Any] | None = None
+) -> tuple[int, dict[str, Any] | str]:
+    import json as _json
+    import ssl
+    import urllib.error
+    import urllib.request
     data = None
     if body is not None:
         data = _json.dumps(body).encode("utf-8")
@@ -1119,10 +1418,23 @@ def _write_text(path: str, content: str) -> None:
 # Note: `prepare` command has been removed; configuration now prepares TOML
-def cmd_run(args: argparse.Namespace) -> int:
+def run(
+    config: str | None = None,
+    batch_size: int | None = None,
+    group_size: int | None = None,
+    model: str | None = None,
+    timeout: int = 600,
+    dry_run: bool = False,
+) -> int:
+    # Change to demo directory if stored
+    demo_dir = demo_core.load_demo_dir()
+    if demo_dir and os.path.isdir(demo_dir):
+        os.chdir(demo_dir)
+        print(f"Using demo directory: {demo_dir}")
     env = demo_core.load_env()
     cwd_env_path = os.path.join(os.getcwd(), ".env")
-    local_env = demo_core.load_dotenv_file(cwd_env_path)
+    demo_core.load_dotenv_file(cwd_env_path)
     synth_key = (env.synth_api_key or "").strip()
     if not synth_key:
@@ -1154,7 +1466,7 @@ def cmd_run(args: argparse.Namespace) -> int:
     import tomllib
     try:
-        cfg_path = _select_or_create_config(getattr(args, "config", None), env)
+        cfg_path = _select_or_create_config(config, env)
     except FileNotFoundError as exc:
         print(exc)
         return 1
@@ -1162,7 +1474,11 @@ def cmd_run(args: argparse.Namespace) -> int:
     # Detect monorepo launcher and delegate if available (aligns with run_clustered.sh which works)
     launcher = "/Users/joshpurtell/Documents/GitHub/monorepo/tests/applications/math/rl/start_math_clustered.py"
     if os.path.isfile(launcher):
-        backend_base = env.dev_backend_url[:-4] if env.dev_backend_url.endswith("/api") else env.dev_backend_url
+        backend_base = (
+            env.dev_backend_url[:-4]
+            if env.dev_backend_url.endswith("/api")
+            else env.dev_backend_url
+        )
         run_env = os.environ.copy()
         run_env["BACKEND_URL"] = backend_base
         run_env["SYNTH_API_KEY"] = env.synth_api_key
@@ -1172,12 +1488,12 @@ def cmd_run(args: argparse.Namespace) -> int:
         # Optional: TRAINER_START_URL passthrough if already set in environment
         run_env["TRAINER_START_URL"] = run_env.get("TRAINER_START_URL", "")
         # Forward convenience knobs
-        if args.batch_size is not None:
-            run_env["RL_BATCH_SIZE"] = str(int(args.batch_size))
-        if args.group_size is not None:
-            run_env["RL_GROUP_SIZE"] = str(int(args.group_size))
-        if args.model:
-            run_env["RL_MODEL"] = args.model
+        if batch_size is not None:
+            run_env["RL_BATCH_SIZE"] = str(int(batch_size))
+        if group_size is not None:
+            run_env["RL_GROUP_SIZE"] = str(int(group_size))
+        if model:
+            run_env["RL_MODEL"] = model
         cmd = ["uv", "run", "python", launcher]
         print(f"Launching monorepo clustered runner: {' '.join(cmd)}")
         code = _popen_stream(cmd, env=run_env)
@@ -1192,33 +1508,33 @@ def cmd_run(args: argparse.Namespace) -> int:
             ek = (env.env_api_key or "").strip()
             print("Hint: If backend responded 401, verify SYNTH_API_KEY for:", base_url)
             if sk:
-                print(f"  SYNTH_API_KEY len={len(sk)} last5={sk[-5:]}")
+                print(f"  {_key_preview(sk, 'SYNTH_API_KEY')}")
             if ek:
-                print(f"  ENVIRONMENT_API_KEY len={len(ek)} last5={ek[-5:]}")
-            print("Also ensure your Modal secret contains ENVIRONMENT_API_KEY and matches the task app.")
+                print(f"  {_key_preview(ek, 'ENVIRONMENT_API_KEY')}")
+            print(
+                "Ensure the ENVIRONMENT_API_KEY you deployed with matches the task app and remains exported."
+            )
         return code
     # Fallback: legacy jobs API flow
     with open(cfg_path, "rb") as fh:
         inline_cfg = tomllib.load(fh)
-    with open(cfg_path, "r") as fh2:
+    with open(cfg_path) as fh2:
         toml_text = fh2.read()
-    if args.batch_size is not None:
-        inline_cfg.setdefault("training", {})["batch_size"] = int(args.batch_size)
-    if args.group_size is not None:
-        inline_cfg.setdefault("training", {})["group_size"] = int(args.group_size)
-    model_name = args.model or (inline_cfg.get("model", {}) or {}).get("name", "Qwen/Qwen3-0.6B")
+    if batch_size is not None:
+        inline_cfg.setdefault("training", {})["batch_size"] = int(batch_size)
+    if group_size is not None:
+        inline_cfg.setdefault("training", {})["group_size"] = int(group_size)
+    model_name = model or (inline_cfg.get("model", {}) or {}).get("name", "Qwen/Qwen3-0.6B")
     api = env.dev_backend_url.rstrip("/") + ("" if env.dev_backend_url.endswith("/api") else "/api")
     # Print backend and key preview before request for clearer diagnostics
     try:
         sk = (env.synth_api_key or "").strip()
-        sk_len = len(sk)
-        sk_tail = sk[-5:] if sk_len >= 5 else sk
         print(f"[run] Backend API: {api}")
-        print(f"[run] Using SYNTH_API_KEY len={sk_len} last5={sk_tail}")
+        print(f"[run] {_key_preview(sk, 'SYNTH_API_KEY')}")
     except Exception:
         pass
-    data_fragment: Dict[str, Any] = {
+    data_fragment: dict[str, Any] = {
         "model": model_name,
         "endpoint_base_url": env.task_app_base_url,
         "config": inline_cfg,
@@ -1236,23 +1552,28 @@ def cmd_run(args: argparse.Namespace) -> int:
         if inline_cfg["compute"].get("gpu_type"):
             compute["gpu_type"] = str(inline_cfg["compute"]["gpu_type"]).upper()
         if inline_cfg["compute"].get("gpu_count"):
-            compute["gpu_count"] = int(inline_cfg["compute"]["gpu_count"])
+            compute["gpu_count"] = int(inline_cfg["compute"]["gpu_count"])
     if not compute:
         topo = inline_cfg.get("topology") or {}
         gshape = str(topo.get("gpu_type") or "")
         if ":" in gshape:
             t, c = gshape.split(":", 1)
             compute = {"gpu_type": t.upper(), "gpu_count": int(c)}
-    body: Dict[str, Any] = {
+    body: dict[str, Any] = {
         "job_type": "rl",
         "data": data_fragment,
     }
     if compute:
         body["compute"] = compute
-    code, js = _http("POST", api + "/rl/jobs", headers={
-        "Content-Type": "application/json",
-        "Authorization": f"Bearer {env.synth_api_key}",
-    }, body=body)
+    code, js = _http(
+        "POST",
+        api + "/rl/jobs",
+        headers={
+            "Content-Type": "application/json",
+            "Authorization": f"Bearer {env.synth_api_key}",
+        },
+        body=body,
+    )
     if code not in (200, 201) or not isinstance(js, dict):
         print("Job create failed:", code)
         print(f"Backend: {api}")
@@ -1264,15 +1585,77 @@ def cmd_run(args: argparse.Namespace) -> int:
         except Exception:
             print(str(js))
         print("Request body was:\n" + json.dumps(body, indent=2))
+        try:
+            auth_preview = _key_preview(env.synth_api_key or "", "SYNTH_API_KEY (auth)")
+            print(f"[run] {auth_preview}")
+        except Exception:
+            pass
+        try:
+            data_block = body.get("data") if isinstance(body, dict) else None
+            env_key_body = ""
+            if isinstance(data_block, dict):
+                env_key_body = str(data_block.get("environment_api_key") or "")
+            if env_key_body:
+                print(f"[run] {_key_preview(env_key_body, 'environment_api_key (body)')}")
+        except Exception:
+            pass
+        try:
+            current_env_key = env.env_api_key or ""
+            if current_env_key:
+                print(f"[run] {_key_preview(current_env_key, 'ENVIRONMENT_API_KEY (current)')}")
+        except Exception:
+            pass
+        if isinstance(js, dict):
+            detail = js.get("detail")
+            if isinstance(detail, dict):
+                try:
+                    sent_key = detail.get("sent_key")
+                    if isinstance(sent_key, str):
+                        print(
+                            f"[run] Backend detail.sent_key {_key_preview(sent_key, 'detail.sent_key')}"
+                        )
+                except Exception:
+                    pass
+                try:
+                    sent_keys = detail.get("sent_keys")
+                    if isinstance(sent_keys, list | tuple):
+                        previews = []
+                        for idx, val in enumerate(sent_keys):
+                            if isinstance(val, str):
+                                previews.append(_key_preview(val, f"detail.sent_keys[{idx}]"))
+                        if previews:
+                            joined = "; ".join(previews)
+                            print(f"[run] Backend detail.sent_keys previews: {joined}")
+                except Exception:
+                    pass
+                try:
+                    key_prefix = detail.get("sent_key_prefix")
+                    if isinstance(key_prefix, str):
+                        print(f"[run] Backend detail.sent_key_prefix={key_prefix}")
+                except Exception:
+                    pass
+                try:
+                    health_url = detail.get("health_url")
+                    if isinstance(health_url, str):
+                        print(f"[run] Backend detail.health_url={health_url}")
+                except Exception:
+                    pass
         # Extra hints for auth failures
         try:
             sk = (env.synth_api_key or "").strip()
-            if int(code) == 401 or (isinstance(js, dict) and any(isinstance(v, str) and "Invalid API key" in v for v in js.values())):
+            if int(code) == 401 or (
+                isinstance(js, dict)
+                and any(isinstance(v, str) and "Invalid API key" in v for v in js.values())
+            ):
                 base_url = env.dev_backend_url
-                print("Hint: HTTP 401 Unauthorized from backend. Verify SYNTH_API_KEY for:", base_url)
+                print(
+                    "Hint: HTTP 401 Unauthorized from backend. Verify SYNTH_API_KEY for:", base_url
+                )
                 if sk:
-                    print(f"  SYNTH_API_KEY len={len(sk)} last5={sk[-5:]}")
-                print("Also ensure your Modal secret contains a valid ENVIRONMENT_API_KEY.")
+                    print(f"  {_key_preview(sk, 'SYNTH_API_KEY')}")
+                print(
+                    "Ensure the ENVIRONMENT_API_KEY and OPENAI_API_KEY used for deployment remain valid."
+                )
         except Exception:
             pass
         return 2
@@ -1324,9 +1707,7 @@ def cmd_run(args: argparse.Namespace) -> int:
                     "rl.performance.metrics",
                 ):
                     print(f"[{seq}] {typ}: {msg}")
-        mc, mj = _http(
-            "GET", api + f"/learning/jobs/{job_id}/metrics?after_step=-1&limit=50"
-        )
+        mc, mj = _http("GET", api + f"/learning/jobs/{job_id}/metrics?after_step=-1&limit=50")
         if mc == 200 and isinstance(mj, dict):
             pts = mj.get("points") or []
             for p in pts:
@@ -1334,60 +1715,8 @@ def cmd_run(args: argparse.Namespace) -> int:
                 if name == "eval.reward_mean":
                     print(f"metric eval.reward_mean step={p.get('step')} value={p.get('value')}")
                     break
-        if time.time() - start_t > (args.timeout or 600):
+        if time.time() - start_t > (timeout or 600):
             print("Timeout waiting for terminal state.")
             break
         time.sleep(2)
     return 0
-def main(argv: list[str] | None = None) -> int:
-    p = argparse.ArgumentParser(prog="synth-ai")
-    sub = p.add_subparsers(dest="cmd")
-    def _add_parser(names: list[str], *, configure: Callable[[argparse.ArgumentParser], None]) -> None:
-        for name in names:
-            parser = sub.add_parser(name)
-            configure(parser)
-    _add_parser(["rl_demo.setup", "demo.setup"], configure=lambda parser: parser.set_defaults(func=cmd_setup))
-    def _init_opts(parser):
-        parser.add_argument("--force", action="store_true", help="Overwrite existing files in CWD")
-        parser.set_defaults(func=cmd_init)
-    _add_parser(["rl_demo.init", "demo.init"], configure=_init_opts)
-    # (prepare command removed)
-    def _deploy_opts(parser):
-        parser.add_argument("--local", action="store_true", help="Run local FastAPI instead of Modal deploy")
-        parser.add_argument("--app", type=str, default=None, help="Path to Modal app.py for uv run modal deploy")
-        parser.add_argument("--name", type=str, default="synth-math-demo", help="Modal app name")
-        parser.add_argument("--script", type=str, default=None, help="Path to deploy_task_app.sh (optional legacy)")
-        parser.set_defaults(func=cmd_deploy)
-    _add_parser(["rl_demo.deploy", "demo.deploy"], configure=_deploy_opts)
-    _add_parser(["rl_demo.configure", "demo.configure"], configure=lambda parser: parser.set_defaults(func=cmd_run))
-    def _run_opts(parser):
-        parser.add_argument("--config", type=str, default=None, help="Path to TOML config (skip prompt)")
-        parser.add_argument("--batch-size", type=int, default=None)
-        parser.add_argument("--group-size", type=int, default=None)
-        parser.add_argument("--model", type=str, default=None)
-        parser.add_argument("--timeout", type=int, default=600)
-        parser.add_argument("--dry-run", action="store_true", help="Print request body and exit")
-        parser.set_defaults(func=cmd_run)
-    _add_parser(["run", "rl_demo.run", "demo.run"], configure=_run_opts)
-    args = p.parse_args(argv)
-    if not hasattr(args, "func"):
-        p.print_help()
-        return 1
-    return int(args.func(args) or 0)
-if __name__ == "__main__":
-    sys.exit(main())

synth-ai 0.2.8.dev4__py3-none-any.whl → 0.2.23.dev3__py3-none-any.whl

synth-ai 0.2.8.dev4__py3-none-any.whl → 0.2.23.dev3__py3-none-any.whl