PyPI - synth-ai - Versions diffs - 0.2.9.dev0__py3-none-any.whl → 0.2.23.dev3__py3-none-any.whl - Mend

synth-ai 0.2.9.dev0__py3-none-any.whl → 0.2.23.dev3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (890) hide show

examples/README.md +1 -0
examples/__init__.py +16 -0
examples/analyze_semantic_words.sh +17 -0
examples/baseline/banking77_baseline.py +243 -0
examples/baseline/banking77_pipeline_baseline.py +294 -0
examples/baseline/crafter_baseline.py +407 -0
examples/baseline/pokemon_red_baseline.py +326 -0
examples/baseline/simple_baseline.py +56 -0
examples/baseline/warming_up_to_rl_baseline.py +239 -0
examples/blog_posts/gepa/README.md +355 -0
examples/blog_posts/gepa/configs/banking77_gepa_local.toml +95 -0
examples/blog_posts/gepa/configs/banking77_gepa_test.toml +80 -0
examples/blog_posts/gepa/configs/banking77_mipro_local.toml +50 -0
examples/blog_posts/gepa/configs/banking77_pipeline_gepa_local.toml +101 -0
examples/blog_posts/gepa/configs/banking77_pipeline_gepa_test.toml +96 -0
examples/blog_posts/gepa/configs/hotpotqa_gepa_local.toml +57 -0
examples/blog_posts/gepa/configs/hotpotqa_gepa_qwen.toml +35 -0
examples/blog_posts/gepa/configs/hotpotqa_mipro_local.toml +51 -0
examples/blog_posts/gepa/configs/hover_gepa_local.toml +57 -0
examples/blog_posts/gepa/configs/hover_gepa_qwen.toml +35 -0
examples/blog_posts/gepa/configs/hover_mipro_local.toml +51 -0
examples/blog_posts/gepa/configs/ifbench_gepa_local.toml +57 -0
examples/blog_posts/gepa/configs/ifbench_gepa_qwen.toml +35 -0
examples/blog_posts/gepa/configs/ifbench_mipro_local.toml +51 -0
examples/blog_posts/gepa/configs/pupa_gepa_local.toml +58 -0
examples/blog_posts/gepa/configs/pupa_mipro_local.toml +52 -0
examples/blog_posts/gepa/deploy_banking77_task_app.sh +54 -0
examples/blog_posts/gepa/gepa_baseline.py +204 -0
examples/blog_posts/gepa/query_prompts_example.py +97 -0
examples/blog_posts/gepa/run_gepa_banking77.sh +112 -0
examples/blog_posts/gepa/run_gepa_banking77_pipeline.sh +163 -0
examples/blog_posts/gepa/task_apps.py +105 -0
examples/blog_posts/gepa/test_gepa_local.sh +67 -0
examples/blog_posts/gepa/verify_banking77_setup.sh +123 -0
examples/blog_posts/mipro/README.md +415 -0
examples/blog_posts/mipro/configs/banking77_mipro_local.toml +91 -0
examples/blog_posts/mipro/configs/banking77_mipro_test.toml +87 -0
examples/blog_posts/mipro/configs/banking77_pipeline_mipro_gemini_flash_lite_local.toml +98 -0
examples/blog_posts/mipro/configs/banking77_pipeline_mipro_gpt41mini_local.toml +96 -0
examples/blog_posts/mipro/configs/banking77_pipeline_mipro_local.toml +94 -0
examples/blog_posts/mipro/configs/banking77_pipeline_mipro_test.toml +170 -0
examples/blog_posts/mipro/deploy_banking77_pipeline_task_app.sh +59 -0
examples/blog_posts/mipro/deploy_banking77_task_app.sh +41 -0
examples/blog_posts/mipro/multi_step.md +79 -0
examples/blog_posts/mipro/run_mipro_banking77.sh +191 -0
examples/blog_posts/mipro/run_mipro_banking77_pipeline.sh +171 -0
examples/blog_posts/mipro/run_mipro_banking77_pipeline_gemini_flash_lite.sh +177 -0
examples/blog_posts/mipro/run_mipro_banking77_pipeline_gpt41mini.sh +173 -0
examples/blog_posts/mipro/verify_banking77_setup.sh +117 -0
examples/blog_posts/pokemon_vl/README.md +98 -0
examples/blog_posts/pokemon_vl/configs/eval_gpt5nano.toml +26 -0
examples/blog_posts/pokemon_vl/configs/eval_qwen3_vl.toml +27 -0
examples/blog_posts/pokemon_vl/configs/eval_rl_final.toml +24 -0
examples/blog_posts/pokemon_vl/configs/filter_high_reward.toml +10 -0
examples/blog_posts/pokemon_vl/configs/train_rl_from_sft.toml +43 -0
examples/blog_posts/pokemon_vl/configs/train_sft_qwen4b_vl.toml +40 -0
examples/blog_posts/pokemon_vl/extract_images.py +239 -0
examples/blog_posts/pokemon_vl/pokemon_vl_baseline.py +326 -0
examples/blog_posts/pokemon_vl/run_eval_extract_images.py +209 -0
examples/blog_posts/pokemon_vl/run_qwen_eval_extract_images.py +212 -0
examples/blog_posts/pokemon_vl/text_box_analysis.md +106 -0
examples/blog_posts/warming_up_to_rl/ARCHITECTURE.md +195 -0
examples/blog_posts/warming_up_to_rl/FINAL_TEST_RESULTS.md +127 -0
examples/blog_posts/warming_up_to_rl/INFERENCE_SUCCESS.md +132 -0
examples/blog_posts/warming_up_to_rl/README.md +158 -0
examples/blog_posts/warming_up_to_rl/SMOKE_TESTING.md +164 -0
examples/blog_posts/warming_up_to_rl/SMOKE_TEST_COMPLETE.md +253 -0
examples/blog_posts/warming_up_to_rl/configs/eval_baseline_qwen32b_10x20.toml +25 -0
examples/blog_posts/warming_up_to_rl/configs/eval_ft_qwen4b.toml +25 -0
examples/blog_posts/warming_up_to_rl/configs/eval_ft_qwen4b_10x20.toml +26 -0
examples/blog_posts/warming_up_to_rl/configs/eval_groq_qwen32b.toml +25 -0
examples/blog_posts/warming_up_to_rl/configs/eval_openai_gpt_oss_120b.toml +29 -0
examples/blog_posts/warming_up_to_rl/configs/filter_high_reward_dataset.toml +10 -0
examples/blog_posts/warming_up_to_rl/configs/smoke_test.toml +75 -0
examples/blog_posts/warming_up_to_rl/configs/train_rl_from_sft.toml +91 -0
examples/blog_posts/warming_up_to_rl/configs/train_sft_qwen4b.toml +40 -0
examples/blog_posts/warming_up_to_rl/warming_up_to_rl_baseline.py +187 -0
examples/crafter_debug_render.py +186 -0
examples/dev/qwen3_32b_qlora_4xh100.toml +45 -0
examples/gepa/banking77_pipeline_gepa.toml +96 -0
examples/gepa/multi_stage_gepa_example.toml +84 -0
examples/gepa/run_gepa_banking77_pipeline.sh +157 -0
examples/multi_step/SFT_README.md +147 -0
examples/multi_step/configs/README_verilog_rl.md +77 -0
examples/multi_step/configs/VERILOG_REWARDS.md +103 -0
examples/multi_step/configs/VERILOG_RL_CHECKLIST.md +196 -0
examples/multi_step/configs/crafter_eval_synth_qwen4b.toml +35 -0
examples/multi_step/configs/crafter_eval_text_only_groq_qwen32b.toml +36 -0
examples/multi_step/configs/crafter_rl_outcome.toml +75 -0
examples/multi_step/configs/crafter_rl_stepwise_hosted_judge.toml +145 -0
examples/multi_step/configs/crafter_rl_stepwise_shaped.toml +84 -0
examples/multi_step/configs/crafter_rl_stepwise_simple.toml +79 -0
examples/multi_step/configs/crafter_rl_stepwise_simple_NEW_FORMAT.toml +105 -0
examples/multi_step/configs/crafter_sft_qwen30b_lora.toml +62 -0
examples/multi_step/configs/crafter_synth_backend.md +40 -0
examples/multi_step/configs/verilog_eval_groq_qwen32b.toml +31 -0
examples/multi_step/configs/verilog_eval_synth_qwen8b.toml +33 -0
examples/multi_step/configs/verilog_rl_lora.toml +147 -0
examples/multi_step/convert_traces_to_sft.py +84 -0
examples/multi_step/crafter_rl_lora.md +70 -0
examples/multi_step/judges/crafter_backend_judge.py +220 -0
examples/multi_step/judges/verilog_backend_judge.py +234 -0
examples/multi_step/readme.md +48 -0
examples/multi_step/run_sft_qwen30b.sh +45 -0
examples/multi_step/sse_metrics_streaming_notes.md +357 -0
examples/multi_step/task_app_config_notes.md +494 -0
examples/multi_step/verilog_rl_lora.md +218 -0
examples/qwen_coder/README.md +102 -0
examples/qwen_coder/_shared.py +113 -0
examples/qwen_coder/configs/coder_lora_30b.toml +60 -0
examples/qwen_coder/configs/coder_lora_4b.toml +61 -0
examples/qwen_coder/configs/coder_lora_small.toml +57 -0
examples/qwen_coder/generate_dataset.py +98 -0
examples/qwen_coder/infer_ft_smoke.py +65 -0
examples/qwen_coder/infer_prod_proxy.py +73 -0
examples/qwen_coder/infer_via_synth.py +87 -0
examples/qwen_coder/scripts/infer_coder.sh +19 -0
examples/qwen_coder/scripts/train_coder_30b.sh +22 -0
examples/qwen_coder/sft_full_17b.py +103 -0
examples/qwen_coder/sft_lora_30b.py +110 -0
examples/qwen_coder/subset_jsonl.py +39 -0
examples/qwen_coder/todos.md +38 -0
examples/qwen_coder/validate_jsonl.py +60 -0
examples/qwen_vl/BUGS_AND_FIXES.md +232 -0
examples/qwen_vl/IMAGE_VALIDATION_COMPLETE.md +271 -0
examples/qwen_vl/IMAGE_VALIDATION_SUMMARY.md +260 -0
examples/qwen_vl/INFERENCE_SFT_TESTS.md +412 -0
examples/qwen_vl/NEXT_STEPS_2B.md +325 -0
examples/qwen_vl/QUICKSTART.md +327 -0
examples/qwen_vl/QUICKSTART_RL_VISION.md +110 -0
examples/qwen_vl/README.md +152 -0
examples/qwen_vl/RL_VISION_COMPLETE.md +475 -0
examples/qwen_vl/RL_VISION_TESTING.md +333 -0
examples/qwen_vl/SDK_VISION_INTEGRATION.md +328 -0
examples/qwen_vl/SETUP_COMPLETE.md +274 -0
examples/qwen_vl/VISION_TESTS_COMPLETE.md +489 -0
examples/qwen_vl/VLM_PIPELINE_COMPLETE.md +242 -0
examples/qwen_vl/__init__.py +2 -0
examples/qwen_vl/collect_data_via_cli.md +415 -0
examples/qwen_vl/collect_vision_traces.py +368 -0
examples/qwen_vl/configs/crafter_rl_vision_qwen3vl4b.toml +110 -0
examples/qwen_vl/configs/crafter_vlm_sft_example.toml +59 -0
examples/qwen_vl/configs/eval_gpt4o_mini_vision.toml +26 -0
examples/qwen_vl/configs/eval_gpt4o_vision_proper.toml +29 -0
examples/qwen_vl/configs/eval_gpt5nano_vision.toml +26 -0
examples/qwen_vl/configs/eval_qwen3vl_vision.toml +26 -0
examples/qwen_vl/configs/filter_qwen3vl_sft.toml +49 -0
examples/qwen_vl/configs/filter_vision_sft.toml +52 -0
examples/qwen_vl/configs/filter_vision_test.toml +8 -0
examples/qwen_vl/configs/sft_qwen3_vl_2b_test.toml +54 -0
examples/qwen_vl/crafter_gpt5nano_agent.py +308 -0
examples/qwen_vl/crafter_qwen_vl_agent.py +300 -0
examples/qwen_vl/run_vision_comparison.sh +61 -0
examples/qwen_vl/run_vision_sft_pipeline.sh +175 -0
examples/qwen_vl/test_image_validation.py +201 -0
examples/qwen_vl/test_sft_vision_data.py +110 -0
examples/rl/README.md +169 -0
examples/rl/configs/eval_base_qwen.toml +17 -0
examples/rl/configs/eval_rl_qwen.toml +13 -0
examples/rl/configs/rl_from_base_qwen.toml +62 -0
examples/rl/configs/rl_from_base_qwen17.toml +80 -0
examples/rl/configs/rl_from_ft_qwen.toml +37 -0
examples/rl/download_dataset.py +80 -0
examples/rl/run_eval.py +436 -0
examples/rl/run_rl_and_save.py +111 -0
examples/rl/task_app/README.md +21 -0
{synth_ai/task/apps → examples/rl/task_app}/math_single_step.py +188 -50
examples/rl/task_app/math_task_app.py +111 -0
examples/run_crafter_demo.sh +10 -0
examples/sdk_prompt_learning_example.py +55 -0
examples/sft/README.md +139 -0
examples/sft/configs/crafter_fft_qwen0p6b.toml +49 -0
examples/sft/configs/crafter_lora_qwen0p6b.toml +49 -0
examples/sft/evaluate.py +117 -0
examples/sft/export_dataset.py +120 -0
examples/sft/generate_traces.py +164 -0
examples/swe/__init__.py +12 -0
examples/swe/task_app/README.md +135 -0
examples/swe/task_app/__init__.py +2 -0
examples/swe/task_app/grpo_swe_mini.py +604 -0
examples/swe/task_app/grpo_swe_mini_task_app.py +124 -0
examples/swe/task_app/hosted/README.md +173 -0
examples/swe/task_app/hosted/__init__.py +5 -0
examples/swe/task_app/hosted/branching.py +143 -0
examples/swe/task_app/hosted/environment_routes.py +1289 -0
examples/swe/task_app/hosted/envs/__init__.py +1 -0
examples/swe/task_app/hosted/envs/crafter/__init__.py +6 -0
examples/swe/task_app/hosted/envs/crafter/app.py +1 -0
examples/swe/task_app/hosted/envs/crafter/environment.py +522 -0
examples/swe/task_app/hosted/envs/crafter/policy.py +478 -0
examples/swe/task_app/hosted/envs/crafter/react_agent.py +108 -0
examples/swe/task_app/hosted/envs/crafter/shared.py +305 -0
examples/swe/task_app/hosted/envs/crafter/tools.py +47 -0
examples/swe/task_app/hosted/envs/mini_swe/__init__.py +8 -0
examples/swe/task_app/hosted/envs/mini_swe/environment.py +1191 -0
examples/swe/task_app/hosted/envs/mini_swe/policy.py +355 -0
examples/swe/task_app/hosted/envs/mini_swe/shared.py +83 -0
examples/swe/task_app/hosted/envs/mini_swe/tools.py +96 -0
examples/swe/task_app/hosted/hosted_app.py +204 -0
examples/swe/task_app/hosted/inference/__init__.py +5 -0
examples/swe/task_app/hosted/inference/openai_client.py +584 -0
examples/swe/task_app/hosted/main.py +100 -0
examples/swe/task_app/hosted/policy_routes.py +1094 -0
examples/swe/task_app/hosted/registry.py +195 -0
examples/swe/task_app/hosted/rollout.py +1905 -0
examples/swe/task_app/hosted/storage/__init__.py +5 -0
examples/swe/task_app/hosted/storage/volume.py +211 -0
examples/swe/task_app/hosted/test_agents.py +161 -0
examples/swe/task_app/hosted/test_service.py +136 -0
examples/swe/task_app/hosted/utils.py +62 -0
examples/swe/task_app/morph_backend.py +178 -0
examples/task_apps/IMAGE_ONLY_EVAL_QUICKSTART.md +258 -0
examples/task_apps/TESTING.md +275 -0
examples/task_apps/banking77/__init__.py +6 -0
examples/task_apps/banking77/banking77_task_app.py +912 -0
examples/task_apps/banking77/deploy_wrapper.py +46 -0
examples/task_apps/banking77_pipeline/__init__.py +6 -0
examples/task_apps/banking77_pipeline/banking77_pipeline_task_app.py +489 -0
examples/task_apps/banking77_pipeline/deploy_wrapper.py +50 -0
examples/task_apps/crafter/CREATE_SFT_DATASET.md +286 -0
examples/task_apps/crafter/EVAL_IMAGE_ONLY_RESULTS.md +152 -0
examples/task_apps/crafter/FILTER_COMMAND_STATUS.md +187 -0
examples/task_apps/crafter/FILTER_COMMAND_SUCCESS.md +281 -0
examples/task_apps/crafter/QUERY_EXAMPLES.md +203 -0
examples/task_apps/crafter/README_IMAGE_ONLY_EVAL.md +316 -0
examples/task_apps/crafter/eval_image_only_gpt4o.toml +28 -0
examples/task_apps/crafter/eval_text_only_groq_llama.toml +36 -0
examples/task_apps/crafter/filter_sft_dataset.toml +16 -0
examples/task_apps/crafter/task_app/README.md +42 -0
examples/task_apps/crafter/task_app/__init__.py +5 -0
examples/task_apps/crafter/task_app/grpo_crafter.py +1055 -0
examples/task_apps/crafter/task_app/grpo_crafter_task_app.py +146 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/README.md +173 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/__init__.py +5 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/branching.py +143 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/environment_routes.py +1226 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/__init__.py +1 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/crafter/__init__.py +6 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/crafter/app.py +1 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/crafter/environment.py +532 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/crafter/policy.py +583 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/crafter/react_agent.py +122 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/crafter/shared.py +305 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/envs/crafter/tools.py +47 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/hosted_app.py +253 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/inference/__init__.py +5 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/inference/openai_client.py +999 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/main.py +100 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/policy_routes.py +1252 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/registry.py +195 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/rollout.py +2233 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/storage/__init__.py +5 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/storage/volume.py +211 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/test_agents.py +161 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/test_service.py +136 -0
examples/task_apps/crafter/task_app/synth_envs_hosted/utils.py +411 -0
examples/task_apps/dev/pokemon_emerald/__init__.py +2 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/README.md +811 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/agent/__init__.py +120 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/agent/action.py +160 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/agent/memory.py +155 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/agent/perception.py +69 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/agent/planning.py +96 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/agent/simple.py +1502 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/agent/system_prompt.py +4 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/grab_map.py +68 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/manual.py +216 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/pokemon_env/__init__.py +35 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/pokemon_env/emerald_utils.py +631 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/pokemon_env/emulator.py +1544 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/pokemon_env/enums.py +1428 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/pokemon_env/memory_reader.py +4848 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/pokemon_env/types.py +41 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/pokemon_env/utils.py +298 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/pyproject.toml +95 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/run.py +204 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/server/app.py +2152 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/server/client.py +429 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/server/frame_server.py +155 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/README.md +78 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/run_tests.py +122 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_agent_direct.py +76 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_agent_prompts.py +413 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_battle_state_formatting.py +204 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_dialogue_detection.py +133 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_dialogue_detection_comprehensive.py +229 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_direct_agent_emulator.py +300 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_fps_adjustment_pytest.py +205 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_house_to_outside_direct.py +200 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_house_to_outside_transition.py +284 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_map_ground_truth_comparison.py +468 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_memory_map.py +575 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_server_map_validation.py +311 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests/test_torchic_state.py +259 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/anticheat.py +372 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/checkpoint.py +296 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/error_handler.py +275 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/get_local_ip.py +22 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/helpers.py +44 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/llm_logger.py +514 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/map_formatter.py +415 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/map_stitcher.py +1763 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/map_stitcher_singleton.py +33 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/map_trimmer.py +106 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/map_visualizer.py +334 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/ocr_dialogue.py +1020 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/recording.py +188 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/state_formatter.py +1481 -0
examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/vlm.py +862 -0
examples/task_apps/dev/pokemon_emerald/modal_app.py +114 -0
examples/task_apps/dev/pokemon_emerald/task_app/README.md +81 -0
examples/task_apps/dev/pokemon_emerald/task_app/__init__.py +6 -0
examples/task_apps/dev/pokemon_emerald/task_app/pokemon_emerald.py +685 -0
examples/task_apps/enron/__init__.py +2 -0
examples/task_apps/enron/eval_groq_qwen32.toml +16 -0
examples/task_apps/enron/filter_sft.toml +5 -0
examples/task_apps/enron/task_app/README.md +14 -0
examples/task_apps/enron/task_app/__init__.py +1 -0
examples/task_apps/enron/task_app/grpo_enron.py +906 -0
examples/task_apps/enron/task_app/grpo_enron_task_app.py +146 -0
examples/task_apps/enron/tests/__init__.py +4 -0
examples/task_apps/enron/tests/conftest.py +115 -0
examples/task_apps/enron/tests/integration/__init__.py +4 -0
examples/task_apps/enron/tests/integration/test_enron_eval.py +179 -0
examples/task_apps/enron/tests/integration/test_enron_rollout.py +135 -0
examples/task_apps/enron/tests/unit/__init__.py +4 -0
examples/task_apps/enron/tests/unit/test_enron_environment.py +126 -0
examples/task_apps/gepa_benchmarks/__init__.py +7 -0
examples/task_apps/gepa_benchmarks/common.py +260 -0
examples/task_apps/gepa_benchmarks/hotpotqa_task_app.py +507 -0
examples/task_apps/gepa_benchmarks/hover_task_app.py +436 -0
examples/task_apps/gepa_benchmarks/ifbench_task_app.py +563 -0
examples/task_apps/gepa_benchmarks/pupa_task_app.py +460 -0
examples/task_apps/math/README.md +21 -0
examples/task_apps/math/math_single_step.py +1000 -0
examples/task_apps/math/math_task_app.py +115 -0
examples/task_apps/pokemon_battle/__init__.py +2 -0
examples/task_apps/pokemon_battle/modal_app.py +104 -0
examples/task_apps/pokemon_battle/task_app/README.md +68 -0
examples/task_apps/pokemon_battle/task_app/__init__.py +6 -0
examples/task_apps/pokemon_battle/task_app/pokemon_showdown.py +932 -0
examples/task_apps/pokemon_red/EVAL_IMAGE_ONLY_COMPLETE.md +283 -0
examples/task_apps/pokemon_red/EVAL_IMAGE_ONLY_STATUS.md +155 -0
examples/task_apps/pokemon_red/README.md +356 -0
examples/task_apps/pokemon_red/README_IMAGE_ONLY_EVAL.md +428 -0
examples/task_apps/pokemon_red/__init__.py +3 -0
examples/task_apps/pokemon_red/eval_image_only_gpt4o.toml +30 -0
examples/task_apps/pokemon_red/eval_pokemon_red_policy.py +224 -0
examples/task_apps/pokemon_red/pallet_town_rl_config.toml +75 -0
examples/task_apps/pokemon_red/task_app.py +1048 -0
examples/task_apps/pokemon_red/test_pallet_town_rewards.py +193 -0
examples/task_apps/sokoban/README.md +306 -0
examples/task_apps/sokoban/__init__.py +3 -0
examples/task_apps/sokoban/eval_groq_qwen32.toml +16 -0
examples/task_apps/sokoban/eval_openai_gpt5.toml +16 -0
examples/task_apps/sokoban/filter_sft.toml +5 -0
examples/task_apps/sokoban/task_app.py +1058 -0
examples/task_apps/sokoban/tests/__init__.py +4 -0
examples/task_apps/sokoban/tests/conftest.py +113 -0
examples/task_apps/sokoban/tests/integration/__init__.py +4 -0
examples/task_apps/sokoban/tests/integration/test_sokoban_eval.py +57 -0
examples/task_apps/sokoban/tests/integration/test_sokoban_rollout.py +198 -0
examples/task_apps/sokoban/tests/unit/__init__.py +4 -0
examples/task_apps/sokoban/tests/unit/test_sokoban_environment.py +114 -0
examples/task_apps/verilog/__init__.py +1 -0
examples/task_apps/verilog/eval_groq_qwen32b.toml +22 -0
examples/task_apps/verilog/filter_sft.toml +5 -0
examples/task_apps/verilog/task_app/README.md +12 -0
examples/task_apps/verilog/task_app/__init__.py +1 -0
examples/task_apps/verilog/task_app/grpo_verilog.py +1166 -0
examples/task_apps/verilog/task_app/grpo_verilog_task_app.py +145 -0
examples/task_apps/verilog/tests/__init__.py +4 -0
examples/task_apps/verilog/tests/conftest.py +115 -0
examples/task_apps/verilog/tests/integration/__init__.py +4 -0
examples/task_apps/verilog/tests/integration/test_verilog_eval.py +181 -0
examples/task_apps/verilog/tests/integration/test_verilog_rollout.py +55 -0
examples/task_apps/verilog/tests/unit/__init__.py +4 -0
examples/task_apps/verilog/tests/unit/test_verilog_scoring.py +118 -0
examples/tunnel_gepa_banking77/README.md +106 -0
examples/tunnel_gepa_banking77/banking77_gepa_tunnel.toml +95 -0
examples/tunnel_gepa_banking77/keep_tunnel_running.py +60 -0
examples/tunnel_gepa_banking77/run_gepa_with_tunnel.sh +226 -0
examples/vlm/PROPOSAL.md +53 -0
examples/vlm/README.md +68 -0
examples/vlm/configs/crafter_vlm_gpt4o.toml +49 -0
examples/vlm/crafter_image_only_agent.py +207 -0
examples/vlm/crafter_openai_vlm_agent.py +275 -0
examples/vlm/filter_image_rows.py +63 -0
examples/vlm/run_crafter_vlm_benchmark.py +316 -0
examples/warming_up_to_rl/_utils.py +92 -0
examples/warming_up_to_rl/analyze_trace_db.py +422 -0
examples/warming_up_to_rl/configs/crafter_fft.toml +53 -0
examples/warming_up_to_rl/configs/crafter_fft_4b.toml +54 -0
examples/warming_up_to_rl/configs/eval_fft_qwen4b.toml +22 -0
examples/warming_up_to_rl/configs/eval_groq_qwen32b.toml +15 -0
examples/warming_up_to_rl/configs/eval_modal_qwen4b.toml +24 -0
examples/warming_up_to_rl/configs/eval_stepwise_complex.toml +35 -0
examples/warming_up_to_rl/configs/eval_stepwise_consistent.toml +26 -0
examples/warming_up_to_rl/configs/eval_stepwise_per_achievement.toml +36 -0
examples/warming_up_to_rl/configs/eval_stepwise_simple.toml +32 -0
examples/warming_up_to_rl/configs/rl_from_base_qwen4b.toml +85 -0
examples/warming_up_to_rl/configs/rl_from_ft.toml +58 -0
examples/warming_up_to_rl/export_trace_sft.py +837 -0
examples/warming_up_to_rl/groq_test.py +97 -0
examples/warming_up_to_rl/manage_secrets.py +131 -0
examples/warming_up_to_rl/old/event_rewards.md +234 -0
examples/warming_up_to_rl/old/notes.md +73 -0
examples/warming_up_to_rl/readme.md +110 -0
examples/warming_up_to_rl/run_eval.py +736 -0
examples/warming_up_to_rl/run_fft_and_save.py +380 -0
examples/warming_up_to_rl/run_local_rollout.py +239 -0
examples/warming_up_to_rl/run_local_rollout_modal.py +248 -0
examples/warming_up_to_rl/run_local_rollout_parallel.py +405 -0
examples/warming_up_to_rl/run_local_rollout_traced.py +477 -0
examples/warming_up_to_rl/run_rl_and_save.py +124 -0
examples/warming_up_to_rl/run_rollout_remote.py +156 -0
examples/warming_up_to_rl/task_app/README.md +42 -0
examples/warming_up_to_rl/task_app/grpo_crafter.py +876 -0
examples/warming_up_to_rl/task_app/grpo_crafter_task_app.py +135 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/README.md +173 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/__init__.py +5 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/branching.py +143 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/environment_routes.py +1226 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/__init__.py +1 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/__init__.py +6 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/app.py +1 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/environment.py +522 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/policy.py +454 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/react_agent.py +108 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/shared.py +305 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/envs/crafter/tools.py +47 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/hosted_app.py +253 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/__init__.py +5 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/inference/openai_client.py +729 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/main.py +100 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/policy_routes.py +1114 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/registry.py +195 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/rollout.py +1891 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/storage/__init__.py +5 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/storage/volume.py +211 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/test_agents.py +161 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/test_service.py +137 -0
examples/warming_up_to_rl/task_app/synth_envs_hosted/utils.py +129 -0
examples/workflows/math_rl/configs/eval_base_qwen.toml +15 -0
examples/workflows/math_rl/configs/eval_rl_qwen.toml +11 -0
examples/workflows/math_rl/configs/rl_from_base_qwen.toml +62 -0
examples/workflows/math_rl/configs/rl_from_base_qwen17.toml +80 -0
examples/workflows/math_rl/configs/rl_from_ft_qwen.toml +35 -0
examples/workflows/math_rl/download_dataset.py +80 -0
examples/workflows/math_rl/run_eval.py +436 -0
examples/workflows/math_rl/run_rl_and_save.py +111 -0
synth_ai/__init__.py +47 -23
synth_ai/_utils/__init__.py +47 -0
synth_ai/_utils/base_url.py +10 -0
synth_ai/_utils/http.py +10 -0
synth_ai/_utils/prompts.py +10 -0
synth_ai/_utils/task_app_state.py +12 -0
synth_ai/_utils/user_config.py +10 -0
synth_ai/api/models/supported.py +514 -0
synth_ai/api/train/__init__.py +60 -2
synth_ai/api/train/builders.py +347 -39
synth_ai/api/train/cli.py +895 -160
synth_ai/api/train/config_finder.py +103 -25
synth_ai/api/train/configs/__init__.py +65 -0
synth_ai/api/train/configs/prompt_learning.py +496 -0
synth_ai/api/train/configs/rl.py +188 -0
synth_ai/api/train/configs/sft.py +99 -0
synth_ai/api/train/configs/shared.py +81 -0
synth_ai/api/train/env_resolver.py +70 -20
synth_ai/api/train/pollers.py +29 -4
synth_ai/api/train/prompt_learning.py +425 -0
synth_ai/api/train/sft.py +390 -0
synth_ai/api/train/supported_algos.py +147 -0
synth_ai/api/train/task_app.py +6 -4
synth_ai/api/train/utils.py +64 -52
synth_ai/api/train/validators.py +1117 -0
synth_ai/api/tunnel.py +49 -0
synth_ai/auth/credentials.py +94 -0
synth_ai/baseline/__init__.py +25 -0
synth_ai/baseline/config.py +209 -0
synth_ai/baseline/discovery.py +214 -0
synth_ai/baseline/execution.py +146 -0
synth_ai/cfgs.py +227 -0
synth_ai/cli/__init__.py +85 -63
synth_ai/cli/_modal_wrapper.py +31 -0
synth_ai/cli/_storage.py +20 -0
synth_ai/cli/_typer_patch.py +47 -0
synth_ai/cli/_validate_task_app.py +29 -0
synth_ai/cli/balance.py +16 -4
synth_ai/cli/calc.py +36 -21
synth_ai/cli/claude.py +70 -0
synth_ai/cli/codex.py +267 -0
synth_ai/cli/commands/__init__.py +18 -0
synth_ai/cli/commands/baseline/__init__.py +12 -0
synth_ai/cli/commands/baseline/core.py +637 -0
synth_ai/cli/commands/baseline/list.py +93 -0
synth_ai/cli/commands/demo/__init__.py +6 -0
synth_ai/cli/commands/demo/core.py +163 -0
synth_ai/cli/commands/eval/__init__.py +19 -0
synth_ai/cli/commands/eval/core.py +1112 -0
synth_ai/cli/commands/eval/errors.py +81 -0
synth_ai/cli/commands/eval/validation.py +133 -0
synth_ai/cli/commands/filter/__init__.py +12 -0
synth_ai/cli/commands/filter/core.py +424 -0
synth_ai/cli/commands/filter/errors.py +55 -0
synth_ai/cli/commands/filter/validation.py +77 -0
synth_ai/cli/commands/help/__init__.py +185 -0
synth_ai/cli/commands/help/core.py +72 -0
synth_ai/cli/commands/smoke/__init__.py +7 -0
synth_ai/cli/commands/smoke/core.py +1437 -0
synth_ai/cli/commands/status/__init__.py +66 -0
synth_ai/cli/commands/status/client.py +192 -0
synth_ai/cli/commands/status/config.py +92 -0
synth_ai/cli/commands/status/errors.py +20 -0
synth_ai/cli/commands/status/formatters.py +164 -0
synth_ai/cli/commands/status/subcommands/__init__.py +9 -0
synth_ai/cli/commands/status/subcommands/files.py +79 -0
synth_ai/cli/commands/status/subcommands/jobs.py +334 -0
synth_ai/cli/commands/status/subcommands/models.py +79 -0
synth_ai/cli/commands/status/subcommands/pricing.py +22 -0
synth_ai/cli/commands/status/subcommands/runs.py +81 -0
synth_ai/cli/commands/status/subcommands/session.py +183 -0
synth_ai/cli/commands/status/subcommands/summary.py +47 -0
synth_ai/cli/commands/status/subcommands/usage.py +203 -0
synth_ai/cli/commands/status/utils.py +114 -0
synth_ai/cli/commands/train/__init__.py +53 -0
synth_ai/cli/commands/train/core.py +21 -0
synth_ai/cli/commands/train/errors.py +117 -0
synth_ai/cli/commands/train/judge_schemas.py +200 -0
synth_ai/cli/commands/train/judge_validation.py +305 -0
synth_ai/cli/commands/train/validation.py +386 -0
synth_ai/cli/demo.py +32 -140
synth_ai/cli/deploy.py +233 -0
synth_ai/cli/eval/__init__.py +36 -0
synth_ai/cli/eval/core.py +5 -0
synth_ai/cli/eval/errors.py +31 -0
synth_ai/cli/eval/validation.py +5 -0
synth_ai/cli/filter/__init__.py +28 -0
synth_ai/cli/filter/core.py +5 -0
synth_ai/cli/filter/errors.py +23 -0
synth_ai/cli/filter/validation.py +5 -0
synth_ai/cli/legacy_root_backup.py +28 -22
synth_ai/cli/lib/__init__.py +10 -0
synth_ai/cli/lib/task_app_discovery.py +7 -0
synth_ai/cli/lib/task_app_env.py +518 -0
synth_ai/cli/mcp.py +34 -0
synth_ai/cli/modal_serve/__init__.py +12 -0
synth_ai/cli/modal_serve/core.py +14 -0
synth_ai/cli/modal_serve/errors.py +8 -0
synth_ai/cli/modal_serve/validation.py +11 -0
synth_ai/cli/opencode.py +256 -0
synth_ai/cli/recent.py +13 -7
synth_ai/cli/rl_demo.py +156 -116
synth_ai/cli/root.py +131 -132
synth_ai/cli/serve/__init__.py +12 -0
synth_ai/cli/serve/core.py +14 -0
synth_ai/cli/serve/errors.py +8 -0
synth_ai/cli/serve/validation.py +11 -0
synth_ai/cli/setup.py +49 -0
synth_ai/cli/status.py +7 -125
synth_ai/cli/task_app_deploy.py +7 -0
synth_ai/cli/task_app_list.py +25 -0
synth_ai/cli/task_app_modal_serve.py +11 -0
synth_ai/cli/task_app_serve.py +11 -0
synth_ai/cli/task_apps.py +2284 -257
synth_ai/cli/traces.py +9 -5
synth_ai/cli/train/__init__.py +12 -0
synth_ai/cli/train/core.py +21 -0
synth_ai/cli/train/errors.py +8 -0
synth_ai/cli/train/validation.py +24 -0
synth_ai/cli/train.py +5 -0
synth_ai/cli/turso.py +73 -0
synth_ai/cli/watch.py +13 -18
synth_ai/demos/__init__.py +10 -0
synth_ai/demos/core/__init__.py +28 -1
synth_ai/demos/core/cli.py +579 -291
synth_ai/demos/crafter/__init__.py +1 -0
synth_ai/demos/crafter/crafter_fft_4b.toml +55 -0
synth_ai/demos/crafter/grpo_crafter_task_app.py +185 -0
synth_ai/demos/crafter/rl_from_base_qwen4b.toml +74 -0
synth_ai/demos/demo_registry.py +176 -0
synth_ai/demos/demo_task_apps/__init__.py +3 -3
synth_ai/demos/demo_task_apps/core.py +64 -28
synth_ai/demos/demo_task_apps/crafter/__init__.py +1 -0
synth_ai/demos/demo_task_apps/crafter/configs/crafter_fft_4b.toml +53 -0
synth_ai/demos/demo_task_apps/crafter/configs/rl_from_base_qwen4b.toml +73 -0
synth_ai/demos/demo_task_apps/crafter/grpo_crafter_task_app.py +184 -0
synth_ai/demos/demo_task_apps/math/_common.py +1 -2
synth_ai/demos/demo_task_apps/math/app.py +2 -1
synth_ai/demos/demo_task_apps/math/deploy_modal.py +3 -6
synth_ai/demos/demo_task_apps/math/modal_task_app.py +185 -83
synth_ai/demos/demo_task_apps/math/task_app_entry.py +0 -2
synth_ai/demos/math/__init__.py +1 -0
synth_ai/demos/math/_common.py +16 -0
synth_ai/demos/math/app.py +38 -0
synth_ai/demos/math/config.toml +76 -0
synth_ai/demos/math/deploy_modal.py +54 -0
synth_ai/demos/math/modal_task_app.py +703 -0
synth_ai/demos/math/task_app_entry.py +51 -0
synth_ai/environments/environment/core.py +7 -1
synth_ai/environments/examples/bandit/engine.py +12 -5
synth_ai/environments/examples/bandit/environment.py +0 -1
synth_ai/environments/examples/bandit/taskset.py +4 -4
synth_ai/environments/examples/crafter_classic/engine_deterministic_patch.py +7 -4
synth_ai/environments/examples/crafter_classic/engine_serialization_patch_v3.py +9 -5
synth_ai/environments/examples/crafter_classic/environment.py +93 -2
synth_ai/environments/examples/crafter_classic/world_config_patch_simple.py +4 -3
synth_ai/environments/examples/enron/engine.py +7 -2
synth_ai/environments/examples/enron/environment.py +68 -0
synth_ai/environments/examples/red/engine.py +60 -12
synth_ai/environments/examples/red/engine_helpers/memory_map.py +7 -0
synth_ai/environments/examples/red/engine_helpers/reward_components.py +151 -179
synth_ai/environments/examples/red/engine_helpers/reward_library/pallet_town_progression.py +477 -0
synth_ai/environments/examples/red/engine_helpers/state_extraction.py +32 -0
synth_ai/environments/examples/red/environment.py +86 -0
synth_ai/environments/examples/red/trace_hooks_v3.py +168 -0
synth_ai/environments/examples/sokoban/taskset.py +116 -0
synth_ai/environments/examples/verilog/engine.py +104 -12
synth_ai/environments/examples/wordle/environment.py +0 -1
synth_ai/environments/reproducibility/tree.py +5 -6
synth_ai/environments/service/app.py +11 -12
synth_ai/environments/service/core_routes.py +10 -9
synth_ai/environments/stateful/engine.py +1 -1
synth_ai/environments/tasks/core.py +1 -0
synth_ai/environments/tasks/filters.py +5 -6
synth_ai/environments/tasks/utils.py +4 -5
synth_ai/evals/__init__.py +15 -0
synth_ai/evals/base.py +14 -5
synth_ai/evals/client.py +82 -0
synth_ai/evals/types.py +42 -0
synth_ai/http.py +8 -22
synth_ai/http_client.py +45 -12
synth_ai/inference/__init__.py +0 -2
synth_ai/inference/client.py +21 -7
synth_ai/jobs/client.py +129 -80
synth_ai/judge_schemas.py +127 -0
synth_ai/learning/__init__.py +51 -6
synth_ai/learning/algorithms.py +14 -0
synth_ai/learning/client.py +122 -30
synth_ai/learning/config.py +2 -40
synth_ai/learning/constants.py +0 -2
synth_ai/learning/ft_client.py +4 -56
synth_ai/learning/health.py +14 -8
synth_ai/learning/jobs.py +43 -47
synth_ai/learning/prompt_learning_client.py +276 -0
synth_ai/learning/prompt_learning_types.py +185 -0
synth_ai/{rl → learning/rl}/__init__.py +14 -5
synth_ai/learning/rl/client.py +269 -0
synth_ai/learning/rl/config.py +31 -0
synth_ai/{rl → learning/rl}/contracts.py +5 -10
synth_ai/{rl → learning/rl}/env_keys.py +45 -16
synth_ai/learning/rl/secrets.py +13 -0
synth_ai/learning/rl_client.py +2 -253
synth_ai/learning/sft/__init__.py +29 -0
synth_ai/learning/sft/client.py +68 -0
synth_ai/learning/sft/config.py +270 -0
synth_ai/learning/sft/data.py +698 -0
synth_ai/learning/sse.py +25 -26
synth_ai/learning/validators.py +29 -25
synth_ai/mcp/__init__.py +5 -0
synth_ai/mcp/__main__.py +8 -0
synth_ai/mcp/main.py +254 -0
synth_ai/mcp/setup.py +100 -0
synth_ai/modal.py +257 -0
synth_ai/pricing/__init__.py +3 -0
synth_ai/pricing/model_pricing.py +64 -0
synth_ai/session/__init__.py +75 -0
synth_ai/session/client.py +383 -0
synth_ai/session/constants.py +63 -0
synth_ai/session/exceptions.py +105 -0
synth_ai/session/manager.py +139 -0
synth_ai/session/models.py +89 -0
synth_ai/session/query.py +110 -0
synth_ai/spec/__init__.py +46 -0
synth_ai/spec/dataclasses.py +149 -0
synth_ai/spec/loader.py +144 -0
synth_ai/spec/serializer.py +199 -0
synth_ai/spec/validation.py +250 -0
synth_ai/streaming/__init__.py +29 -0
synth_ai/streaming/config.py +94 -0
synth_ai/streaming/handlers.py +589 -0
synth_ai/streaming/streamer.py +320 -0
synth_ai/streaming/types.py +95 -0
synth_ai/task/__init__.py +50 -30
synth_ai/task/apps/__init__.py +63 -19
synth_ai/task/auth.py +35 -23
synth_ai/task/client.py +15 -13
synth_ai/task/config.py +261 -0
synth_ai/task/contracts.py +165 -64
synth_ai/task/datasets.py +9 -6
synth_ai/task/errors.py +11 -10
synth_ai/task/health.py +17 -11
synth_ai/task/inference_api.py +101 -0
synth_ai/task/json.py +58 -24
synth_ai/task/proxy.py +59 -66
synth_ai/task/rubrics/__init__.py +55 -0
synth_ai/task/rubrics/loaders.py +156 -0
synth_ai/task/rubrics/models.py +57 -0
synth_ai/task/rubrics/scoring.py +116 -0
synth_ai/task/rubrics/strict.py +149 -0
synth_ai/task/rubrics.py +22 -15
synth_ai/task/server.py +65 -31
synth_ai/task/trace_correlation_helpers.py +328 -0
synth_ai/task/tracing_utils.py +44 -28
synth_ai/task/validators.py +449 -6
synth_ai/task/vendors.py +5 -7
synth_ai/tracing_v3/__init__.py +4 -0
synth_ai/tracing_v3/abstractions.py +21 -4
synth_ai/tracing_v3/config.py +167 -22
synth_ai/tracing_v3/constants.py +21 -0
synth_ai/tracing_v3/db_config.py +42 -29
synth_ai/tracing_v3/decorators.py +80 -45
synth_ai/tracing_v3/examples/basic_usage.py +15 -9
synth_ai/tracing_v3/hooks.py +6 -4
synth_ai/tracing_v3/llm_call_record_helpers.py +161 -61
synth_ai/tracing_v3/migration_helper.py +1 -2
synth_ai/tracing_v3/replica_sync.py +12 -7
synth_ai/tracing_v3/serialization.py +130 -0
synth_ai/tracing_v3/session_tracer.py +73 -16
synth_ai/tracing_v3/storage/base.py +89 -1
synth_ai/tracing_v3/storage/config.py +63 -16
synth_ai/tracing_v3/storage/factory.py +11 -9
synth_ai/tracing_v3/storage/utils.py +15 -11
synth_ai/tracing_v3/trace_utils.py +317 -0
synth_ai/tracing_v3/turso/__init__.py +8 -21
synth_ai/tracing_v3/turso/daemon.py +123 -15
synth_ai/tracing_v3/turso/models.py +5 -2
synth_ai/tracing_v3/turso/native_manager.py +1293 -0
synth_ai/tracing_v3/utils.py +5 -4
synth_ai/tunnel.py +143 -0
synth_ai/tunnel_deploy.py +278 -0
synth_ai/types.py +8 -0
synth_ai/urls.py +11 -0
synth_ai/utils/__init__.py +166 -0
synth_ai/utils/agents.py +74 -0
synth_ai/utils/apps.py +152 -0
synth_ai/utils/base_url.py +94 -0
synth_ai/utils/bin.py +39 -0
synth_ai/utils/claude.py +36 -0
synth_ai/utils/cli.py +284 -0
synth_ai/utils/config.py +81 -0
synth_ai/utils/env.py +346 -0
synth_ai/utils/errors.py +85 -0
synth_ai/utils/http.py +172 -0
synth_ai/utils/json.py +72 -0
synth_ai/utils/log_filter.py +99 -0
synth_ai/utils/logging.py +198 -0
synth_ai/utils/modal.py +299 -0
synth_ai/utils/paths.py +95 -0
synth_ai/utils/process.py +233 -0
synth_ai/utils/prompts.py +39 -0
synth_ai/utils/sqld.py +122 -0
synth_ai/utils/ssl.py +25 -0
synth_ai/utils/task_app_discovery.py +882 -0
synth_ai/utils/task_app_env.py +186 -0
synth_ai/utils/task_app_state.py +318 -0
synth_ai/utils/tunnel/__init__.py +12 -0
synth_ai/utils/tunnel/config.py +55 -0
synth_ai/utils/user_config.py +137 -0
synth_ai/uvicorn.py +77 -0
synth_ai-0.2.23.dev3.dist-info/METADATA +357 -0
synth_ai-0.2.23.dev3.dist-info/RECORD +983 -0
{synth_ai-0.2.9.dev0.dist-info → synth_ai-0.2.23.dev3.dist-info}/entry_points.txt +0 -1
{synth_ai-0.2.9.dev0.dist-info → synth_ai-0.2.23.dev3.dist-info}/top_level.txt +1 -0
synth_ai/cli/man.py +0 -106
synth_ai/core/experiment.py +0 -15
synth_ai/core/system.py +0 -15
synth_ai/demo_registry.py +0 -258
synth_ai/environments/examples/sokoban/units/astar_common.py +0 -95
synth_ai/experimental/synth_oss.py +0 -446
synth_ai/handshake.py +0 -107
synth_ai/install_sqld.sh +0 -40
synth_ai/learning/offline/dpo.py +0 -0
synth_ai/learning/offline/providers.py +0 -7
synth_ai/learning/offline/sft.py +0 -0
synth_ai/learning/offline/shared.py +0 -0
synth_ai/learning/online/grpo.py +0 -0
synth_ai/learning/online/irft.py +0 -0
synth_ai/learning/prompts/banking77_injection_eval.py +0 -168
synth_ai/learning/prompts/gepa.py +0 -0
synth_ai/learning/prompts/hello_world_in_context_injection_ex.py +0 -213
synth_ai/learning/prompts/mipro.py +0 -289
synth_ai/learning/prompts/random_search.py +0 -246
synth_ai/learning/prompts/run_mipro_banking77.py +0 -172
synth_ai/learning/prompts/run_random_search_banking77.py +0 -324
synth_ai/lm/__init__.py +0 -51
synth_ai/lm/caching/constants.py +0 -6
synth_ai/lm/caching/dbs.py +0 -0
synth_ai/lm/caching/ephemeral.py +0 -102
synth_ai/lm/caching/handler.py +0 -137
synth_ai/lm/caching/initialize.py +0 -11
synth_ai/lm/caching/persistent.py +0 -114
synth_ai/lm/config.py +0 -110
synth_ai/lm/constants.py +0 -32
synth_ai/lm/core/__init__.py +0 -8
synth_ai/lm/core/all.py +0 -73
synth_ai/lm/core/exceptions.py +0 -7
synth_ai/lm/core/main.py +0 -319
synth_ai/lm/core/main_v3.py +0 -594
synth_ai/lm/core/synth_models.py +0 -48
synth_ai/lm/core/vendor_clients.py +0 -188
synth_ai/lm/cost/monitor.py +0 -1
synth_ai/lm/cost/statefulness.py +0 -1
synth_ai/lm/injection.py +0 -80
synth_ai/lm/overrides.py +0 -206
synth_ai/lm/provider_support/__init__.py +0 -8
synth_ai/lm/provider_support/anthropic.py +0 -972
synth_ai/lm/provider_support/openai.py +0 -1139
synth_ai/lm/provider_support/suppress_logging.py +0 -31
synth_ai/lm/structured_outputs/handler.py +0 -440
synth_ai/lm/structured_outputs/inject.py +0 -297
synth_ai/lm/structured_outputs/rehabilitate.py +0 -185
synth_ai/lm/tools/__init__.py +0 -3
synth_ai/lm/tools/base.py +0 -172
synth_ai/lm/unified_interface.py +0 -202
synth_ai/lm/vendors/base.py +0 -81
synth_ai/lm/vendors/core/anthropic_api.py +0 -387
synth_ai/lm/vendors/core/gemini_api.py +0 -292
synth_ai/lm/vendors/core/mistral_api.py +0 -322
synth_ai/lm/vendors/core/openai_api.py +0 -225
synth_ai/lm/vendors/core/synth_dev_api.py +0 -0
synth_ai/lm/vendors/local/ollama.py +0 -0
synth_ai/lm/vendors/openai_standard.py +0 -780
synth_ai/lm/vendors/openai_standard_responses.py +0 -256
synth_ai/lm/vendors/retries.py +0 -22
synth_ai/lm/vendors/supported/custom_endpoint.py +0 -417
synth_ai/lm/vendors/supported/deepseek.py +0 -69
synth_ai/lm/vendors/supported/grok.py +0 -75
synth_ai/lm/vendors/supported/groq.py +0 -16
synth_ai/lm/vendors/supported/ollama.py +0 -15
synth_ai/lm/vendors/supported/openrouter.py +0 -74
synth_ai/lm/vendors/supported/together.py +0 -11
synth_ai/lm/vendors/synth_client.py +0 -808
synth_ai/lm/warmup.py +0 -186
synth_ai/rl/secrets.py +0 -19
synth_ai/scripts/verify_rewards.py +0 -100
synth_ai/task/apps/grpo_crafter.py +0 -438
synth_ai/tracing/__init__.py +0 -30
synth_ai/tracing_v1/__init__.py +0 -33
synth_ai/tracing_v3/turso/manager.py +0 -774
synth_ai/v0/tracing/abstractions.py +0 -224
synth_ai/v0/tracing/base_client.py +0 -91
synth_ai/v0/tracing/client_manager.py +0 -131
synth_ai/v0/tracing/config.py +0 -142
synth_ai/v0/tracing/context.py +0 -146
synth_ai/v0/tracing/decorators.py +0 -682
synth_ai/v0/tracing/events/__init__.py +0 -0
synth_ai/v0/tracing/events/manage.py +0 -147
synth_ai/v0/tracing/events/scope.py +0 -86
synth_ai/v0/tracing/events/store.py +0 -228
synth_ai/v0/tracing/immediate_client.py +0 -151
synth_ai/v0/tracing/local.py +0 -18
synth_ai/v0/tracing/log_client_base.py +0 -73
synth_ai/v0/tracing/retry_queue.py +0 -186
synth_ai/v0/tracing/trackers.py +0 -515
synth_ai/v0/tracing/upload.py +0 -512
synth_ai/v0/tracing/utils.py +0 -9
synth_ai/v0/tracing_v1/__init__.py +0 -16
synth_ai/v0/tracing_v1/abstractions.py +0 -224
synth_ai/v0/tracing_v1/base_client.py +0 -91
synth_ai/v0/tracing_v1/client_manager.py +0 -131
synth_ai/v0/tracing_v1/config.py +0 -142
synth_ai/v0/tracing_v1/context.py +0 -146
synth_ai/v0/tracing_v1/decorators.py +0 -703
synth_ai/v0/tracing_v1/events/__init__.py +0 -0
synth_ai/v0/tracing_v1/events/manage.py +0 -147
synth_ai/v0/tracing_v1/events/scope.py +0 -86
synth_ai/v0/tracing_v1/events/store.py +0 -228
synth_ai/v0/tracing_v1/immediate_client.py +0 -151
synth_ai/v0/tracing_v1/local.py +0 -18
synth_ai/v0/tracing_v1/log_client_base.py +0 -73
synth_ai/v0/tracing_v1/retry_queue.py +0 -186
synth_ai/v0/tracing_v1/trackers.py +0 -515
synth_ai/v0/tracing_v1/upload.py +0 -527
synth_ai/v0/tracing_v1/utils.py +0 -9
synth_ai/zyk/__init__.py +0 -30
synth_ai-0.2.9.dev0.dist-info/METADATA +0 -131
synth_ai-0.2.9.dev0.dist-info/RECORD +0 -444
{synth_ai/lm/caching → examples/task_apps}/__init__.py +0 -0
{synth_ai/lm/cost → examples/task_apps/crafter}/__init__.py +0 -0
{synth_ai/lm/structured_outputs → examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/server}/__init__.py +0 -0
{synth_ai/lm/vendors → examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/tests}/__init__.py +0 -0
{synth_ai/lm/vendors/core → examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils}/__init__.py +0 -0
{synth_ai/lm/vendors/local → examples/task_apps/math}/__init__.py +0 -0
{synth_ai/lm/vendors/supported → examples/workflows}/__init__.py +0 -0
{synth_ai/v0/tracing → examples/workflows/math_rl}/__init__.py +0 -0
/synth_ai/{compound/cais.py → cli/__main__.py} +0 -0
/synth_ai/{learning/filtering.py → py.typed} +0 -0
{synth_ai-0.2.9.dev0.dist-info → synth_ai-0.2.23.dev3.dist-info}/WHEEL +0 -0
{synth_ai-0.2.9.dev0.dist-info → synth_ai-0.2.23.dev3.dist-info}/licenses/LICENSE +0 -0

examples/task_apps/dev/pokemon_emerald/external/pokeagent-speedrun/utils/ocr_dialogue.py ADDED Viewed

@@ -0,0 +1,1020 @@
+"""
+OCR-based dialogue detection for Pokemon Emerald.
+Provides fallback text detection when memory reading fails or returns stale data.
+"""
+import cv2
+import numpy as np
+from PIL import Image
+from typing import Optional, List, Tuple
+import re
+import logging
+try:
+    import pytesseract
+    OCR_AVAILABLE = True
+except ImportError:
+    OCR_AVAILABLE = False
+    logging.warning("pytesseract not available - OCR dialogue detection disabled")
+logger = logging.getLogger(__name__)
+class OCRDialogueDetector:
+    """OCR-based dialogue detection for Pokemon Emerald"""
+    # Pokemon Emerald dialogue box coordinates (corrected for actual dialogue position)
+    DIALOGUE_BOX_COORDS = {
+        'x': 0,       # Full width - dialogue spans entire bottom
+        'y': 104,     # Dialogue starts around row 104 (from debug analysis)
+        'width': 240, # Full screen width
+        'height': 56  # Bottom portion height (160-104=56)
+    }
+    # Tighter OCR coordinates - just the text area inside the border (adjusted lower)
+    OCR_TEXT_COORDS = {
+        'x': 8,       # Skip left border
+        'y': 116,     # Moved down 4px for better text alignment (104 + 12)
+        'width': 224, # Skip both side borders (240 - 16)
+        'height': 36  # Reduced height to maintain bottom margin (56 - 20)
+    }
+    # Pokemon Emerald dialogue text colors (based on actual RGB values)
+    DIALOGUE_TEXT_COLORS = [
+        # Exact text color from user
+        (99, 99, 99),      # Exact text color
+        # Close variations for anti-aliasing and slight rendering differences
+        (95, 95, 95),      # Slightly darker
+        (103, 103, 103),   # Slightly lighter
+        (91, 91, 91),      # Darker variant
+        (107, 107, 107),   # Lighter variant
+        (99, 99, 95),      # Slight color shift
+        (99, 95, 99),      # Slight color shift
+        (95, 99, 99),      # Slight color shift
+        # Additional gray tones that might appear due to rendering
+        (87, 87, 87),      # Darker gray
+        (111, 111, 111),   # Lighter gray
+        (79, 79, 79),      # Much darker
+        (119, 119, 119),   # Much lighter
+        # Shadow colors (darker, often with slight offset)
+        (64, 64, 64),      # Dark shadow
+        (72, 72, 72),      # Medium shadow
+        (56, 56, 56),      # Darker shadow
+        (48, 48, 48),      # Very dark shadow
+        # Possible highlighting/special text colors
+        (99, 99, 128),     # Blue-tinted for names
+        (128, 99, 99),     # Red-tinted for special text
+        (99, 128, 99),     # Green-tinted for special text
+    ]
+    # Color tolerance for matching (RGB distance) - increased to capture more text pixels
+    COLOR_TOLERANCE = 40
+    # Pokemon Emerald dialogue box background colors (based on actual RGB values)
+    DIALOGUE_BOX_BACKGROUND_COLORS = [
+        # Exact green line/border color from user
+        (85, 204, 128),    # Exact green border color
+        # Variations of the green border for anti-aliasing and shadows
+        (80, 199, 123),    # Slightly darker green
+        (90, 209, 133),    # Slightly lighter green
+        (85, 204, 128),    # Exact match (duplicate for emphasis)
+        (75, 194, 118),    # Darker green variant
+        (95, 214, 138),    # Lighter green variant
+        # Exact white text background from user
+        (255, 255, 255),   # Exact white text background
+        # Close variations for anti-aliasing and compression artifacts
+        (254, 254, 254),   # Very close to white
+        (253, 253, 253),   # Slightly off white
+        (252, 252, 252),   # Light gray-white
+        (248, 248, 248),   # Near white
+        (240, 240, 240),   # Light off-white
+        (255, 255, 254),   # Slight yellow tint
+        (254, 255, 255),   # Slight cyan tint
+    ]
+    # How much of the dialogue box should be background color to consider it "active"
+    DIALOGUE_BOX_BACKGROUND_THRESHOLD = 0.4  # 40% of dialogue area should be box color (mostly off-white background)
+    # Battle text area (different position)
+    BATTLE_TEXT_COORDS = {
+        'x': 8,
+        'y': 120,
+        'width': 224,
+        'height': 40
+    }
+    def __init__(self):
+        self.last_detected_text = ""
+        self.text_stability_threshold = 2  # Frames text must be stable
+        self.stable_text_count = 0
+        self.debug_color_detection = False  # Set to True for color debugging
+        self.use_full_frame_scan = False  # Set to True to enable full-frame scanning (may pick up noise)
+        self.skip_dialogue_box_detection = False  # Set to True to temporarily bypass dialogue box detection
+    def detect_dialogue_from_screenshot(self, screenshot: Image.Image) -> Optional[str]:
+        """
+        Detect dialogue text from Pokemon Emerald dialogue regions only.
+        First verifies dialogue box is visible to prevent false positives.
+        Args:
+            screenshot: PIL Image of the game screen
+        Returns:
+            Detected dialogue text or None if no text found
+        """
+        if not OCR_AVAILABLE:
+            return None
+        try:
+            screenshot_np = np.array(screenshot)
+            # STEP 1: Check if dialogue box is actually visible (unless bypassed)
+            if not self.skip_dialogue_box_detection and not self.is_dialogue_box_visible(screenshot):
+                logger.debug("No dialogue box detected - skipping OCR")
+                return None
+            # STEP 2: Primary dialogue box area (most common) - use tighter text coordinates
+            dialogue_text = self._extract_text_from_region(
+                screenshot_np,
+                self.OCR_TEXT_COORDS
+            )
+            if dialogue_text:
+                validated = self._validate_and_clean_text(dialogue_text)
+                if validated:
+                    return validated
+            # Method 2: Battle text area (different position)
+            battle_text = self._extract_text_from_region(
+                screenshot_np,
+                self.BATTLE_TEXT_COORDS
+            )
+            if battle_text:
+                validated = self._validate_and_clean_text(battle_text)
+                if validated:
+                    return validated
+            # Method 3: Full frame scan (only if explicitly enabled - can pick up noise)
+            if self.use_full_frame_scan:
+                full_frame_text = self._extract_text_from_full_frame(screenshot)
+                if full_frame_text:
+                    validated = self._validate_and_clean_text(full_frame_text)
+                    if validated:
+                        return validated
+            return None
+        except Exception as e:
+            logger.debug(f"OCR dialogue detection failed: {e}")
+            return None
+    def _extract_text_from_full_frame(self, screenshot: Image.Image) -> Optional[str]:
+        """
+        Extract text from the entire screenshot using OCR
+        This is more comprehensive than region-specific detection
+        """
+        try:
+            # Convert PIL to numpy array
+            screenshot_np = np.array(screenshot)
+            # Preprocess the entire frame for better OCR
+            processed_frame = self._preprocess_full_frame_for_ocr(screenshot_np)
+            # OCR configuration optimized for Pokemon text detection
+            # Use different settings for full frame vs regions
+            full_frame_config = r'--oem 3 --psm 6'  # Assume uniform block of text
+            # Extract text from entire frame
+            full_text = pytesseract.image_to_string(processed_frame, config=full_frame_config)
+            # Clean and validate the text
+            cleaned_text = self._clean_full_frame_text(full_text)
+            if cleaned_text:
+                return cleaned_text
+            # If that fails, try with different PSM mode
+            alt_config = r'--oem 3 --psm 11'  # Sparse text, find as much as possible
+            alt_text = pytesseract.image_to_string(processed_frame, config=alt_config)
+            alt_cleaned = self._clean_full_frame_text(alt_text)
+            return alt_cleaned if alt_cleaned else None
+        except Exception as e:
+            logger.debug(f"Full frame OCR failed: {e}")
+            return None
+    def _preprocess_full_frame_for_ocr(self, image_np: np.ndarray) -> np.ndarray:
+        """Preprocess entire frame using Pokemon-specific dialogue color matching"""
+        # Ensure we have color information
+        if len(image_np.shape) != 3:
+            # Convert grayscale to color by duplicating channels
+            image_np = cv2.cvtColor(image_np, cv2.COLOR_GRAY2RGB)
+        # Scale up for better color detection precision
+        scaled = cv2.resize(image_np, None, fx=3, fy=3, interpolation=cv2.INTER_CUBIC)
+        # Create mask for dialogue text colors across entire frame
+        text_mask = self._create_dialogue_color_mask(scaled)
+        # Apply color mask - black text on white background (better for OCR)
+        binary = np.where(text_mask, 0, 255).astype(np.uint8)
+        # Enhanced morphological operations for full frame
+        # Close gaps and thicken text
+        kernel_close = np.ones((2, 2), np.uint8)
+        cleaned = cv2.morphologyEx(binary, cv2.MORPH_CLOSE, kernel_close)
+        # Dilate to make text more readable
+        kernel_dilate = np.ones((1, 1), np.uint8)
+        cleaned = cv2.dilate(cleaned, kernel_dilate, iterations=1)
+        return cleaned
+    def _clean_full_frame_text(self, raw_text: str) -> Optional[str]:
+        """Clean and validate text extracted from full frame"""
+        if not raw_text:
+            return None
+        # Remove excessive whitespace and special characters
+        lines = []
+        for line in raw_text.split('\n'):
+            # Clean each line
+            cleaned_line = re.sub(r'\s+', ' ', line.strip())
+            # Filter out lines that are likely noise
+            if len(cleaned_line) >= 2:  # Minimum meaningful length
+                # Check if line has reasonable character content
+                alpha_ratio = sum(c.isalpha() for c in cleaned_line) / len(cleaned_line)
+                if alpha_ratio >= 0.3:  # At least 30% alphabetic characters
+                    lines.append(cleaned_line)
+        if not lines:
+            return None
+        # Join lines and do final cleanup
+        full_text = ' '.join(lines)
+        # Remove common OCR artifacts for Pokemon games
+        # These are characters commonly misread by OCR
+        ocr_artifacts = [
+            r'[|\\/_]',  # Common line artifacts
+            r'^\W+',     # Leading non-word characters
+            r'\W+$',     # Trailing non-word characters
+        ]
+        for artifact in ocr_artifacts:
+            full_text = re.sub(artifact, ' ', full_text)
+        # Final cleanup
+        full_text = re.sub(r'\s+', ' ', full_text).strip()
+        # Validate final result
+        if len(full_text) < 3:
+            return None
+        # Check for reasonable content (not just numbers/symbols)
+        alpha_count = sum(c.isalpha() for c in full_text)
+        if alpha_count < 3:  # Need at least 3 letters
+            return None
+        return full_text
+    def detect_all_text_regions(self, screenshot: Image.Image) -> List[dict]:
+        """
+        Detect all text regions in the screenshot with their locations
+        Useful for debugging and comprehensive text detection
+        """
+        if not OCR_AVAILABLE:
+            return []
+        try:
+            # Convert to numpy array
+            screenshot_np = np.array(screenshot)
+            processed = self._preprocess_full_frame_for_ocr(screenshot_np)
+            # Use pytesseract to get text with bounding boxes
+            data = pytesseract.image_to_data(processed, output_type=pytesseract.Output.DICT)
+            text_regions = []
+            n_boxes = len(data['level'])
+            for i in range(n_boxes):
+                # Get confidence and text
+                confidence = int(data['conf'][i])
+                text = data['text'][i].strip()
+                # Only include text with reasonable confidence and content
+                if confidence > 30 and len(text) > 1:
+                    # Get bounding box (scale back from 2x preprocessing)
+                    x = data['left'][i] // 2  # Scale back from 2x
+                    y = data['top'][i] // 2
+                    w = data['width'][i] // 2
+                    h = data['height'][i] // 2
+                    # Validate text content
+                    alpha_ratio = sum(c.isalpha() for c in text) / len(text)
+                    if alpha_ratio >= 0.3:  # At least 30% letters
+                        text_regions.append({
+                            'text': text,
+                            'confidence': confidence,
+                            'bbox': (x, y, w, h),
+                            'area': w * h
+                        })
+            # Sort by confidence and area (larger, more confident regions first)
+            text_regions.sort(key=lambda r: (r['confidence'], r['area']), reverse=True)
+            return text_regions
+        except Exception as e:
+            logger.debug(f"Text region detection failed: {e}")
+            return []
+    def _extract_text_from_region(self, image_np: np.ndarray, coords: dict) -> str:
+        """Extract text from a specific region of the image"""
+        # Extract region of interest
+        y1 = coords['y']
+        y2 = y1 + coords['height']
+        x1 = coords['x']
+        x2 = x1 + coords['width']
+        roi = image_np[y1:y2, x1:x2]
+        # Preprocessing for better OCR accuracy
+        roi = self._preprocess_for_ocr(roi)
+        # OCR configuration optimized for Pokemon Emerald text
+        custom_config = r'--oem 3 --psm 6'
+        # Extract text
+        text = pytesseract.image_to_string(roi, config=custom_config)
+        return text.strip()
+    def _preprocess_for_ocr(self, roi: np.ndarray) -> np.ndarray:
+        """
+        Preprocess image region using Pokemon-specific dialogue color matching.
+        The region is upscaled 4x, pixels matching the dialogue text colors are
+        painted black on a white background, and the binary image is passed
+        through close, dilate and open morphological steps.
+        Args:
+            roi: Cropped image region; non-3-dimensional input is expanded to
+                three channels first
+        Returns:
+            uint8 image containing only 0 (text) and 255 (background) after
+            binarization, at 4x the input resolution
+        """
+        # Keep original color information for color matching
+        if len(roi.shape) != 3:
+            # Convert grayscale back to color for processing (duplicate channels)
+            roi = cv2.cvtColor(roi, cv2.COLOR_GRAY2RGB)
+        # Scale up first for better color detection precision
+        roi = cv2.resize(roi, None, fx=4, fy=4, interpolation=cv2.INTER_CUBIC)
+        # Create mask for dialogue text colors
+        text_mask = self._create_dialogue_color_mask(roi)
+        # Apply color mask to create clean binary image
+        # Black text on white background (better for OCR)
+        binary_roi = np.where(text_mask, 0, 255).astype(np.uint8)
+        # Ensure we have a proper binary image (pure black and white only)
+        # (the array above already holds only 0 and 255, so values are unchanged here)
+        binary_roi = np.where(binary_roi > 127, 255, 0).astype(np.uint8)
+        # Enhanced morphological operations to thicken and connect text
+        # NOTE(review): OpenCV morphology treats bright pixels as foreground; with
+        # black text on white, close/dilate grow the white background and so
+        # presumably thin the text rather than thicken it - confirm intent
+        # Close gaps in letters
+        kernel_close = np.ones((2, 2), np.uint8)
+        binary_roi = cv2.morphologyEx(binary_roi, cv2.MORPH_CLOSE, kernel_close)
+        # Dilate to make text thicker and more readable (balanced approach)
+        kernel_dilate = np.ones((2, 2), np.uint8)
+        binary_roi = cv2.dilate(binary_roi, kernel_dilate, iterations=2)
+        # Remove small noise while preserving text
+        # NOTE(review): a 1x1 kernel looks like it leaves the image unchanged - confirm
+        kernel_open = np.ones((1, 1), np.uint8)
+        binary_roi = cv2.morphologyEx(binary_roi, cv2.MORPH_OPEN, kernel_open)
+        return binary_roi
+    def _create_dialogue_color_mask(self, image: np.ndarray) -> np.ndarray:
+        """Create binary mask for pixels matching Pokemon dialogue text colors"""
+        if len(image.shape) != 3:
+            return np.zeros(image.shape[:2], dtype=bool)
+        mask = np.zeros(image.shape[:2], dtype=bool)
+        matched_pixels_per_color = []
+        # Check each dialogue color
+        for i, target_color in enumerate(self.DIALOGUE_TEXT_COLORS):
+            # Calculate color distance for all pixels
+            color_diff = np.sqrt(np.sum((image - target_color) ** 2, axis=2))
+            # Add pixels within tolerance to mask
+            color_mask = (color_diff <= self.COLOR_TOLERANCE)
+            mask |= color_mask
+            # Debug information
+            if self.debug_color_detection:
+                matched_count = np.sum(color_mask)
+                matched_pixels_per_color.append(matched_count)
+        # Log color detection results for debugging
+        if self.debug_color_detection and any(matched_pixels_per_color):
+            total_matched = np.sum(mask)
+            logger.debug(f"Color matching: {total_matched} pixels matched dialogue colors")
+            for i, count in enumerate(matched_pixels_per_color):
+                if count > 0:
+                    color = self.DIALOGUE_TEXT_COLORS[i]
+                    logger.debug(f"  Color {color}: {count} pixels")
+        return mask
+    def is_dialogue_box_visible(self, screenshot: Image.Image) -> bool:
+        """
+        Check if a dialogue box is actually visible by looking for green horizontal border lines.
+        Searches for the characteristic green lines above and below the dialogue text.
+        Args:
+            screenshot: PIL Image of the game screen
+        Returns:
+            True if dialogue box is detected, False otherwise
+        """
+        if not screenshot:
+            return False
+        try:
+            # Convert to numpy array
+            image_np = np.array(screenshot)
+            if len(image_np.shape) != 3:
+                return False
+            # Extract extended dialogue region to catch border lines
+            coords = self.DIALOGUE_BOX_COORDS
+            # Extend the search area to catch top and bottom borders
+            extended_region = image_np[
+                max(0, coords['y'] - 5):min(image_np.shape[0], coords['y'] + coords['height'] + 5),
+                coords['x']:coords['x'] + coords['width']
+            ]
+            if extended_region.size == 0:
+                return False
+            # Look for horizontal border lines using actual dialogue border colors
+            border_colors = [
+                (66, 181, 132),   # Main teal border color from debug analysis
+                (24, 165, 107),   # Secondary border color
+                (57, 140, 49),    # Darker border variant
+                (0, 255, 156),    # Bright border accent
+                (115, 198, 165)   # Light border variant
+            ]
+            border_tolerance = 20  # Tolerance for color matching
+            # Check each row for horizontal border lines
+            border_line_rows = []
+            height, width = extended_region.shape[:2]
+            for row_idx in range(height):
+                row_pixels = extended_region[row_idx]
+                # Count border color pixels in this row
+                border_pixels_in_row = 0
+                for pixel in row_pixels:
+                    # Check if pixel matches any of the border colors
+                    for border_color in border_colors:
+                        color_diff = np.sqrt(np.sum((pixel - np.array(border_color)) ** 2))
+                        if color_diff <= border_tolerance:
+                            border_pixels_in_row += 1
+                            break  # Don't double-count pixels
+                # If significant portion of row has border colors, it's likely a border line
+                border_percentage = border_pixels_in_row / width
+                if border_percentage > 0.2:  # 20% of row width has border colors (lower threshold)
+                    border_line_rows.append(row_idx)
+            # VERY strict detection to avoid false positives from environment colors
+            # Require many border lines for robust detection
+            has_sufficient_border_lines = len(border_line_rows) >= 5  # Need at least 5 border lines
+            # MUST have top AND bottom border lines (no exceptions for false positive prevention)
+            has_top_and_bottom_lines = False
+            if len(border_line_rows) >= 3:
+                # Check if we have lines at different heights (top and bottom)
+                min_line = min(border_line_rows)
+                max_line = max(border_line_rows)
+                if max_line - min_line > 15:  # Lines must be at least 15 pixels apart (very strict)
+                    has_top_and_bottom_lines = True
+            # Additional check: look for proper dialogue box pattern (rectangular border)
+            has_rectangular_pattern = False
+            if len(border_line_rows) >= 5:
+                # Check if we have border lines spread across the dialogue region
+                height_quarter = height // 4
+                top_lines = [r for r in border_line_rows if r < height_quarter]
+                middle_lines = [r for r in border_line_rows if height_quarter <= r <= 3 * height_quarter]
+                bottom_lines = [r for r in border_line_rows if r > 3 * height_quarter]
+                # Must have lines in top AND bottom, and some in middle for a proper box
+                if len(top_lines) >= 2 and len(bottom_lines) >= 2 and len(middle_lines) >= 1:
+                    has_rectangular_pattern = True
+            # Extra check: ensure lines are actually horizontal (consistent across width)
+            has_proper_horizontal_lines = False
+            if len(border_line_rows) >= 3:
+                # Check that border lines extend across significant width (not just scattered pixels)
+                proper_lines = 0
+                for row_idx in border_line_rows[:10]:  # Check first 10 lines
+                    row_pixels = extended_region[row_idx]
+                    border_pixels_in_row = 0
+                    for pixel in row_pixels:
+                        for border_color in border_colors:
+                            color_diff = np.sqrt(np.sum((pixel - np.array(border_color)) ** 2))
+                            if color_diff <= border_tolerance:
+                                border_pixels_in_row += 1
+                                break
+                    # Line must span at least 50% of width to be considered a proper horizontal line
+                    if border_pixels_in_row / width > 0.5:
+                        proper_lines += 1
+                if proper_lines >= 3:  # Need at least 3 proper horizontal lines
+                    has_proper_horizontal_lines = True
+            # Log detection results
+            if self.debug_color_detection:
+                logger.debug(f"Border line detection: Found {len(border_line_rows)} border horizontal lines")
+                logger.debug(f"Line rows: {border_line_rows[:5]}")  # Show first 5
+                logger.debug(f"Has sufficient lines (≥5): {has_sufficient_border_lines}")
+                logger.debug(f"Has top+bottom lines (≥15px apart): {has_top_and_bottom_lines}")
+                logger.debug(f"Has rectangular pattern: {has_rectangular_pattern}")
+                logger.debug(f"Has proper horizontal lines (≥50% width): {has_proper_horizontal_lines}")
+            # Final check: look for actual dialogue box background (light/white area inside borders)
+            has_dialogue_background = False
+            if len(border_line_rows) >= 3:
+                # Check middle area for dialogue background colors (light colors)
+                middle_start = height // 4
+                middle_end = 3 * height // 4
+                middle_region = extended_region[middle_start:middle_end, width//4:3*width//4]
+                if middle_region.size > 0:
+                    # Look for light background colors typical of dialogue boxes
+                    light_pixels = 0
+                    total_pixels = middle_region.size // 3  # Divide by 3 for RGB
+                    for pixel in middle_region.reshape(-1, 3):
+                        # Light colors: high brightness (sum of RGB > 400) or white-ish
+                        brightness = np.sum(pixel)
+                        if brightness > 400 or (pixel[0] > 200 and pixel[1] > 200 and pixel[2] > 200):
+                            light_pixels += 1
+                    light_percentage = light_pixels / total_pixels
+                    if light_percentage > 0.3:  # At least 30% of middle area should be light (dialogue background)
+                        has_dialogue_background = True
+            # Log all criteria
+            if self.debug_color_detection:
+                logger.debug(f"Has dialogue background (light area): {has_dialogue_background}")
+            # Use simplified detection method to avoid false positives
+            # Check for white background in center area
+            center_h = extended_region.shape[0] // 2
+            center_w = extended_region.shape[1] // 2
+            margin = 20
+            center_area = extended_region[
+                max(0, center_h - margin):min(extended_region.shape[0], center_h + margin),
+                max(0, center_w - margin):min(extended_region.shape[1], center_w + margin)
+            ]
+            if center_area.size > 0:
+                # Count white/light pixels (dialogue background)
+                light_mask = (center_area[:,:,0] > 200) & (center_area[:,:,1] > 200) & (center_area[:,:,2] > 200)
+                light_percentage = np.sum(light_mask) / light_mask.size
+                # Count text-like colors (dark gray)
+                text_mask = ((center_area[:,:,0] > 80) & (center_area[:,:,0] < 130) &
+                            (center_area[:,:,1] > 80) & (center_area[:,:,1] < 130) &
+                            (center_area[:,:,2] > 80) & (center_area[:,:,2] < 130))
+                text_percentage = np.sum(text_mask) / text_mask.size
+                # Simple, robust criteria
+                is_visible = light_percentage > 0.3 and text_percentage > 0.02
+                if self.debug_color_detection:
+                    logger.debug(f"Simplified detection - Light bg: {light_percentage:.1%}, Text: {text_percentage:.1%}")
+            else:
+                is_visible = False
+            if self.debug_color_detection:
+                logger.debug(f"Dialogue box {'VISIBLE' if is_visible else 'NOT VISIBLE'} "
+                           f"(found {len(border_line_rows)} border lines)")
+            return is_visible
+        except Exception as e:
+            logger.debug(f"Dialogue box detection error: {e}")
+            return False
+    def enable_color_debug(self, enabled: bool = True):
+        """Enable/disable color detection debugging"""
+        self.debug_color_detection = enabled
+        if enabled:
+            logger.info("OCR color detection debugging enabled")
+        else:
+            logger.info("OCR color detection debugging disabled")
+    def analyze_dialogue_colors(self, screenshot: Image.Image) -> dict:
+        """
+        Analyze a screenshot to find the actual colors used in the dialogue box.
+        This helps fine-tune the DIALOGUE_TEXT_COLORS list.
+        """
+        if not screenshot:
+            return {}
+        # Convert to numpy array
+        image_np = np.array(screenshot)
+        if len(image_np.shape) != 3:
+            return {}
+        # Extract dialogue region
+        coords = self.DIALOGUE_BOX_COORDS
+        dialogue_region = image_np[
+            coords['y']:coords['y'] + coords['height'],
+            coords['x']:coords['x'] + coords['width']
+        ]
+        if dialogue_region.size == 0:
+            return {}
+        # Find unique colors and their frequencies
+        pixels = dialogue_region.reshape(-1, 3)
+        unique_colors, counts = np.unique(pixels, axis=0, return_counts=True)
+        # Sort by frequency (most common first)
+        sorted_indices = np.argsort(counts)[::-1]
+        # Analyze the most common colors
+        color_analysis = {
+            'total_pixels': len(pixels),
+            'unique_colors': len(unique_colors),
+            'top_colors': []
+        }
+        # Show top 20 most common colors
+        for i in range(min(20, len(unique_colors))):
+            idx = sorted_indices[i]
+            color = tuple(unique_colors[idx])
+            count = counts[idx]
+            percentage = (count / len(pixels)) * 100
+            color_analysis['top_colors'].append({
+                'rgb': color,
+                'count': int(count),
+                'percentage': round(percentage, 2)
+            })
+        return color_analysis
+    def print_color_analysis(self, screenshot: Image.Image):
+        """Print color analysis in a readable format"""
+        analysis = self.analyze_dialogue_colors(screenshot)
+        if not analysis:
+            print("❌ Could not analyze colors")
+            return
+        print(f"\n🎨 DIALOGUE COLOR ANALYSIS")
+        print(f"={'='*50}")
+        print(f"Total pixels: {analysis['total_pixels']:,}")
+        print(f"Unique colors: {analysis['unique_colors']:,}")
+        print(f"\nTop Colors (most frequent first):")
+        print(f"{'Rank':<4} {'RGB Color':<20} {'Count':<8} {'%':<6} {'Color Type':<15}")
+        print(f"{'-'*70}")
+        for i, color_info in enumerate(analysis['top_colors'][:15], 1):
+            rgb = color_info['rgb']
+            count = color_info['count']
+            pct = color_info['percentage']
+            # Classify the color
+            if rgb[0] > 240 and rgb[1] > 240 and rgb[2] > 240:
+                color_type = "Background"
+            elif rgb[0] < 120 and rgb[1] < 120 and rgb[2] < 120:
+                color_type = "Text/Shadow"
+            elif abs(rgb[0] - rgb[1]) < 10 and abs(rgb[1] - rgb[2]) < 10:
+                color_type = "Gray text"
+            else:
+                color_type = "Other"
+            print(f"{i:<4} {str(rgb):<20} {count:<8} {pct:<6.1f} {color_type:<15}")
+        print(f"\n💡 Suggested dialogue colors to add:")
+        suggested = []
+        for color_info in analysis['top_colors'][:10]:
+            rgb = color_info['rgb']
+            # Suggest colors that look like text (not pure white background)
+            if rgb[0] < 200 and color_info['percentage'] > 0.5:
+                suggested.append(rgb)
+        for color in suggested[:5]:  # Show top 5 suggestions
+            print(f"    {color},")
+        print(f"{'='*50}")
+    def update_dialogue_colors_from_analysis(self, screenshot: Image.Image, threshold_percentage: float = 1.0):
+        """
+        Update DIALOGUE_TEXT_COLORS based on analysis of actual screenshot.
+        Only adds colors that appear frequently enough (above threshold_percentage).
+        """
+        analysis = self.analyze_dialogue_colors(screenshot)
+        if not analysis:
+            logger.warning("Could not analyze colors to update dialogue colors")
+            return
+        # Find colors that appear frequently and look like text
+        new_colors = []
+        for color_info in analysis['top_colors']:
+            rgb = color_info['rgb']
+            pct = color_info['percentage']
+            # Only consider colors that:
+            # 1. Appear frequently enough
+            # 2. Are not pure white (background)
+            # 3. Are not already in our color list
+            if (pct >= threshold_percentage and
+                not (rgb[0] > 240 and rgb[1] > 240 and rgb[2] > 240) and
+                rgb not in self.DIALOGUE_TEXT_COLORS):
+                new_colors.append(rgb)
+        if new_colors:
+            logger.info(f"Adding {len(new_colors)} new dialogue colors from analysis")
+            for color in new_colors[:5]:  # Limit to top 5 new colors
+                logger.info(f"  Added color: {color}")
+            # Add new colors to the existing list
+            self.DIALOGUE_TEXT_COLORS.extend(new_colors[:5])
+        else:
+            logger.info("No new dialogue colors found to add")
+    def analyze_dialogue_box_background(self, screenshot: Image.Image):
+        """
+        Analyze dialogue box region to find actual background colors.
+        Useful for fine-tuning DIALOGUE_BOX_BACKGROUND_COLORS.
+        """
+        analysis = self.analyze_dialogue_colors(screenshot)
+        if not analysis:
+            print("❌ Could not analyze dialogue box background")
+            return
+        print(f"\n📦 DIALOGUE BOX BACKGROUND ANALYSIS")
+        print(f"{'='*50}")
+        print(f"Total pixels: {analysis['total_pixels']:,}")
+        print(f"Unique colors: {analysis['unique_colors']:,}")
+        print(f"\nTop Background Colors (most frequent first):")
+        print(f"{'Rank':<4} {'RGB Color':<20} {'Count':<8} {'%':<6} {'Type':<15}")
+        print(f"{'-'*70}")
+        for i, color_info in enumerate(analysis['top_colors'][:15], 1):
+            rgb = color_info['rgb']
+            count = color_info['count']
+            pct = color_info['percentage']
+            # Classify as likely background vs text
+            if pct > 10:  # Very common = likely background
+                color_type = "Background"
+            elif rgb[0] < 150 and rgb[1] < 150 and rgb[2] < 150:
+                color_type = "Text/Shadow"
+            else:
+                color_type = "Other"
+            print(f"{i:<4} {str(rgb):<20} {count:<8} {pct:<6.1f} {color_type:<15}")
+        print(f"\n💡 Suggested background colors (>5% pixels):")
+        for color_info in analysis['top_colors'][:10]:
+            rgb = color_info['rgb']
+            pct = color_info['percentage']
+            # Suggest colors that are common and not text-like
+            if pct > 5.0 and not (rgb[0] < 150 and rgb[1] < 150 and rgb[2] < 150):
+                print(f"    {rgb},")
+        print(f"{'='*50}")
+    def test_dialogue_box_detection(self, screenshot: Image.Image):
+        """Test dialogue box detection with detailed output for green line method"""
+        print(f"\n🔍 DIALOGUE BOX DETECTION TEST (Green Line Method)")
+        print(f"{'='*50}")
+        # Enable debug mode for detailed output
+        old_debug = self.debug_color_detection
+        self.debug_color_detection = True
+        is_visible = self.is_dialogue_box_visible(screenshot)
+        # Get detailed green line analysis
+        image_np = np.array(screenshot)
+        coords = self.DIALOGUE_BOX_COORDS
+        # Extended region for border detection
+        extended_region = image_np[
+            max(0, coords['y'] - 5):min(image_np.shape[0], coords['y'] + coords['height'] + 5),
+            coords['x']:coords['x'] + coords['width']
+        ]
+        height, width = extended_region.shape[:2]
+        green_border_color = (85, 204, 128)
+        green_tolerance = 15
+        print(f"Search region: {coords['x']},{coords['y']-5} {coords['width']}x{height+10}")
+        print(f"Green border color: {green_border_color}")
+        print(f"Green tolerance: ±{green_tolerance}")
+        # Analyze each row
+        green_line_rows = []
+        for row_idx in range(height):
+            row_pixels = extended_region[row_idx]
+            green_pixels_in_row = 0
+            for pixel in row_pixels:
+                color_diff = np.sqrt(np.sum((pixel - green_border_color) ** 2))
+                if color_diff <= green_tolerance:
+                    green_pixels_in_row += 1
+            green_percentage = green_pixels_in_row / width
+            if green_percentage > 0.3:  # 30% threshold
+                green_line_rows.append({
+                    'row': row_idx,
+                    'green_pixels': green_pixels_in_row,
+                    'percentage': green_percentage * 100
+                })
+        print(f"Found {len(green_line_rows)} green horizontal lines:")
+        for line_info in green_line_rows[:5]:  # Show first 5
+            row = line_info['row']
+            pixels = line_info['green_pixels']
+            pct = line_info['percentage']
+            print(f"  Row {row}: {pixels}/{width} pixels ({pct:.1f}% green)")
+        print(f"\nResult: {'✅ DIALOGUE BOX VISIBLE' if is_visible else '❌ NOT VISIBLE'}")
+        print(f"{'='*50}")
+        # Restore debug setting
+        self.debug_color_detection = old_debug
+        return is_visible
+    def _validate_and_clean_text(self, text: str) -> Optional[str]:
+        """Validate and clean detected text"""
+        if not text or len(text.strip()) < 3:
+            return None
+        # Clean up common OCR errors
+        text = re.sub(r'\n+', ' ', text)  # Replace newlines with spaces
+        text = re.sub(r'\s+', ' ', text)  # Normalize whitespace
+        text = text.strip()
+        # Filter out obviously wrong detections
+        if len(text) < 3 or len(text) > 200:
+            return None
+        # Check for minimum alphabetic content (avoid detecting UI elements)
+        alpha_ratio = sum(c.isalpha() for c in text) / len(text)
+        if alpha_ratio < 0.5:
+            return None
+        # Comprehensive random letter filtering - catch ANY nonsense patterns
+        if self._is_random_nonsense(text):
+            logger.debug(f"OCR validation: Rejected as random nonsense: '{text[:50]}...'")
+            return None
+        return text
+    def _is_random_nonsense(self, text: str) -> bool:
+        """
+        Comprehensive detection of random letter sequences and nonsense text.
+        Catches any type of random letters that don't form meaningful dialogue.
+        """
+        if not text or len(text.strip()) < 3:
+            return True
+        text_lower = text.lower().strip()
+        words = text_lower.split()
+        if len(words) == 0:
+            return True
+        # Pattern 1: Excessive single/double character "words"
+        short_words = [w for w in words if len(w) <= 2]
+        if len(short_words) > len(words) * 0.6:  # More than 60% are very short
+            return True
+        # Pattern 2: Repetitive patterns (like "a a a a a")
+        word_counts = {}
+        for word in words:
+            word_counts[word] = word_counts.get(word, 0) + 1
+        for word, count in word_counts.items():
+            if len(word) <= 2 and count >= 3:  # Short word repeated 3+ times
+                return True
+        # Pattern 3: Too many words (dialogue is usually concise)
+        if len(words) > 30:
+            return True
+        # Pattern 4: Check for valid English-like words
+        valid_words = 0
+        dialogue_words = {
+            'the', 'a', 'an', 'and', 'or', 'but', 'in', 'on', 'at', 'to', 'for', 'of', 'with', 'by',
+            'you', 'i', 'we', 'they', 'he', 'she', 'it', 'this', 'that', 'these', 'those',
+            'is', 'are', 'was', 'were', 'be', 'been', 'being', 'have', 'has', 'had', 'do', 'does', 'did',
+            'will', 'would', 'could', 'should', 'can', 'may', 'might', 'must',
+            'get', 'got', 'give', 'take', 'go', 'come', 'see', 'look', 'want', 'need', 'know', 'think',
+            'pokemon', 'trainer', 'battle', 'items', 'store', 'pc', 'computer', 'use', 'hello', 'hi'
+        }
+        for word in words:
+            clean_word = ''.join(c for c in word if c.isalnum()).lower()
+            if len(clean_word) >= 2:
+                # Check if it's a known good word
+                if clean_word in dialogue_words:
+                    valid_words += 1
+                # Check if it has reasonable letter patterns
+                elif self._has_valid_letter_pattern(clean_word):
+                    valid_words += 1
+        # Need at least 30% valid words
+        valid_ratio = valid_words / len(words) if len(words) > 0 else 0
+        if valid_ratio < 0.3:
+            return True
+        # Pattern 5: Detect excessive mixed case (OCR noise pattern)
+        mixed_case_words = 0
+        for word in words:
+            if len(word) >= 3:
+                has_lower = any(c.islower() for c in word)
+                has_upper = any(c.isupper() for c in word)
+                if has_lower and has_upper and not word[0].isupper():  # Not normal capitalization
+                    mixed_case_words += 1
+        if mixed_case_words > len(words) * 0.4:  # More than 40% have weird capitalization
+            return True
+        return False
+    def _has_valid_letter_pattern(self, word: str) -> bool:
+        """Check if word has valid English-like letter patterns"""
+        if len(word) < 2:
+            return False
+        # Must have at least one vowel (unless very short)
+        vowels = 'aeiou'
+        has_vowel = any(c in vowels for c in word.lower())
+        if len(word) >= 3 and not has_vowel:
+            return False
+        # Check for reasonable consonant clusters
+        consonants = 'bcdfghjklmnpqrstvwxyz'
+        consonant_streak = 0
+        max_consonant_streak = 0
+        for char in word.lower():
+            if char in consonants:
+                consonant_streak += 1
+                max_consonant_streak = max(max_consonant_streak, consonant_streak)
+            else:
+                consonant_streak = 0
+        # Too many consonants in a row suggests OCR noise
+        if max_consonant_streak > 4:
+            return False
+        # Check for excessive repeated characters
+        repeated = 0
+        for i in range(len(word) - 1):
+            if word[i] == word[i + 1]:
+                repeated += 1
+        if repeated > len(word) * 0.4:  # More than 40% repeated chars
+            return False
+        return True
+    def get_stable_dialogue_text(self, screenshot: Image.Image) -> Optional[str]:
+        """
+        Get dialogue text that has been stable across multiple frames.
+        This helps avoid detecting transitional/partial text.
+        """
+        current_text = self.detect_dialogue_from_screenshot(screenshot)
+        if current_text == self.last_detected_text:
+            self.stable_text_count += 1
+        else:
+            self.stable_text_count = 0
+            self.last_detected_text = current_text
+        # Return text only if it's been stable for threshold frames
+        if self.stable_text_count >= self.text_stability_threshold and current_text:
+            return current_text
+        return None
+def create_ocr_detector() -> Optional[OCRDialogueDetector]:
+    """Factory function to create OCR detector if available"""
+    if OCR_AVAILABLE:
+        return OCRDialogueDetector()
+    else:
+        logger.warning("OCR not available - install pytesseract and tesseract-ocr system package")
+        return None

synth-ai 0.2.9.dev0__py3-none-any.whl → 0.2.23.dev3__py3-none-any.whl

synth-ai 0.2.9.dev0py3-none-any.whl → 0.2.23.dev3py3-none-any.whl