PyPI - synth-ai - Versions diffs - 0.2.4.dev6__py3-none-any.whl → 0.2.4.dev8__py3-none-any.whl - Mend

synth-ai 0.2.4.dev6__py3-none-any.whl → 0.2.4.dev8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (256) hide show

synth_ai/__init__.py +18 -9
synth_ai/cli/__init__.py +10 -5
synth_ai/cli/balance.py +25 -32
synth_ai/cli/calc.py +2 -3
synth_ai/cli/demo.py +3 -5
synth_ai/cli/legacy_root_backup.py +58 -32
synth_ai/cli/man.py +22 -19
synth_ai/cli/recent.py +9 -8
synth_ai/cli/root.py +58 -13
synth_ai/cli/status.py +13 -6
synth_ai/cli/traces.py +45 -21
synth_ai/cli/watch.py +40 -37
synth_ai/config/base_url.py +47 -2
synth_ai/core/experiment.py +1 -2
synth_ai/environments/__init__.py +2 -6
synth_ai/environments/environment/artifacts/base.py +3 -1
synth_ai/environments/environment/db/sqlite.py +1 -1
synth_ai/environments/environment/registry.py +19 -20
synth_ai/environments/environment/resources/sqlite.py +2 -3
synth_ai/environments/environment/rewards/core.py +3 -2
synth_ai/environments/environment/tools/__init__.py +6 -4
synth_ai/environments/examples/crafter_classic/__init__.py +1 -1
synth_ai/environments/examples/crafter_classic/engine.py +13 -13
synth_ai/environments/examples/crafter_classic/engine_deterministic_patch.py +1 -0
synth_ai/environments/examples/crafter_classic/engine_helpers/action_map.py +2 -1
synth_ai/environments/examples/crafter_classic/engine_helpers/serialization.py +2 -1
synth_ai/environments/examples/crafter_classic/engine_serialization_patch_v3.py +3 -2
synth_ai/environments/examples/crafter_classic/environment.py +16 -15
synth_ai/environments/examples/crafter_classic/taskset.py +2 -2
synth_ai/environments/examples/crafter_classic/trace_hooks_v3.py +2 -3
synth_ai/environments/examples/crafter_classic/world_config_patch_simple.py +2 -1
synth_ai/environments/examples/crafter_custom/crafter/__init__.py +2 -2
synth_ai/environments/examples/crafter_custom/crafter/config.py +2 -2
synth_ai/environments/examples/crafter_custom/crafter/env.py +1 -5
synth_ai/environments/examples/crafter_custom/crafter/objects.py +1 -2
synth_ai/environments/examples/crafter_custom/crafter/worldgen.py +1 -2
synth_ai/environments/examples/crafter_custom/dataset_builder.py +5 -5
synth_ai/environments/examples/crafter_custom/environment.py +13 -13
synth_ai/environments/examples/crafter_custom/run_dataset.py +5 -5
synth_ai/environments/examples/enron/art_helpers/email_search_tools.py +2 -2
synth_ai/environments/examples/enron/art_helpers/local_email_db.py +5 -4
synth_ai/environments/examples/enron/art_helpers/types_enron.py +2 -1
synth_ai/environments/examples/enron/engine.py +18 -14
synth_ai/environments/examples/enron/environment.py +12 -11
synth_ai/environments/examples/enron/taskset.py +7 -7
synth_ai/environments/examples/minigrid/__init__.py +6 -6
synth_ai/environments/examples/minigrid/engine.py +6 -6
synth_ai/environments/examples/minigrid/environment.py +6 -6
synth_ai/environments/examples/minigrid/puzzle_loader.py +3 -2
synth_ai/environments/examples/minigrid/taskset.py +13 -13
synth_ai/environments/examples/nethack/achievements.py +1 -1
synth_ai/environments/examples/nethack/engine.py +8 -7
synth_ai/environments/examples/nethack/environment.py +10 -9
synth_ai/environments/examples/nethack/helpers/__init__.py +8 -9
synth_ai/environments/examples/nethack/helpers/action_mapping.py +1 -1
synth_ai/environments/examples/nethack/helpers/nle_wrapper.py +2 -1
synth_ai/environments/examples/nethack/helpers/observation_utils.py +1 -1
synth_ai/environments/examples/nethack/helpers/recording_wrapper.py +3 -4
synth_ai/environments/examples/nethack/helpers/trajectory_recorder.py +6 -5
synth_ai/environments/examples/nethack/helpers/visualization/replay_viewer.py +5 -5
synth_ai/environments/examples/nethack/helpers/visualization/visualizer.py +7 -6
synth_ai/environments/examples/nethack/taskset.py +5 -5
synth_ai/environments/examples/red/engine.py +9 -8
synth_ai/environments/examples/red/engine_helpers/reward_components.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/__init__.py +7 -7
synth_ai/environments/examples/red/engine_helpers/reward_library/adaptive_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/battle_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/composite_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/economy_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/efficiency_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/exploration_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/novelty_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/pallet_town_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/pokemon_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/social_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/story_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/screen_analysis.py +3 -2
synth_ai/environments/examples/red/engine_helpers/state_extraction.py +2 -1
synth_ai/environments/examples/red/environment.py +18 -15
synth_ai/environments/examples/red/taskset.py +5 -3
synth_ai/environments/examples/sokoban/engine.py +16 -13
synth_ai/environments/examples/sokoban/engine_helpers/room_utils.py +3 -2
synth_ai/environments/examples/sokoban/engine_helpers/vendored/__init__.py +2 -1
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/__init__.py +1 -1
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/boxoban_env.py +7 -5
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/render_utils.py +1 -1
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/room_utils.py +2 -1
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env.py +5 -4
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_fixed_targets.py +3 -2
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_pull.py +2 -1
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_two_player.py +5 -4
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_variations.py +1 -1
synth_ai/environments/examples/sokoban/environment.py +15 -14
synth_ai/environments/examples/sokoban/generate_verified_puzzles.py +5 -3
synth_ai/environments/examples/sokoban/puzzle_loader.py +3 -2
synth_ai/environments/examples/sokoban/taskset.py +13 -10
synth_ai/environments/examples/tictactoe/engine.py +6 -6
synth_ai/environments/examples/tictactoe/environment.py +8 -7
synth_ai/environments/examples/tictactoe/taskset.py +6 -5
synth_ai/environments/examples/verilog/engine.py +4 -3
synth_ai/environments/examples/verilog/environment.py +11 -10
synth_ai/environments/examples/verilog/taskset.py +14 -12
synth_ai/environments/examples/wordle/__init__.py +5 -5
synth_ai/environments/examples/wordle/engine.py +32 -25
synth_ai/environments/examples/wordle/environment.py +21 -16
synth_ai/environments/examples/wordle/helpers/generate_instances_wordfreq.py +6 -6
synth_ai/environments/examples/wordle/taskset.py +20 -12
synth_ai/environments/reproducibility/core.py +1 -1
synth_ai/environments/reproducibility/tree.py +21 -21
synth_ai/environments/service/app.py +3 -2
synth_ai/environments/service/core_routes.py +104 -110
synth_ai/environments/service/external_registry.py +1 -2
synth_ai/environments/service/registry.py +1 -1
synth_ai/environments/stateful/core.py +1 -2
synth_ai/environments/stateful/engine.py +1 -1
synth_ai/environments/tasks/api.py +4 -4
synth_ai/environments/tasks/core.py +14 -12
synth_ai/environments/tasks/filters.py +6 -4
synth_ai/environments/tasks/utils.py +13 -11
synth_ai/evals/base.py +2 -3
synth_ai/experimental/synth_oss.py +4 -4
synth_ai/http.py +102 -0
synth_ai/inference/__init__.py +7 -0
synth_ai/inference/client.py +20 -0
synth_ai/jobs/client.py +246 -0
synth_ai/learning/__init__.py +24 -0
synth_ai/learning/client.py +149 -0
synth_ai/learning/config.py +43 -0
synth_ai/learning/constants.py +29 -0
synth_ai/learning/ft_client.py +59 -0
synth_ai/learning/gateway.py +1 -3
synth_ai/learning/health.py +43 -0
synth_ai/learning/jobs.py +205 -0
synth_ai/learning/prompts/banking77_injection_eval.py +15 -10
synth_ai/learning/prompts/hello_world_in_context_injection_ex.py +26 -14
synth_ai/learning/prompts/mipro.py +61 -52
synth_ai/learning/prompts/random_search.py +42 -43
synth_ai/learning/prompts/run_mipro_banking77.py +32 -20
synth_ai/learning/prompts/run_random_search_banking77.py +71 -52
synth_ai/learning/rl_client.py +256 -0
synth_ai/learning/sse.py +58 -0
synth_ai/learning/validators.py +48 -0
synth_ai/lm/__init__.py +5 -5
synth_ai/lm/caching/ephemeral.py +9 -9
synth_ai/lm/caching/handler.py +20 -20
synth_ai/lm/caching/persistent.py +10 -10
synth_ai/lm/config.py +3 -3
synth_ai/lm/constants.py +7 -7
synth_ai/lm/core/all.py +17 -3
synth_ai/lm/core/exceptions.py +0 -2
synth_ai/lm/core/main.py +26 -41
synth_ai/lm/core/main_v3.py +33 -10
synth_ai/lm/core/synth_models.py +48 -0
synth_ai/lm/core/vendor_clients.py +26 -22
synth_ai/lm/injection.py +7 -8
synth_ai/lm/overrides.py +21 -19
synth_ai/lm/provider_support/__init__.py +1 -1
synth_ai/lm/provider_support/anthropic.py +15 -15
synth_ai/lm/provider_support/openai.py +23 -21
synth_ai/lm/structured_outputs/handler.py +34 -32
synth_ai/lm/structured_outputs/inject.py +24 -27
synth_ai/lm/structured_outputs/rehabilitate.py +19 -15
synth_ai/lm/tools/base.py +17 -16
synth_ai/lm/unified_interface.py +17 -18
synth_ai/lm/vendors/base.py +20 -18
synth_ai/lm/vendors/core/anthropic_api.py +36 -27
synth_ai/lm/vendors/core/gemini_api.py +31 -36
synth_ai/lm/vendors/core/mistral_api.py +19 -19
synth_ai/lm/vendors/core/openai_api.py +42 -13
synth_ai/lm/vendors/openai_standard.py +158 -101
synth_ai/lm/vendors/openai_standard_responses.py +74 -61
synth_ai/lm/vendors/retries.py +9 -1
synth_ai/lm/vendors/supported/custom_endpoint.py +38 -28
synth_ai/lm/vendors/supported/deepseek.py +10 -10
synth_ai/lm/vendors/supported/grok.py +8 -8
synth_ai/lm/vendors/supported/ollama.py +2 -1
synth_ai/lm/vendors/supported/openrouter.py +11 -9
synth_ai/lm/vendors/synth_client.py +425 -75
synth_ai/lm/warmup.py +8 -7
synth_ai/rl/__init__.py +30 -0
synth_ai/rl/contracts.py +32 -0
synth_ai/rl/env_keys.py +137 -0
synth_ai/rl/secrets.py +19 -0
synth_ai/scripts/verify_rewards.py +100 -0
synth_ai/task/__init__.py +10 -0
synth_ai/task/contracts.py +120 -0
synth_ai/task/health.py +28 -0
synth_ai/task/validators.py +12 -0
synth_ai/tracing/__init__.py +22 -10
synth_ai/tracing_v1/__init__.py +22 -20
synth_ai/tracing_v3/__init__.py +7 -7
synth_ai/tracing_v3/abstractions.py +56 -52
synth_ai/tracing_v3/config.py +4 -2
synth_ai/tracing_v3/db_config.py +6 -8
synth_ai/tracing_v3/decorators.py +29 -30
synth_ai/tracing_v3/examples/basic_usage.py +12 -12
synth_ai/tracing_v3/hooks.py +24 -22
synth_ai/tracing_v3/llm_call_record_helpers.py +85 -98
synth_ai/tracing_v3/lm_call_record_abstractions.py +2 -4
synth_ai/tracing_v3/migration_helper.py +3 -5
synth_ai/tracing_v3/replica_sync.py +30 -32
synth_ai/tracing_v3/session_tracer.py +158 -31
synth_ai/tracing_v3/storage/__init__.py +1 -1
synth_ai/tracing_v3/storage/base.py +8 -7
synth_ai/tracing_v3/storage/config.py +4 -4
synth_ai/tracing_v3/storage/factory.py +4 -4
synth_ai/tracing_v3/storage/utils.py +9 -9
synth_ai/tracing_v3/turso/__init__.py +3 -3
synth_ai/tracing_v3/turso/daemon.py +9 -9
synth_ai/tracing_v3/turso/manager.py +278 -48
synth_ai/tracing_v3/turso/models.py +77 -19
synth_ai/tracing_v3/utils.py +5 -5
synth_ai/v0/tracing/abstractions.py +28 -28
synth_ai/v0/tracing/base_client.py +9 -9
synth_ai/v0/tracing/client_manager.py +7 -7
synth_ai/v0/tracing/config.py +7 -7
synth_ai/v0/tracing/context.py +6 -6
synth_ai/v0/tracing/decorators.py +6 -5
synth_ai/v0/tracing/events/manage.py +1 -1
synth_ai/v0/tracing/events/store.py +5 -4
synth_ai/v0/tracing/immediate_client.py +4 -5
synth_ai/v0/tracing/local.py +3 -3
synth_ai/v0/tracing/log_client_base.py +4 -5
synth_ai/v0/tracing/retry_queue.py +5 -6
synth_ai/v0/tracing/trackers.py +25 -25
synth_ai/v0/tracing/upload.py +6 -0
synth_ai/v0/tracing_v1/__init__.py +1 -1
synth_ai/v0/tracing_v1/abstractions.py +28 -28
synth_ai/v0/tracing_v1/base_client.py +9 -9
synth_ai/v0/tracing_v1/client_manager.py +7 -7
synth_ai/v0/tracing_v1/config.py +7 -7
synth_ai/v0/tracing_v1/context.py +6 -6
synth_ai/v0/tracing_v1/decorators.py +7 -6
synth_ai/v0/tracing_v1/events/manage.py +1 -1
synth_ai/v0/tracing_v1/events/store.py +5 -4
synth_ai/v0/tracing_v1/immediate_client.py +4 -5
synth_ai/v0/tracing_v1/local.py +3 -3
synth_ai/v0/tracing_v1/log_client_base.py +4 -5
synth_ai/v0/tracing_v1/retry_queue.py +5 -6
synth_ai/v0/tracing_v1/trackers.py +25 -25
synth_ai/v0/tracing_v1/upload.py +25 -24
synth_ai/zyk/__init__.py +1 -0
synth_ai-0.2.4.dev8.dist-info/METADATA +635 -0
synth_ai-0.2.4.dev8.dist-info/RECORD +317 -0
synth_ai/tui/__init__.py +0 -1
synth_ai/tui/__main__.py +0 -13
synth_ai/tui/cli/__init__.py +0 -1
synth_ai/tui/cli/query_experiments.py +0 -165
synth_ai/tui/cli/query_experiments_v3.py +0 -165
synth_ai/tui/dashboard.py +0 -329
synth_ai-0.2.4.dev6.dist-info/METADATA +0 -203
synth_ai-0.2.4.dev6.dist-info/RECORD +0 -299
{synth_ai-0.2.4.dev6.dist-info → synth_ai-0.2.4.dev8.dist-info}/WHEEL +0 -0
{synth_ai-0.2.4.dev6.dist-info → synth_ai-0.2.4.dev8.dist-info}/entry_points.txt +0 -0
{synth_ai-0.2.4.dev6.dist-info → synth_ai-0.2.4.dev8.dist-info}/licenses/LICENSE +0 -0
{synth_ai-0.2.4.dev6.dist-info → synth_ai-0.2.4.dev8.dist-info}/top_level.txt +0 -0

synth_ai/lm/vendors/openai_standard.py CHANGED Viewed

@@ -1,24 +1,28 @@
-from typing import Any, Dict, List, Optional, Union
 import asyncio
+import os
 import time
+from typing import Any
+import backoff
 import groq
 import openai
-import os
 import pydantic_core
 from pydantic import BaseModel
 from synth_ai.lm.caching.initialize import (
     get_cache_handler,
 )
+from synth_ai.lm.constants import SPECIAL_BASE_TEMPS
+from synth_ai.lm.injection import apply_injection
+from synth_ai.lm.overrides import (
+    apply_param_overrides,
+    apply_tool_overrides,
+    use_overrides_for_messages,
+)
 from synth_ai.lm.tools.base import BaseTool
 from synth_ai.lm.vendors.base import BaseLMResponse, VendorBase
-from synth_ai.lm.injection import apply_injection
-from synth_ai.lm.overrides import use_overrides_for_messages, apply_param_overrides, apply_tool_overrides
-from synth_ai.lm.constants import SPECIAL_BASE_TEMPS
-from synth_ai.lm.vendors.retries import MAX_BACKOFF
 from synth_ai.lm.vendors.openai_standard_responses import OpenAIResponsesAPIMixin
-import backoff
+from synth_ai.lm.vendors.retries import MAX_BACKOFF
 DEFAULT_EXCEPTIONS_TO_RETRY = (
     pydantic_core._pydantic_core.ValidationError,
@@ -30,14 +34,14 @@ DEFAULT_EXCEPTIONS_TO_RETRY = (
 )
-def special_orion_transform(model: str, messages: List[Dict[str, Any]]) -> List[Dict[str, Any]]:
+def special_orion_transform(model: str, messages: list[dict[str, Any]]) -> list[dict[str, Any]]:
     """
     Transform messages for O1 series models which don't support system messages.
     Args:
         model: Model name to check
         messages: Original messages list
     Returns:
         Transformed messages list with system content merged into user message
     """
@@ -59,18 +63,19 @@ def _silent_backoff_handler(_details):
 class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
     """
     Standard OpenAI-compatible vendor implementation.
     This class provides a standard implementation for OpenAI-compatible APIs,
     including proper retry logic, caching, and support for various model features.
     Attributes:
         used_for_structured_outputs: Whether this client supports structured outputs
         exceptions_to_retry: List of exceptions that trigger automatic retries
         sync_client: Synchronous API client
         async_client: Asynchronous API client
     """
     used_for_structured_outputs: bool = True
-    exceptions_to_retry: List = DEFAULT_EXCEPTIONS_TO_RETRY
+    exceptions_to_retry: list = DEFAULT_EXCEPTIONS_TO_RETRY
     sync_client: Any
     async_client: Any
@@ -78,19 +83,20 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
         self,
         sync_client: Any,
         async_client: Any,
-        exceptions_to_retry: List[Exception] = DEFAULT_EXCEPTIONS_TO_RETRY,
+        exceptions_to_retry: list[Exception] = DEFAULT_EXCEPTIONS_TO_RETRY,
         used_for_structured_outputs: bool = False,
     ):
         self.sync_client = sync_client
         self.async_client = async_client
         self.used_for_structured_outputs = used_for_structured_outputs
         self.exceptions_to_retry = exceptions_to_retry
         # Initialize Harmony support for OSS models
         self.harmony_available = False
         self.harmony_enc = None
         try:
-            from openai_harmony import load_harmony_encoding, HarmonyEncodingName
+            from openai_harmony import HarmonyEncodingName, load_harmony_encoding
             self.harmony_available = True
             self.harmony_enc = load_harmony_encoding(HarmonyEncodingName.HARMONY_GPT_OSS)
         except ImportError:
@@ -106,24 +112,24 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
     async def _hit_api_async(
         self,
         model: str,
-        messages: List[Dict[str, Any]],
-        lm_config: Dict[str, Any],
+        messages: list[dict[str, Any]],
+        lm_config: dict[str, Any],
         use_ephemeral_cache_only: bool = False,
         reasoning_effort: str = "high",
-        tools: Optional[List[BaseTool]] = None,
+        tools: list[BaseTool] | None = None,
     ) -> BaseLMResponse:
-        assert lm_config.get("response_model", None) is None, (
+        assert lm_config.get("response_model") is None, (
             "response_model is not supported for standard calls"
         )
-        DEBUG = os.getenv("SYNTH_OPENAI_DEBUG") == "1"
-        if DEBUG:
-            print(f"🔍 OPENAI DEBUG: _hit_api_async called with:")
+        debug = os.getenv("SYNTH_OPENAI_DEBUG") == "1"
+        if debug:
+            print("🔍 OPENAI DEBUG: _hit_api_async called with:")
             print(f"   Model: {model}")
-            print(f"   Messages: {len(messages)} messages")
+            print(f"   Messages: {len(messages)} messages")
             print(f"   Tools: {len(tools) if tools else 0} tools")
             print(f"   LM config: {lm_config}")
         messages = special_orion_transform(model, messages)
         # Apply context-scoped overrides and prompt injection just before building API params
         with use_overrides_for_messages(messages):
@@ -133,15 +139,14 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
         cache_result = used_cache_handler.hit_managed_cache(
             model, messages, lm_config=lm_config, tools=tools
         )
-        if cache_result:
-            if DEBUG:
-                print(f"🔍 OPENAI DEBUG: Cache hit! Returning cached result")
-                print(f"   Cache result type: {type(cache_result)}")
-                print(f"🔍 OPENAI DEBUG: DISABLING CACHE FOR DEBUGGING - forcing API call")
-            # return cache_result  # Commented out to force API call
-        if DEBUG:
-            print(f"🔍 OPENAI DEBUG: Cache miss, making actual API call")
+        if cache_result and debug:
+            print("🔍 OPENAI DEBUG: Cache hit! Returning cached result")
+            print(f"   Cache result type: {type(cache_result)}")
+            print("🔍 OPENAI DEBUG: DISABLING CACHE FOR DEBUGGING - forcing API call")
+            # return cache_result  # Commented out intentionally when debug is on
+        if debug:
+            print("🔍 OPENAI DEBUG: Cache miss, making actual API call")
         # Common API call params
         api_params = {
@@ -202,7 +207,22 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
             api_params = apply_tool_overrides(api_params)
             api_params = apply_param_overrides(api_params)
-        # Forward Qwen3 chat template kwargs via extra_body when requested
+        # Thinking controls: route via extra_body.chat_template_kwargs for compatibility
+        thinking_mode_val = lm_config.get("thinking_mode")
+        thinking_budget_val = lm_config.get("thinking_budget")
+        if thinking_mode_val is not None or thinking_budget_val is not None:
+            api_params["extra_body"] = api_params.get("extra_body", {})
+            ctk = api_params["extra_body"].get("chat_template_kwargs", {})
+            if thinking_mode_val is not None:
+                ctk["thinking_mode"] = thinking_mode_val
+            if thinking_budget_val is not None:
+                try:
+                    ctk["thinking_budget"] = int(thinking_budget_val)
+                except Exception:
+                    ctk["thinking_budget"] = thinking_budget_val
+            api_params["extra_body"]["chat_template_kwargs"] = ctk
+        # Backward-compatible: forward legacy enable_thinking only via extra_body for callers still using it
         if lm_config.get("enable_thinking") is not None:
             api_params["extra_body"] = api_params.get("extra_body", {})
             ctk = api_params["extra_body"].get("chat_template_kwargs", {})
@@ -211,8 +231,11 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
         # Forward arbitrary extra_body from lm_config if provided (merge)
         if lm_config.get("extra_body") is not None:
             # Shallow-merge top-level keys; nested keys (like chat_template_kwargs) should be provided whole
-            api_params["extra_body"] = {**api_params.get("extra_body", {}), **(lm_config.get("extra_body") or {})}
-        # Forward Qwen3 chat template kwargs via extra_body when requested
+            api_params["extra_body"] = {
+                **api_params.get("extra_body", {}),
+                **(lm_config.get("extra_body") or {}),
+            }
+        # Ensure legacy extra_body flag remains merged (do not override top-level fields)
         if lm_config.get("enable_thinking") is not None:
             api_params["extra_body"] = api_params.get("extra_body", {})
             ctk = api_params["extra_body"].get("chat_template_kwargs", {})
@@ -233,9 +256,7 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
         except Exception:
             base_url_str = ""
-        is_external_provider = (
-            "openai.com" in base_url_str or "api.groq.com" in base_url_str
-        )
+        is_external_provider = "openai.com" in base_url_str or "api.groq.com" in base_url_str
         if is_external_provider:
             # Remove extra_body entirely; this is Synth-specific plumbing
@@ -257,18 +278,18 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
                     api_params.pop("temperature", None)
         # Call API with better auth error reporting
-        #try:
-        if DEBUG:
-            print(f"🔍 OPENAI DEBUG: Making request with params:")
+        # try:
+        if debug:
+            print("🔍 OPENAI DEBUG: Making request with params:")
             print(f"   Model: {api_params.get('model')}")
             print(f"   Messages: {len(api_params.get('messages', []))} messages")
             print(f"   Tools: {len(api_params.get('tools', []))} tools")
             print(f"   Max tokens: {api_params.get('max_tokens', 'NOT SET')}")
             print(f"   Temperature: {api_params.get('temperature', 'NOT SET')}")
-            if 'tools' in api_params:
+            if "tools" in api_params:
                 print(f"   First tool: {api_params['tools'][0]}")
             print(f"   FULL API PARAMS: {api_params}")
         # Quiet targeted retry for OpenAI 400 tool_use_failed during tool-calling
         try:
             max_attempts_for_tool_use = int(os.getenv("SYNTH_TOOL_USE_RETRIES", "5"))
@@ -294,7 +315,9 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
                         err_obj = body.get("error") if isinstance(body.get("error"), dict) else {}
                         code_val = err_obj.get("code")
                         msg_val = err_obj.get("message")
-                        if code_val == "tool_use_failed" or (isinstance(msg_val, str) and "Failed to call a function" in msg_val):
+                        if code_val == "tool_use_failed" or (
+                            isinstance(msg_val, str) and "Failed to call a function" in msg_val
+                        ):
                             should_retry = True
                     except Exception:
                         pass
@@ -308,7 +331,10 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
                                 err_obj = j.get("error") if isinstance(j.get("error"), dict) else {}
                                 code_val = err_obj.get("code")
                                 msg_val = err_obj.get("message")
-                                if code_val == "tool_use_failed" or (isinstance(msg_val, str) and "Failed to call a function" in msg_val):
+                                if code_val == "tool_use_failed" or (
+                                    isinstance(msg_val, str)
+                                    and "Failed to call a function" in msg_val
+                                ):
                                     should_retry = True
                     except Exception:
                         pass
@@ -323,33 +349,37 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
                     attempt_index += 1
                     continue
                 raise
-        if DEBUG:
-            print(f"🔍 OPENAI DEBUG: Response received:")
+        if debug:
+            print("🔍 OPENAI DEBUG: Response received:")
             print(f"   Type: {type(output)}")
             print(f"   Choices: {len(output.choices) if hasattr(output, 'choices') else 'N/A'}")
-            if hasattr(output, 'choices') and output.choices:
+            if hasattr(output, "choices") and output.choices:
                 choice = output.choices[0]
                 print(f"   Choice type: {type(choice)}")
-                if hasattr(choice, 'message'):
+                if hasattr(choice, "message"):
                     message = choice.message
                     print(f"   Message type: {type(message)}")
                     print(f"   Has tool_calls: {hasattr(message, 'tool_calls')}")
-                    if hasattr(message, 'tool_calls'):
+                    if hasattr(message, "tool_calls"):
                         print(f"   Tool calls: {message.tool_calls}")
-                    print(f"   Content: {message.content[:200] if hasattr(message, 'content') and message.content else 'None'}...")
+                    print(
+                        f"   Content: {message.content[:200] if hasattr(message, 'content') and message.content else 'None'}..."
+                    )
                 # Show finish_reason and usage if available
                 try:
                     print(f"   finish_reason: {getattr(choice, 'finish_reason', None)}")
-                    usage = getattr(output, 'usage', None)
+                    usage = getattr(output, "usage", None)
                     if usage:
-                        print(f"   usage: prompt_tokens={getattr(usage, 'prompt_tokens', None)}, completion_tokens={getattr(usage, 'completion_tokens', None)}, total_tokens={getattr(usage, 'total_tokens', None)}")
+                        print(
+                            f"   usage: prompt_tokens={getattr(usage, 'prompt_tokens', None)}, completion_tokens={getattr(usage, 'completion_tokens', None)}, total_tokens={getattr(usage, 'total_tokens', None)}"
+                        )
                 except Exception:
                     pass
-        if DEBUG:
-            print(f"🔍 OPENAI DEBUG: FULL RAW RESPONSE:")
-            if hasattr(output.choices[0].message, 'content') and output.choices[0].message.content:
+        if debug:
+            print("🔍 OPENAI DEBUG: FULL RAW RESPONSE:")
+            if hasattr(output.choices[0].message, "content") and output.choices[0].message.content:
                 print(f"   FULL CONTENT:\n{output.choices[0].message.content}")
             print(f"   Raw choice: {choice}")
             print(f"   Raw message: {message}")
@@ -372,30 +402,46 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
         #     raise
         message = output.choices[0].message
-        # Convert tool calls to dict format
+        # Convert tool calls to dict format, preferring dict-shaped entries first
         tool_calls = None
         if message.tool_calls:
-            tool_calls = [
-                {
-                    "id": tc.id,
-                    "type": tc.type,
-                    "function": {
-                        "name": tc.function.name,
-                        "arguments": tc.function.arguments,
-                    },
-                }
-                for tc in message.tool_calls
-            ]
+            converted: list[dict] = []
+            for tc in message.tool_calls:
+                if isinstance(tc, dict):
+                    fn = tc.get("function") or {}
+                    converted.append(
+                        {
+                            "id": tc.get("id"),
+                            "type": tc.get("type", "function"),
+                            "function": {
+                                "name": fn.get("name") or tc.get("name"),
+                                "arguments": fn.get("arguments") or tc.get("arguments"),
+                            },
+                        }
+                    )
+                else:
+                    # SDK object path
+                    converted.append(
+                        {
+                            "id": getattr(tc, "id", None),
+                            "type": getattr(tc, "type", "function"),
+                            "function": {
+                                "name": getattr(getattr(tc, "function", None), "name", None),
+                                "arguments": getattr(getattr(tc, "function", None), "arguments", None),
+                            },
+                        }
+                    )
+            tool_calls = converted or None
         # Attach basic usage if available
         usage_dict = None
         try:
-            usage_obj = getattr(output, 'usage', None)
+            usage_obj = getattr(output, "usage", None)
             if usage_obj is not None:
                 usage_dict = {
-                    "prompt_tokens": getattr(usage_obj, 'prompt_tokens', None),
-                    "completion_tokens": getattr(usage_obj, 'completion_tokens', None),
-                    "total_tokens": getattr(usage_obj, 'total_tokens', None),
+                    "prompt_tokens": getattr(usage_obj, "prompt_tokens", None),
+                    "completion_tokens": getattr(usage_obj, "completion_tokens", None),
+                    "total_tokens": getattr(usage_obj, "total_tokens", None),
                 }
         except Exception:
             usage_dict = None
@@ -422,13 +468,13 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
     def _hit_api_sync(
         self,
         model: str,
-        messages: List[Dict[str, Any]],
-        lm_config: Dict[str, Any],
+        messages: list[dict[str, Any]],
+        lm_config: dict[str, Any],
         use_ephemeral_cache_only: bool = False,
         reasoning_effort: str = "high",
-        tools: Optional[List[BaseTool]] = None,
+        tools: list[BaseTool] | None = None,
     ) -> BaseLMResponse:
-        assert lm_config.get("response_model", None) is None, (
+        assert lm_config.get("response_model") is None, (
             "response_model is not supported for standard calls"
         )
         messages = special_orion_transform(model, messages)
@@ -441,8 +487,8 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
             model, messages, lm_config=lm_config, tools=tools
         )
         # During pytest runs, bypass returning cache to allow tests to inspect outgoing params
-        IN_PYTEST = os.getenv("PYTEST_CURRENT_TEST") is not None
-        if cache_result and not IN_PYTEST:
+        in_pytest = os.getenv("PYTEST_CURRENT_TEST") is not None
+        if cache_result and not in_pytest:
             return cache_result
         # Common API call params
@@ -514,7 +560,9 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
                         err_obj = body.get("error") if isinstance(body.get("error"), dict) else {}
                         code_val = err_obj.get("code")
                         msg_val = err_obj.get("message")
-                        if code_val == "tool_use_failed" or (isinstance(msg_val, str) and "Failed to call a function" in msg_val):
+                        if code_val == "tool_use_failed" or (
+                            isinstance(msg_val, str) and "Failed to call a function" in msg_val
+                        ):
                             should_retry = True
                     except Exception:
                         pass
@@ -527,7 +575,10 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
                                 err_obj = j.get("error") if isinstance(j.get("error"), dict) else {}
                                 code_val = err_obj.get("code")
                                 msg_val = err_obj.get("message")
-                                if code_val == "tool_use_failed" or (isinstance(msg_val, str) and "Failed to call a function" in msg_val):
+                                if code_val == "tool_use_failed" or (
+                                    isinstance(msg_val, str)
+                                    and "Failed to call a function" in msg_val
+                                ):
                                     should_retry = True
                     except Exception:
                         pass
@@ -542,13 +593,17 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
                     continue
                 raise
         message = output.choices[0].message
-        DEBUG = os.getenv("SYNTH_OPENAI_DEBUG") == "1"
-        if DEBUG:
+        debug_sync = os.getenv("SYNTH_OPENAI_DEBUG") == "1"
+        if debug_sync:
             try:
-                print(f"🔍 OPENAI DEBUG (sync): finish_reason={getattr(output.choices[0], 'finish_reason', None)}")
-                usage = getattr(output, 'usage', None)
+                print(
+                    f"🔍 OPENAI DEBUG (sync): finish_reason={getattr(output.choices[0], 'finish_reason', None)}"
+                )
+                usage = getattr(output, "usage", None)
                 if usage:
-                    print(f"🔍 OPENAI DEBUG (sync): usage prompt_tokens={getattr(usage, 'prompt_tokens', None)}, completion_tokens={getattr(usage, 'completion_tokens', None)}, total_tokens={getattr(usage, 'total_tokens', None)}")
+                    print(
+                        f"🔍 OPENAI DEBUG (sync): usage prompt_tokens={getattr(usage, 'prompt_tokens', None)}, completion_tokens={getattr(usage, 'completion_tokens', None)}, total_tokens={getattr(usage, 'total_tokens', None)}"
+                    )
             except Exception:
                 pass
@@ -570,12 +625,12 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
         # Attach basic usage if available
         usage_dict = None
         try:
-            usage_obj = getattr(output, 'usage', None)
+            usage_obj = getattr(output, "usage", None)
             if usage_obj is not None:
                 usage_dict = {
-                    "prompt_tokens": getattr(usage_obj, 'prompt_tokens', None),
-                    "completion_tokens": getattr(usage_obj, 'completion_tokens', None),
-                    "total_tokens": getattr(usage_obj, 'total_tokens', None),
+                    "prompt_tokens": getattr(usage_obj, "prompt_tokens", None),
+                    "completion_tokens": getattr(usage_obj, "completion_tokens", None),
+                    "total_tokens": getattr(usage_obj, "total_tokens", None),
                 }
         except Exception:
             usage_dict = None
@@ -595,12 +650,12 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
     async def _hit_api_async_structured_output(
         self,
         model: str,
-        messages: List[Dict[str, Any]],
+        messages: list[dict[str, Any]],
         response_model: BaseModel,
         temperature: float,
         use_ephemeral_cache_only: bool = False,
         reasoning_effort: str = "high",
-        tools: Optional[List[BaseTool]] = None,
+        tools: list[BaseTool] | None = None,
     ) -> BaseLMResponse:
         lm_config = {
             "temperature": temperature,
@@ -608,7 +663,7 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
             "reasoning_effort": reasoning_effort,
         }
         used_cache_handler = get_cache_handler(use_ephemeral_cache_only)
-        cache_result: Union[BaseLMResponse, None] = used_cache_handler.hit_managed_cache(
+        cache_result: BaseLMResponse | None = used_cache_handler.hit_managed_cache(
             model, messages, lm_config=lm_config, tools=tools
         )
         if cache_result is not None:
@@ -654,12 +709,12 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
     def _hit_api_sync_structured_output(
         self,
         model: str,
-        messages: List[Dict[str, Any]],
+        messages: list[dict[str, Any]],
         response_model: BaseModel,
         temperature: float,
         use_ephemeral_cache_only: bool = False,
         reasoning_effort: str = "high",
-        tools: Optional[List[BaseTool]] = None,
+        tools: list[BaseTool] | None = None,
     ) -> BaseLMResponse:
         lm_config = {
             "temperature": temperature,
@@ -667,7 +722,7 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
             "reasoning_effort": reasoning_effort,
         }
         used_cache_handler = get_cache_handler(use_ephemeral_cache_only)
-        cache_result: Union[BaseLMResponse, None] = used_cache_handler.hit_managed_cache(
+        cache_result: BaseLMResponse | None = used_cache_handler.hit_managed_cache(
             model, messages, lm_config=lm_config, tools=tools
         )
         if cache_result is not None:
@@ -701,7 +756,9 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
             base_url_str_sync = str(base_url_obj) if base_url_obj is not None else ""
         except Exception:
             base_url_str_sync = ""
-        if ("openai.com" in base_url_str_sync or "api.groq.com" in base_url_str_sync) and model.startswith("gpt-5"):
+        if (
+            "openai.com" in base_url_str_sync or "api.groq.com" in base_url_str_sync
+        ) and model.startswith("gpt-5"):
             if "max_tokens" in api_params:
                 api_params["max_completion_tokens"] = api_params.pop("max_tokens")
             if "temperature" in api_params:

synth-ai 0.2.4.dev6__py3-none-any.whl → 0.2.4.dev8__py3-none-any.whl

synth-ai 0.2.4.dev6__py3-none-any.whl → 0.2.4.dev8__py3-none-any.whl