PyPI - synth-ai - Versions diffs - 0.2.4.dev5__py3-none-any.whl → 0.2.4.dev7__py3-none-any.whl - Mend

synth-ai 0.2.4.dev5-py3-none-any.whl → 0.2.4.dev7-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (229) hide show

synth_ai/__init__.py +18 -9
synth_ai/cli/__init__.py +10 -5
synth_ai/cli/balance.py +22 -17
synth_ai/cli/calc.py +2 -3
synth_ai/cli/demo.py +3 -5
synth_ai/cli/legacy_root_backup.py +58 -32
synth_ai/cli/man.py +22 -19
synth_ai/cli/recent.py +9 -8
synth_ai/cli/root.py +58 -13
synth_ai/cli/status.py +13 -6
synth_ai/cli/traces.py +45 -21
synth_ai/cli/watch.py +40 -37
synth_ai/config/base_url.py +1 -3
synth_ai/core/experiment.py +1 -2
synth_ai/environments/__init__.py +2 -6
synth_ai/environments/environment/artifacts/base.py +3 -1
synth_ai/environments/environment/db/sqlite.py +1 -1
synth_ai/environments/environment/registry.py +19 -20
synth_ai/environments/environment/resources/sqlite.py +2 -3
synth_ai/environments/environment/rewards/core.py +3 -2
synth_ai/environments/environment/tools/__init__.py +6 -4
synth_ai/environments/examples/crafter_classic/__init__.py +1 -1
synth_ai/environments/examples/crafter_classic/engine.py +21 -17
synth_ai/environments/examples/crafter_classic/engine_deterministic_patch.py +1 -0
synth_ai/environments/examples/crafter_classic/engine_helpers/action_map.py +2 -1
synth_ai/environments/examples/crafter_classic/engine_helpers/serialization.py +2 -1
synth_ai/environments/examples/crafter_classic/engine_serialization_patch_v3.py +3 -2
synth_ai/environments/examples/crafter_classic/environment.py +16 -15
synth_ai/environments/examples/crafter_classic/taskset.py +2 -2
synth_ai/environments/examples/crafter_classic/trace_hooks_v3.py +2 -3
synth_ai/environments/examples/crafter_classic/world_config_patch_simple.py +2 -1
synth_ai/environments/examples/crafter_custom/crafter/__init__.py +2 -2
synth_ai/environments/examples/crafter_custom/crafter/config.py +2 -2
synth_ai/environments/examples/crafter_custom/crafter/env.py +1 -5
synth_ai/environments/examples/crafter_custom/crafter/objects.py +1 -2
synth_ai/environments/examples/crafter_custom/crafter/worldgen.py +1 -2
synth_ai/environments/examples/crafter_custom/dataset_builder.py +5 -5
synth_ai/environments/examples/crafter_custom/environment.py +13 -13
synth_ai/environments/examples/crafter_custom/run_dataset.py +5 -5
synth_ai/environments/examples/enron/art_helpers/email_search_tools.py +2 -2
synth_ai/environments/examples/enron/art_helpers/local_email_db.py +5 -4
synth_ai/environments/examples/enron/art_helpers/types_enron.py +2 -1
synth_ai/environments/examples/enron/engine.py +18 -14
synth_ai/environments/examples/enron/environment.py +12 -11
synth_ai/environments/examples/enron/taskset.py +7 -7
synth_ai/environments/examples/minigrid/__init__.py +6 -6
synth_ai/environments/examples/minigrid/engine.py +6 -6
synth_ai/environments/examples/minigrid/environment.py +6 -6
synth_ai/environments/examples/minigrid/puzzle_loader.py +3 -2
synth_ai/environments/examples/minigrid/taskset.py +13 -13
synth_ai/environments/examples/nethack/achievements.py +1 -1
synth_ai/environments/examples/nethack/engine.py +8 -7
synth_ai/environments/examples/nethack/environment.py +10 -9
synth_ai/environments/examples/nethack/helpers/__init__.py +8 -9
synth_ai/environments/examples/nethack/helpers/action_mapping.py +1 -1
synth_ai/environments/examples/nethack/helpers/nle_wrapper.py +2 -1
synth_ai/environments/examples/nethack/helpers/observation_utils.py +1 -1
synth_ai/environments/examples/nethack/helpers/recording_wrapper.py +3 -4
synth_ai/environments/examples/nethack/helpers/trajectory_recorder.py +6 -5
synth_ai/environments/examples/nethack/helpers/visualization/replay_viewer.py +5 -5
synth_ai/environments/examples/nethack/helpers/visualization/visualizer.py +7 -6
synth_ai/environments/examples/nethack/taskset.py +5 -5
synth_ai/environments/examples/red/engine.py +9 -8
synth_ai/environments/examples/red/engine_helpers/reward_components.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/__init__.py +7 -7
synth_ai/environments/examples/red/engine_helpers/reward_library/adaptive_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/battle_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/composite_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/economy_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/efficiency_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/exploration_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/novelty_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/pallet_town_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/pokemon_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/social_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/reward_library/story_rewards.py +2 -1
synth_ai/environments/examples/red/engine_helpers/screen_analysis.py +3 -2
synth_ai/environments/examples/red/engine_helpers/state_extraction.py +2 -1
synth_ai/environments/examples/red/environment.py +18 -15
synth_ai/environments/examples/red/taskset.py +5 -3
synth_ai/environments/examples/sokoban/engine.py +16 -13
synth_ai/environments/examples/sokoban/engine_helpers/room_utils.py +3 -2
synth_ai/environments/examples/sokoban/engine_helpers/vendored/__init__.py +2 -1
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/__init__.py +1 -1
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/boxoban_env.py +7 -5
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/render_utils.py +1 -1
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/room_utils.py +2 -1
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env.py +5 -4
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_fixed_targets.py +3 -2
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_pull.py +2 -1
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_two_player.py +5 -4
synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_variations.py +1 -1
synth_ai/environments/examples/sokoban/environment.py +15 -14
synth_ai/environments/examples/sokoban/generate_verified_puzzles.py +5 -3
synth_ai/environments/examples/sokoban/puzzle_loader.py +3 -2
synth_ai/environments/examples/sokoban/taskset.py +13 -10
synth_ai/environments/examples/tictactoe/engine.py +6 -6
synth_ai/environments/examples/tictactoe/environment.py +8 -7
synth_ai/environments/examples/tictactoe/taskset.py +6 -5
synth_ai/environments/examples/verilog/engine.py +4 -3
synth_ai/environments/examples/verilog/environment.py +11 -10
synth_ai/environments/examples/verilog/taskset.py +14 -12
synth_ai/environments/examples/wordle/__init__.py +29 -0
synth_ai/environments/examples/wordle/engine.py +398 -0
synth_ai/environments/examples/wordle/environment.py +159 -0
synth_ai/environments/examples/wordle/helpers/generate_instances_wordfreq.py +75 -0
synth_ai/environments/examples/wordle/taskset.py +230 -0
synth_ai/environments/reproducibility/core.py +1 -1
synth_ai/environments/reproducibility/tree.py +21 -21
synth_ai/environments/service/app.py +11 -2
synth_ai/environments/service/core_routes.py +137 -105
synth_ai/environments/service/external_registry.py +1 -2
synth_ai/environments/service/registry.py +1 -1
synth_ai/environments/stateful/core.py +1 -2
synth_ai/environments/stateful/engine.py +1 -1
synth_ai/environments/tasks/api.py +4 -4
synth_ai/environments/tasks/core.py +14 -12
synth_ai/environments/tasks/filters.py +6 -4
synth_ai/environments/tasks/utils.py +13 -11
synth_ai/evals/base.py +2 -3
synth_ai/experimental/synth_oss.py +4 -4
synth_ai/learning/gateway.py +1 -3
synth_ai/learning/prompts/banking77_injection_eval.py +168 -0
synth_ai/learning/prompts/hello_world_in_context_injection_ex.py +213 -0
synth_ai/learning/prompts/mipro.py +282 -1
synth_ai/learning/prompts/random_search.py +246 -0
synth_ai/learning/prompts/run_mipro_banking77.py +172 -0
synth_ai/learning/prompts/run_random_search_banking77.py +324 -0
synth_ai/lm/__init__.py +5 -5
synth_ai/lm/caching/ephemeral.py +9 -9
synth_ai/lm/caching/handler.py +20 -20
synth_ai/lm/caching/persistent.py +10 -10
synth_ai/lm/config.py +3 -3
synth_ai/lm/constants.py +7 -7
synth_ai/lm/core/all.py +17 -3
synth_ai/lm/core/exceptions.py +0 -2
synth_ai/lm/core/main.py +26 -41
synth_ai/lm/core/main_v3.py +20 -10
synth_ai/lm/core/vendor_clients.py +18 -17
synth_ai/lm/injection.py +80 -0
synth_ai/lm/overrides.py +206 -0
synth_ai/lm/provider_support/__init__.py +1 -1
synth_ai/lm/provider_support/anthropic.py +51 -24
synth_ai/lm/provider_support/openai.py +51 -22
synth_ai/lm/structured_outputs/handler.py +34 -32
synth_ai/lm/structured_outputs/inject.py +24 -27
synth_ai/lm/structured_outputs/rehabilitate.py +19 -15
synth_ai/lm/tools/base.py +17 -16
synth_ai/lm/unified_interface.py +17 -18
synth_ai/lm/vendors/base.py +20 -18
synth_ai/lm/vendors/core/anthropic_api.py +50 -25
synth_ai/lm/vendors/core/gemini_api.py +31 -36
synth_ai/lm/vendors/core/mistral_api.py +19 -19
synth_ai/lm/vendors/core/openai_api.py +11 -10
synth_ai/lm/vendors/openai_standard.py +144 -88
synth_ai/lm/vendors/openai_standard_responses.py +74 -61
synth_ai/lm/vendors/retries.py +9 -1
synth_ai/lm/vendors/supported/custom_endpoint.py +26 -26
synth_ai/lm/vendors/supported/deepseek.py +10 -10
synth_ai/lm/vendors/supported/grok.py +8 -8
synth_ai/lm/vendors/supported/ollama.py +2 -1
synth_ai/lm/vendors/supported/openrouter.py +11 -9
synth_ai/lm/vendors/synth_client.py +69 -63
synth_ai/lm/warmup.py +8 -7
synth_ai/tracing/__init__.py +22 -10
synth_ai/tracing_v1/__init__.py +22 -20
synth_ai/tracing_v3/__init__.py +7 -7
synth_ai/tracing_v3/abstractions.py +56 -52
synth_ai/tracing_v3/config.py +4 -2
synth_ai/tracing_v3/db_config.py +6 -8
synth_ai/tracing_v3/decorators.py +29 -30
synth_ai/tracing_v3/examples/basic_usage.py +12 -12
synth_ai/tracing_v3/hooks.py +21 -21
synth_ai/tracing_v3/llm_call_record_helpers.py +85 -98
synth_ai/tracing_v3/lm_call_record_abstractions.py +2 -4
synth_ai/tracing_v3/migration_helper.py +3 -5
synth_ai/tracing_v3/replica_sync.py +30 -32
synth_ai/tracing_v3/session_tracer.py +35 -29
synth_ai/tracing_v3/storage/__init__.py +1 -1
synth_ai/tracing_v3/storage/base.py +8 -7
synth_ai/tracing_v3/storage/config.py +4 -4
synth_ai/tracing_v3/storage/factory.py +4 -4
synth_ai/tracing_v3/storage/utils.py +9 -9
synth_ai/tracing_v3/turso/__init__.py +3 -3
synth_ai/tracing_v3/turso/daemon.py +9 -9
synth_ai/tracing_v3/turso/manager.py +60 -48
synth_ai/tracing_v3/turso/models.py +24 -19
synth_ai/tracing_v3/utils.py +5 -5
synth_ai/tui/__main__.py +1 -1
synth_ai/tui/cli/query_experiments.py +2 -3
synth_ai/tui/cli/query_experiments_v3.py +2 -3
synth_ai/tui/dashboard.py +97 -86
synth_ai/v0/tracing/abstractions.py +28 -28
synth_ai/v0/tracing/base_client.py +9 -9
synth_ai/v0/tracing/client_manager.py +7 -7
synth_ai/v0/tracing/config.py +7 -7
synth_ai/v0/tracing/context.py +6 -6
synth_ai/v0/tracing/decorators.py +6 -5
synth_ai/v0/tracing/events/manage.py +1 -1
synth_ai/v0/tracing/events/store.py +5 -4
synth_ai/v0/tracing/immediate_client.py +4 -5
synth_ai/v0/tracing/local.py +3 -3
synth_ai/v0/tracing/log_client_base.py +4 -5
synth_ai/v0/tracing/retry_queue.py +5 -6
synth_ai/v0/tracing/trackers.py +25 -25
synth_ai/v0/tracing/upload.py +6 -0
synth_ai/v0/tracing_v1/__init__.py +1 -1
synth_ai/v0/tracing_v1/abstractions.py +28 -28
synth_ai/v0/tracing_v1/base_client.py +9 -9
synth_ai/v0/tracing_v1/client_manager.py +7 -7
synth_ai/v0/tracing_v1/config.py +7 -7
synth_ai/v0/tracing_v1/context.py +6 -6
synth_ai/v0/tracing_v1/decorators.py +7 -6
synth_ai/v0/tracing_v1/events/manage.py +1 -1
synth_ai/v0/tracing_v1/events/store.py +5 -4
synth_ai/v0/tracing_v1/immediate_client.py +4 -5
synth_ai/v0/tracing_v1/local.py +3 -3
synth_ai/v0/tracing_v1/log_client_base.py +4 -5
synth_ai/v0/tracing_v1/retry_queue.py +5 -6
synth_ai/v0/tracing_v1/trackers.py +25 -25
synth_ai/v0/tracing_v1/upload.py +25 -24
synth_ai/zyk/__init__.py +1 -0
{synth_ai-0.2.4.dev5.dist-info → synth_ai-0.2.4.dev7.dist-info}/METADATA +2 -11
synth_ai-0.2.4.dev7.dist-info/RECORD +299 -0
synth_ai-0.2.4.dev5.dist-info/RECORD +0 -287
{synth_ai-0.2.4.dev5.dist-info → synth_ai-0.2.4.dev7.dist-info}/WHEEL +0 -0
{synth_ai-0.2.4.dev5.dist-info → synth_ai-0.2.4.dev7.dist-info}/entry_points.txt +0 -0
{synth_ai-0.2.4.dev5.dist-info → synth_ai-0.2.4.dev7.dist-info}/licenses/LICENSE +0 -0
{synth_ai-0.2.4.dev5.dist-info → synth_ai-0.2.4.dev7.dist-info}/top_level.txt +0 -0

synth_ai/lm/vendors/openai_standard.py CHANGED Viewed

@@ -1,22 +1,28 @@
-from typing import Any, Dict, List, Optional, Union
 import asyncio
+import os
 import time
+from typing import Any
+import backoff
 import groq
 import openai
-import os
 import pydantic_core
 from pydantic import BaseModel
 from synth_ai.lm.caching.initialize import (
     get_cache_handler,
 )
+from synth_ai.lm.constants import SPECIAL_BASE_TEMPS
+from synth_ai.lm.injection import apply_injection
+from synth_ai.lm.overrides import (
+    apply_param_overrides,
+    apply_tool_overrides,
+    use_overrides_for_messages,
+)
 from synth_ai.lm.tools.base import BaseTool
 from synth_ai.lm.vendors.base import BaseLMResponse, VendorBase
-from synth_ai.lm.constants import SPECIAL_BASE_TEMPS
-from synth_ai.lm.vendors.retries import MAX_BACKOFF
 from synth_ai.lm.vendors.openai_standard_responses import OpenAIResponsesAPIMixin
-import backoff
+from synth_ai.lm.vendors.retries import MAX_BACKOFF
 DEFAULT_EXCEPTIONS_TO_RETRY = (
     pydantic_core._pydantic_core.ValidationError,
@@ -28,14 +34,14 @@ DEFAULT_EXCEPTIONS_TO_RETRY = (
 )
-def special_orion_transform(model: str, messages: List[Dict[str, Any]]) -> List[Dict[str, Any]]:
+def special_orion_transform(model: str, messages: list[dict[str, Any]]) -> list[dict[str, Any]]:
     """
     Transform messages for O1 series models which don't support system messages.
     Args:
         model: Model name to check
         messages: Original messages list
     Returns:
         Transformed messages list with system content merged into user message
     """
@@ -57,18 +63,19 @@ def _silent_backoff_handler(_details):
 class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
     """
     Standard OpenAI-compatible vendor implementation.
     This class provides a standard implementation for OpenAI-compatible APIs,
     including proper retry logic, caching, and support for various model features.
     Attributes:
         used_for_structured_outputs: Whether this client supports structured outputs
         exceptions_to_retry: List of exceptions that trigger automatic retries
         sync_client: Synchronous API client
         async_client: Asynchronous API client
     """
     used_for_structured_outputs: bool = True
-    exceptions_to_retry: List = DEFAULT_EXCEPTIONS_TO_RETRY
+    exceptions_to_retry: list = DEFAULT_EXCEPTIONS_TO_RETRY
     sync_client: Any
     async_client: Any
@@ -76,19 +83,20 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
         self,
         sync_client: Any,
         async_client: Any,
-        exceptions_to_retry: List[Exception] = DEFAULT_EXCEPTIONS_TO_RETRY,
+        exceptions_to_retry: list[Exception] = DEFAULT_EXCEPTIONS_TO_RETRY,
         used_for_structured_outputs: bool = False,
     ):
         self.sync_client = sync_client
         self.async_client = async_client
         self.used_for_structured_outputs = used_for_structured_outputs
         self.exceptions_to_retry = exceptions_to_retry
         # Initialize Harmony support for OSS models
         self.harmony_available = False
         self.harmony_enc = None
         try:
-            from openai_harmony import load_harmony_encoding, HarmonyEncodingName
+            from openai_harmony import HarmonyEncodingName, load_harmony_encoding
             self.harmony_available = True
             self.harmony_enc = load_harmony_encoding(HarmonyEncodingName.HARMONY_GPT_OSS)
         except ImportError:
@@ -104,45 +112,49 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
     async def _hit_api_async(
         self,
         model: str,
-        messages: List[Dict[str, Any]],
-        lm_config: Dict[str, Any],
+        messages: list[dict[str, Any]],
+        lm_config: dict[str, Any],
         use_ephemeral_cache_only: bool = False,
         reasoning_effort: str = "high",
-        tools: Optional[List[BaseTool]] = None,
+        tools: list[BaseTool] | None = None,
     ) -> BaseLMResponse:
-        assert lm_config.get("response_model", None) is None, (
+        assert lm_config.get("response_model") is None, (
             "response_model is not supported for standard calls"
         )
-        DEBUG = os.getenv("SYNTH_OPENAI_DEBUG") == "1"
-        if DEBUG:
-            print(f"🔍 OPENAI DEBUG: _hit_api_async called with:")
+        debug = os.getenv("SYNTH_OPENAI_DEBUG") == "1"
+        if debug:
+            print("🔍 OPENAI DEBUG: _hit_api_async called with:")
             print(f"   Model: {model}")
-            print(f"   Messages: {len(messages)} messages")
+            print(f"   Messages: {len(messages)} messages")
             print(f"   Tools: {len(tools) if tools else 0} tools")
             print(f"   LM config: {lm_config}")
         messages = special_orion_transform(model, messages)
+        # Apply context-scoped overrides and prompt injection just before building API params
+        with use_overrides_for_messages(messages):
+            messages = apply_injection(messages)
         used_cache_handler = get_cache_handler(use_ephemeral_cache_only)
         lm_config["reasoning_effort"] = reasoning_effort
         cache_result = used_cache_handler.hit_managed_cache(
             model, messages, lm_config=lm_config, tools=tools
         )
-        if cache_result:
-            if DEBUG:
-                print(f"🔍 OPENAI DEBUG: Cache hit! Returning cached result")
-                print(f"   Cache result type: {type(cache_result)}")
-                print(f"🔍 OPENAI DEBUG: DISABLING CACHE FOR DEBUGGING - forcing API call")
-            # return cache_result  # Commented out to force API call
-        if DEBUG:
-            print(f"🔍 OPENAI DEBUG: Cache miss, making actual API call")
+        if cache_result and debug:
+            print("🔍 OPENAI DEBUG: Cache hit! Returning cached result")
+            print(f"   Cache result type: {type(cache_result)}")
+            print("🔍 OPENAI DEBUG: DISABLING CACHE FOR DEBUGGING - forcing API call")
+            # return cache_result  # Commented out intentionally when debug is on
+        if debug:
+            print("🔍 OPENAI DEBUG: Cache miss, making actual API call")
         # Common API call params
         api_params = {
             "model": model,
             "messages": messages,
         }
+        with use_overrides_for_messages(messages):
+            api_params = apply_param_overrides(api_params)
         # Add tools if provided
         if tools and all(isinstance(tool, BaseTool) for tool in tools):
@@ -150,8 +162,11 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
         elif tools:
             api_params["tools"] = tools
-        # Only add temperature for non o1/o3 models
-        if not any(prefix in model for prefix in ["o1-", "o3-"]):
+        # Only add temperature for non o1/o3 models, and do not override if already set via overrides
+        if (
+            not any(prefix in model for prefix in ["o1-", "o3-"])
+            and "temperature" not in api_params
+        ):
             api_params["temperature"] = lm_config.get(
                 "temperature", SPECIAL_BASE_TEMPS.get(model, 0)
             )
@@ -187,6 +202,11 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
                 api_params["extra_headers"] = hdrs
         except Exception:
             pass
+        # Apply overrides (tools and params) from context after building baseline params
+        with use_overrides_for_messages(messages):
+            api_params = apply_tool_overrides(api_params)
+            api_params = apply_param_overrides(api_params)
         # Forward Qwen3 chat template kwargs via extra_body when requested
         if lm_config.get("enable_thinking") is not None:
             api_params["extra_body"] = api_params.get("extra_body", {})
@@ -196,7 +216,10 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
         # Forward arbitrary extra_body from lm_config if provided (merge)
         if lm_config.get("extra_body") is not None:
             # Shallow-merge top-level keys; nested keys (like chat_template_kwargs) should be provided whole
-            api_params["extra_body"] = {**api_params.get("extra_body", {}), **(lm_config.get("extra_body") or {})}
+            api_params["extra_body"] = {
+                **api_params.get("extra_body", {}),
+                **(lm_config.get("extra_body") or {}),
+            }
         # Forward Qwen3 chat template kwargs via extra_body when requested
         if lm_config.get("enable_thinking") is not None:
             api_params["extra_body"] = api_params.get("extra_body", {})
@@ -218,9 +241,7 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
         except Exception:
             base_url_str = ""
-        is_external_provider = (
-            "openai.com" in base_url_str or "api.groq.com" in base_url_str
-        )
+        is_external_provider = "openai.com" in base_url_str or "api.groq.com" in base_url_str
         if is_external_provider:
             # Remove extra_body entirely; this is Synth-specific plumbing
@@ -242,18 +263,18 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
                     api_params.pop("temperature", None)
         # Call API with better auth error reporting
-        #try:
-        if DEBUG:
-            print(f"🔍 OPENAI DEBUG: Making request with params:")
+        # try:
+        if debug:
+            print("🔍 OPENAI DEBUG: Making request with params:")
             print(f"   Model: {api_params.get('model')}")
             print(f"   Messages: {len(api_params.get('messages', []))} messages")
             print(f"   Tools: {len(api_params.get('tools', []))} tools")
             print(f"   Max tokens: {api_params.get('max_tokens', 'NOT SET')}")
             print(f"   Temperature: {api_params.get('temperature', 'NOT SET')}")
-            if 'tools' in api_params:
+            if "tools" in api_params:
                 print(f"   First tool: {api_params['tools'][0]}")
             print(f"   FULL API PARAMS: {api_params}")
         # Quiet targeted retry for OpenAI 400 tool_use_failed during tool-calling
         try:
             max_attempts_for_tool_use = int(os.getenv("SYNTH_TOOL_USE_RETRIES", "5"))
@@ -279,7 +300,9 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
                         err_obj = body.get("error") if isinstance(body.get("error"), dict) else {}
                         code_val = err_obj.get("code")
                         msg_val = err_obj.get("message")
-                        if code_val == "tool_use_failed" or (isinstance(msg_val, str) and "Failed to call a function" in msg_val):
+                        if code_val == "tool_use_failed" or (
+                            isinstance(msg_val, str) and "Failed to call a function" in msg_val
+                        ):
                             should_retry = True
                     except Exception:
                         pass
@@ -293,7 +316,10 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
                                 err_obj = j.get("error") if isinstance(j.get("error"), dict) else {}
                                 code_val = err_obj.get("code")
                                 msg_val = err_obj.get("message")
-                                if code_val == "tool_use_failed" or (isinstance(msg_val, str) and "Failed to call a function" in msg_val):
+                                if code_val == "tool_use_failed" or (
+                                    isinstance(msg_val, str)
+                                    and "Failed to call a function" in msg_val
+                                ):
                                     should_retry = True
                     except Exception:
                         pass
@@ -308,33 +334,37 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
                     attempt_index += 1
                     continue
                 raise
-        if DEBUG:
-            print(f"🔍 OPENAI DEBUG: Response received:")
+        if debug:
+            print("🔍 OPENAI DEBUG: Response received:")
             print(f"   Type: {type(output)}")
             print(f"   Choices: {len(output.choices) if hasattr(output, 'choices') else 'N/A'}")
-            if hasattr(output, 'choices') and output.choices:
+            if hasattr(output, "choices") and output.choices:
                 choice = output.choices[0]
                 print(f"   Choice type: {type(choice)}")
-                if hasattr(choice, 'message'):
+                if hasattr(choice, "message"):
                     message = choice.message
                     print(f"   Message type: {type(message)}")
                     print(f"   Has tool_calls: {hasattr(message, 'tool_calls')}")
-                    if hasattr(message, 'tool_calls'):
+                    if hasattr(message, "tool_calls"):
                         print(f"   Tool calls: {message.tool_calls}")
-                    print(f"   Content: {message.content[:200] if hasattr(message, 'content') and message.content else 'None'}...")
+                    print(
+                        f"   Content: {message.content[:200] if hasattr(message, 'content') and message.content else 'None'}..."
+                    )
                 # Show finish_reason and usage if available
                 try:
                     print(f"   finish_reason: {getattr(choice, 'finish_reason', None)}")
-                    usage = getattr(output, 'usage', None)
+                    usage = getattr(output, "usage", None)
                     if usage:
-                        print(f"   usage: prompt_tokens={getattr(usage, 'prompt_tokens', None)}, completion_tokens={getattr(usage, 'completion_tokens', None)}, total_tokens={getattr(usage, 'total_tokens', None)}")
+                        print(
+                            f"   usage: prompt_tokens={getattr(usage, 'prompt_tokens', None)}, completion_tokens={getattr(usage, 'completion_tokens', None)}, total_tokens={getattr(usage, 'total_tokens', None)}"
+                        )
                 except Exception:
                     pass
-        if DEBUG:
-            print(f"🔍 OPENAI DEBUG: FULL RAW RESPONSE:")
-            if hasattr(output.choices[0].message, 'content') and output.choices[0].message.content:
+        if debug:
+            print("🔍 OPENAI DEBUG: FULL RAW RESPONSE:")
+            if hasattr(output.choices[0].message, "content") and output.choices[0].message.content:
                 print(f"   FULL CONTENT:\n{output.choices[0].message.content}")
             print(f"   Raw choice: {choice}")
             print(f"   Raw message: {message}")
@@ -375,12 +405,12 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
         # Attach basic usage if available
         usage_dict = None
         try:
-            usage_obj = getattr(output, 'usage', None)
+            usage_obj = getattr(output, "usage", None)
             if usage_obj is not None:
                 usage_dict = {
-                    "prompt_tokens": getattr(usage_obj, 'prompt_tokens', None),
-                    "completion_tokens": getattr(usage_obj, 'completion_tokens', None),
-                    "total_tokens": getattr(usage_obj, 'total_tokens', None),
+                    "prompt_tokens": getattr(usage_obj, "prompt_tokens", None),
+                    "completion_tokens": getattr(usage_obj, "completion_tokens", None),
+                    "total_tokens": getattr(usage_obj, "total_tokens", None),
                 }
         except Exception:
             usage_dict = None
@@ -407,22 +437,27 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
     def _hit_api_sync(
         self,
         model: str,
-        messages: List[Dict[str, Any]],
-        lm_config: Dict[str, Any],
+        messages: list[dict[str, Any]],
+        lm_config: dict[str, Any],
         use_ephemeral_cache_only: bool = False,
         reasoning_effort: str = "high",
-        tools: Optional[List[BaseTool]] = None,
+        tools: list[BaseTool] | None = None,
     ) -> BaseLMResponse:
-        assert lm_config.get("response_model", None) is None, (
+        assert lm_config.get("response_model") is None, (
             "response_model is not supported for standard calls"
         )
         messages = special_orion_transform(model, messages)
+        with use_overrides_for_messages(messages):
+            # Apply context-scoped prompt injection just before building API params
+            messages = apply_injection(messages)
         used_cache_handler = get_cache_handler(use_ephemeral_cache_only=use_ephemeral_cache_only)
         lm_config["reasoning_effort"] = reasoning_effort
         cache_result = used_cache_handler.hit_managed_cache(
             model, messages, lm_config=lm_config, tools=tools
         )
-        if cache_result:
+        # During pytest runs, bypass returning cache to allow tests to inspect outgoing params
+        in_pytest = os.getenv("PYTEST_CURRENT_TEST") is not None
+        if cache_result and not in_pytest:
             return cache_result
         # Common API call params
@@ -430,6 +465,8 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
             "model": model,
             "messages": messages,
         }
+        with use_overrides_for_messages(messages):
+            api_params = apply_param_overrides(api_params)
         # Add tools if provided
         if tools and all(isinstance(tool, BaseTool) for tool in tools):
@@ -437,8 +474,16 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
         elif tools:
             api_params["tools"] = tools
-        # Only add temperature for non o1/o3 models
-        if not any(prefix in model for prefix in ["o1-", "o3-"]):
+        # Apply overrides (tools and params) using module-level imports
+        with use_overrides_for_messages(messages):
+            api_params = apply_tool_overrides(api_params)
+            api_params = apply_param_overrides(api_params)
+        # Only add temperature for non o1/o3 models, and do not override if already set via overrides
+        if (
+            not any(prefix in model for prefix in ["o1-", "o3-"])
+            and "temperature" not in api_params
+        ):
             api_params["temperature"] = lm_config.get(
                 "temperature", SPECIAL_BASE_TEMPS.get(model, 0)
             )
@@ -484,7 +529,9 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
                         err_obj = body.get("error") if isinstance(body.get("error"), dict) else {}
                         code_val = err_obj.get("code")
                         msg_val = err_obj.get("message")
-                        if code_val == "tool_use_failed" or (isinstance(msg_val, str) and "Failed to call a function" in msg_val):
+                        if code_val == "tool_use_failed" or (
+                            isinstance(msg_val, str) and "Failed to call a function" in msg_val
+                        ):
                             should_retry = True
                     except Exception:
                         pass
@@ -497,7 +544,10 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
                                 err_obj = j.get("error") if isinstance(j.get("error"), dict) else {}
                                 code_val = err_obj.get("code")
                                 msg_val = err_obj.get("message")
-                                if code_val == "tool_use_failed" or (isinstance(msg_val, str) and "Failed to call a function" in msg_val):
+                                if code_val == "tool_use_failed" or (
+                                    isinstance(msg_val, str)
+                                    and "Failed to call a function" in msg_val
+                                ):
                                     should_retry = True
                     except Exception:
                         pass
@@ -512,13 +562,17 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
                     continue
                 raise
         message = output.choices[0].message
-        DEBUG = os.getenv("SYNTH_OPENAI_DEBUG") == "1"
-        if DEBUG:
+        debug_sync = os.getenv("SYNTH_OPENAI_DEBUG") == "1"
+        if debug_sync:
             try:
-                print(f"🔍 OPENAI DEBUG (sync): finish_reason={getattr(output.choices[0], 'finish_reason', None)}")
-                usage = getattr(output, 'usage', None)
+                print(
+                    f"🔍 OPENAI DEBUG (sync): finish_reason={getattr(output.choices[0], 'finish_reason', None)}"
+                )
+                usage = getattr(output, "usage", None)
                 if usage:
-                    print(f"🔍 OPENAI DEBUG (sync): usage prompt_tokens={getattr(usage, 'prompt_tokens', None)}, completion_tokens={getattr(usage, 'completion_tokens', None)}, total_tokens={getattr(usage, 'total_tokens', None)}")
+                    print(
+                        f"🔍 OPENAI DEBUG (sync): usage prompt_tokens={getattr(usage, 'prompt_tokens', None)}, completion_tokens={getattr(usage, 'completion_tokens', None)}, total_tokens={getattr(usage, 'total_tokens', None)}"
+                    )
             except Exception:
                 pass
@@ -540,12 +594,12 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
         # Attach basic usage if available
         usage_dict = None
         try:
-            usage_obj = getattr(output, 'usage', None)
+            usage_obj = getattr(output, "usage", None)
             if usage_obj is not None:
                 usage_dict = {
-                    "prompt_tokens": getattr(usage_obj, 'prompt_tokens', None),
-                    "completion_tokens": getattr(usage_obj, 'completion_tokens', None),
-                    "total_tokens": getattr(usage_obj, 'total_tokens', None),
+                    "prompt_tokens": getattr(usage_obj, "prompt_tokens", None),
+                    "completion_tokens": getattr(usage_obj, "completion_tokens", None),
+                    "total_tokens": getattr(usage_obj, "total_tokens", None),
                 }
         except Exception:
             usage_dict = None
@@ -565,12 +619,12 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
     async def _hit_api_async_structured_output(
         self,
         model: str,
-        messages: List[Dict[str, Any]],
+        messages: list[dict[str, Any]],
         response_model: BaseModel,
         temperature: float,
         use_ephemeral_cache_only: bool = False,
         reasoning_effort: str = "high",
-        tools: Optional[List[BaseTool]] = None,
+        tools: list[BaseTool] | None = None,
     ) -> BaseLMResponse:
         lm_config = {
             "temperature": temperature,
@@ -578,7 +632,7 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
             "reasoning_effort": reasoning_effort,
         }
         used_cache_handler = get_cache_handler(use_ephemeral_cache_only)
-        cache_result: Union[BaseLMResponse, None] = used_cache_handler.hit_managed_cache(
+        cache_result: BaseLMResponse | None = used_cache_handler.hit_managed_cache(
             model, messages, lm_config=lm_config, tools=tools
         )
         if cache_result is not None:
@@ -624,12 +678,12 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
     def _hit_api_sync_structured_output(
         self,
         model: str,
-        messages: List[Dict[str, Any]],
+        messages: list[dict[str, Any]],
         response_model: BaseModel,
         temperature: float,
         use_ephemeral_cache_only: bool = False,
         reasoning_effort: str = "high",
-        tools: Optional[List[BaseTool]] = None,
+        tools: list[BaseTool] | None = None,
     ) -> BaseLMResponse:
         lm_config = {
             "temperature": temperature,
@@ -637,7 +691,7 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
             "reasoning_effort": reasoning_effort,
         }
         used_cache_handler = get_cache_handler(use_ephemeral_cache_only)
-        cache_result: Union[BaseLMResponse, None] = used_cache_handler.hit_managed_cache(
+        cache_result: BaseLMResponse | None = used_cache_handler.hit_managed_cache(
             model, messages, lm_config=lm_config, tools=tools
         )
         if cache_result is not None:
@@ -671,7 +725,9 @@ class OpenAIStandard(VendorBase, OpenAIResponsesAPIMixin):
             base_url_str_sync = str(base_url_obj) if base_url_obj is not None else ""
         except Exception:
             base_url_str_sync = ""
-        if ("openai.com" in base_url_str_sync or "api.groq.com" in base_url_str_sync) and model.startswith("gpt-5"):
+        if (
+            "openai.com" in base_url_str_sync or "api.groq.com" in base_url_str_sync
+        ) and model.startswith("gpt-5"):
             if "max_tokens" in api_params:
                 api_params["max_completion_tokens"] = api_params.pop("max_tokens")
             if "temperature" in api_params:

synth-ai 0.2.4.dev5__py3-none-any.whl → 0.2.4.dev7__py3-none-any.whl

synth-ai 0.2.4.dev5__py3-none-any.whl → 0.2.4.dev7__py3-none-any.whl