synth-ai 0.1.0.dev38__py3-none-any.whl → 0.1.0.dev49__py3-none-any.whl
This diff compares the contents of two publicly released versions of the package as they appear in their respective public registries. It is provided for informational purposes only.
- synth_ai/__init__.py +3 -1
- {synth_ai-0.1.0.dev38.dist-info → synth_ai-0.1.0.dev49.dist-info}/METADATA +12 -11
- synth_ai-0.1.0.dev49.dist-info/RECORD +6 -0
- {synth_ai-0.1.0.dev38.dist-info → synth_ai-0.1.0.dev49.dist-info}/WHEEL +1 -1
- synth_ai-0.1.0.dev49.dist-info/top_level.txt +1 -0
- private_tests/try_synth_sdk.py +0 -1
- public_tests/test_agent.py +0 -538
- public_tests/test_all_structured_outputs.py +0 -196
- public_tests/test_anthropic_structured_outputs.py +0 -0
- public_tests/test_deepseek_structured_outputs.py +0 -0
- public_tests/test_deepseek_tools.py +0 -64
- public_tests/test_gemini_output.py +0 -188
- public_tests/test_gemini_structured_outputs.py +0 -106
- public_tests/test_models.py +0 -183
- public_tests/test_openai_structured_outputs.py +0 -106
- public_tests/test_reasoning_effort.py +0 -75
- public_tests/test_reasoning_models.py +0 -92
- public_tests/test_recursive_structured_outputs.py +0 -180
- public_tests/test_structured.py +0 -137
- public_tests/test_structured_outputs.py +0 -109
- public_tests/test_synth_sdk.py +0 -384
- public_tests/test_text.py +0 -160
- public_tests/test_tools.py +0 -319
- synth_ai/zyk/__init__.py +0 -3
- synth_ai/zyk/lms/__init__.py +0 -0
- synth_ai/zyk/lms/caching/__init__.py +0 -0
- synth_ai/zyk/lms/caching/constants.py +0 -1
- synth_ai/zyk/lms/caching/dbs.py +0 -0
- synth_ai/zyk/lms/caching/ephemeral.py +0 -72
- synth_ai/zyk/lms/caching/handler.py +0 -142
- synth_ai/zyk/lms/caching/initialize.py +0 -13
- synth_ai/zyk/lms/caching/persistent.py +0 -83
- synth_ai/zyk/lms/config.py +0 -8
- synth_ai/zyk/lms/core/__init__.py +0 -0
- synth_ai/zyk/lms/core/all.py +0 -47
- synth_ai/zyk/lms/core/exceptions.py +0 -9
- synth_ai/zyk/lms/core/main.py +0 -314
- synth_ai/zyk/lms/core/vendor_clients.py +0 -85
- synth_ai/zyk/lms/cost/__init__.py +0 -0
- synth_ai/zyk/lms/cost/monitor.py +0 -1
- synth_ai/zyk/lms/cost/statefulness.py +0 -1
- synth_ai/zyk/lms/structured_outputs/__init__.py +0 -0
- synth_ai/zyk/lms/structured_outputs/handler.py +0 -442
- synth_ai/zyk/lms/structured_outputs/inject.py +0 -314
- synth_ai/zyk/lms/structured_outputs/rehabilitate.py +0 -187
- synth_ai/zyk/lms/tools/base.py +0 -104
- synth_ai/zyk/lms/vendors/__init__.py +0 -0
- synth_ai/zyk/lms/vendors/base.py +0 -31
- synth_ai/zyk/lms/vendors/constants.py +0 -22
- synth_ai/zyk/lms/vendors/core/__init__.py +0 -0
- synth_ai/zyk/lms/vendors/core/anthropic_api.py +0 -413
- synth_ai/zyk/lms/vendors/core/gemini_api.py +0 -306
- synth_ai/zyk/lms/vendors/core/mistral_api.py +0 -327
- synth_ai/zyk/lms/vendors/core/openai_api.py +0 -185
- synth_ai/zyk/lms/vendors/local/__init__.py +0 -0
- synth_ai/zyk/lms/vendors/local/ollama.py +0 -0
- synth_ai/zyk/lms/vendors/openai_standard.py +0 -375
- synth_ai/zyk/lms/vendors/retries.py +0 -3
- synth_ai/zyk/lms/vendors/supported/__init__.py +0 -0
- synth_ai/zyk/lms/vendors/supported/deepseek.py +0 -73
- synth_ai/zyk/lms/vendors/supported/groq.py +0 -16
- synth_ai/zyk/lms/vendors/supported/ollama.py +0 -14
- synth_ai/zyk/lms/vendors/supported/together.py +0 -11
- synth_ai-0.1.0.dev38.dist-info/RECORD +0 -67
- synth_ai-0.1.0.dev38.dist-info/top_level.txt +0 -4
- tests/test_agent.py +0 -538
- tests/test_recursive_structured_outputs.py +0 -180
- tests/test_structured_outputs.py +0 -100
- {synth_ai-0.1.0.dev38.dist-info → synth_ai-0.1.0.dev49.dist-info}/licenses/LICENSE +0 -0
synth_ai/zyk/lms/vendors/core/anthropic_api.py
@@ -1,413 +0,0 @@
-import json
-from typing import Any, Dict, List, Optional, Tuple, Type
-
-import anthropic
-import pydantic
-from pydantic import BaseModel
-
-from synth_ai.zyk.lms.caching.initialize import (
-    get_cache_handler,
-)
-from synth_ai.zyk.lms.tools.base import BaseTool
-from synth_ai.zyk.lms.vendors.base import BaseLMResponse, VendorBase
-from synth_ai.zyk.lms.vendors.constants import SPECIAL_BASE_TEMPS
-from synth_ai.zyk.lms.vendors.core.openai_api import OpenAIStructuredOutputClient
-
-ANTHROPIC_EXCEPTIONS_TO_RETRY: Tuple[Type[Exception], ...] = (anthropic.APIError,)
-
-
-sonnet_37_budgets = {
-    "high": 8000,
-    "medium": 4000,
-    "low": 1000,
-}
-
-class AnthropicAPI(VendorBase):
-    used_for_structured_outputs: bool = True
-    exceptions_to_retry: Tuple = ANTHROPIC_EXCEPTIONS_TO_RETRY
-    sync_client: Any
-    async_client: Any
-
-    def __init__(
-        self,
-        exceptions_to_retry: Tuple[
-            Type[Exception], ...
-        ] = ANTHROPIC_EXCEPTIONS_TO_RETRY,
-        used_for_structured_outputs: bool = False,
-        reasoning_effort: str = "high",
-    ):
-        self.sync_client = anthropic.Anthropic()
-        self.async_client = anthropic.AsyncAnthropic()
-        self.used_for_structured_outputs = used_for_structured_outputs
-        self.exceptions_to_retry = exceptions_to_retry
-        self._openai_fallback = None
-        self.reasoning_effort = reasoning_effort
-
-    # @backoff.on_exception(
-    #     backoff.expo,
-    #     exceptions_to_retry,
-    #     max_tries=BACKOFF_TOLERANCE,
-    #     on_giveup=lambda e: print(e),
-    # )
-    async def _hit_api_async(
-        self,
-        model: str,
-        messages: List[Dict[str, Any]],
-        lm_config: Dict[str, Any],
-        use_ephemeral_cache_only: bool = False,
-        reasoning_effort: str = "high",
-        tools: Optional[List[BaseTool]] = None,
-        **vendor_params: Dict[str, Any],
-    ) -> BaseLMResponse:
-        assert (
-            lm_config.get("response_model", None) is None
-        ), "response_model is not supported for standard calls"
-        used_cache_handler = get_cache_handler(use_ephemeral_cache_only)
-        cache_result = used_cache_handler.hit_managed_cache(
-            model, messages, lm_config=lm_config, tools=tools, reasoning_effort=reasoning_effort
-        )
-        if cache_result:
-            return cache_result
-
-        # Common API parameters
-        api_params = {
-            "system": messages[0]["content"],
-            "messages": messages[1:],
-            "model": model,
-            "max_tokens": lm_config.get("max_tokens", 4096),
-            "temperature": lm_config.get(
-                "temperature", SPECIAL_BASE_TEMPS.get(model, 0)
-            ),
-        }
-
-        # Add tools if provided
-        if tools:
-            api_params["tools"] = []
-            for tool in tools:
-                if isinstance(tool, BaseTool):
-                    api_params["tools"].append(tool.to_anthropic_tool())
-                else:
-                    api_params["tools"].append(tool)
-
-        # Only try to add thinking if supported by the SDK
-        try:
-            import inspect
-
-            create_sig = inspect.signature(self.async_client.messages.create)
-            if "thinking" in create_sig.parameters and "claude-3-7" in model:
-                if reasoning_effort in ["high", "medium"]:
-                    budget = sonnet_37_budgets[reasoning_effort]
-                    api_params["thinking"] = {
-                        "type": "enabled",
-                        "budget_tokens": budget,
-                    }
-                    api_params["max_tokens"] = budget+4096
-                    api_params["temperature"] = 1
-        except (ImportError, AttributeError, TypeError):
-            pass
-
-        # Make the API call
-        response = await self.async_client.messages.create(**api_params)
-
-        # Extract text content and tool calls
-        raw_response = ""
-        tool_calls = []
-
-        for content in response.content:
-            if content.type == "text":
-                raw_response += content.text
-            elif content.type == "tool_use":
-                tool_calls.append(
-                    {
-                        "id": content.id,
-                        "type": "function",
-                        "function": {
-                            "name": content.name,
-                            "arguments": json.dumps(content.input),
-                        },
-                    }
-                )
-
-        lm_response = BaseLMResponse(
-            raw_response=raw_response,
-            structured_output=None,
-            tool_calls=tool_calls if tool_calls else None,
-        )
-
-        used_cache_handler.add_to_managed_cache(
-            model, messages, lm_config=lm_config, output=lm_response, tools=tools, reasoning_effort=reasoning_effort
-        )
-        return lm_response
-
-    # @backoff.on_exception(
-    #     backoff.expo,
-    #     exceptions_to_retry,
-    #     max_tries=BACKOFF_TOLERANCE,
-    #     on_giveup=lambda e: print(e),
-    # )
-    def _hit_api_sync(
-        self,
-        model: str,
-        messages: List[Dict[str, Any]],
-        lm_config: Dict[str, Any],
-        use_ephemeral_cache_only: bool = False,
-        reasoning_effort: str = "high",
-        tools: Optional[List[BaseTool]] = None,
-        **vendor_params: Dict[str, Any],
-    ) -> BaseLMResponse:
-        assert (
-            lm_config.get("response_model", None) is None
-        ), "response_model is not supported for standard calls"
-        used_cache_handler = get_cache_handler(
-            use_ephemeral_cache_only=use_ephemeral_cache_only
-        )
-        cache_result = used_cache_handler.hit_managed_cache(
-            model, messages, lm_config=lm_config, tools=tools, reasoning_effort=reasoning_effort
-        )
-        if cache_result:
-            return cache_result
-
-        # Common API parameters
-        api_params = {
-            "system": messages[0]["content"],
-            "messages": messages[1:],
-            "model": model,
-            "max_tokens": lm_config.get("max_tokens", 4096),
-            "temperature": lm_config.get(
-                "temperature", SPECIAL_BASE_TEMPS.get(model, 0)
-            ),
-        }
-
-        # Add tools if provided
-        if tools:
-            api_params["tools"] = []
-            for tool in tools:
-                if isinstance(tool, BaseTool):
-                    api_params["tools"].append(tool.to_anthropic_tool())
-                else:
-                    api_params["tools"].append(tool)
-
-        # Only try to add thinking if supported by the SDK
-        try:
-            import inspect
-
-            create_sig = inspect.signature(self.sync_client.messages.create)
-            if "thinking" in create_sig.parameters and "claude-3-7" in model:
-                api_params["temperature"] = 1
-                if reasoning_effort in ["high", "medium"]:
-                    budgets = sonnet_37_budgets
-                    budget = budgets[reasoning_effort]
-                    api_params["thinking"] = {
-                        "type": "enabled",
-                        "budget_tokens": budget,
-                    }
-                    api_params["max_tokens"] = budget+4096
-                    api_params["temperature"] = 1
-        except (ImportError, AttributeError, TypeError):
-            pass
-
-        # Make the API call
-        response = self.sync_client.messages.create(**api_params)
-
-        # Extract text content and tool calls
-        raw_response = ""
-        tool_calls = []
-
-        for content in response.content:
-            if content.type == "text":
-                raw_response += content.text
-            elif content.type == "tool_use":
-                tool_calls.append(
-                    {
-                        "id": content.id,
-                        "type": "function",
-                        "function": {
-                            "name": content.name,
-                            "arguments": json.dumps(content.input),
-                        },
-                    }
-                )
-
-        lm_response = BaseLMResponse(
-            raw_response=raw_response,
-            structured_output=None,
-            tool_calls=tool_calls if tool_calls else None,
-        )
-
-        used_cache_handler.add_to_managed_cache(
-            model, messages, lm_config=lm_config, output=lm_response, tools=tools, reasoning_effort=reasoning_effort
-        )
-        return lm_response
-
-    async def _hit_api_async_structured_output(
-        self,
-        model: str,
-        messages: List[Dict[str, Any]],
-        response_model: BaseModel,
-        temperature: float,
-        use_ephemeral_cache_only: bool = False,
-        reasoning_effort: str = "high",
-        **vendor_params: Dict[str, Any],
-    ) -> BaseLMResponse:
-        used_cache_handler = get_cache_handler(use_ephemeral_cache_only)
-        lm_config = {"temperature": temperature, "response_model": response_model}
-        cache_result = used_cache_handler.hit_managed_cache(
-            model=model,
-            messages=messages,
-            lm_config=lm_config,
-            reasoning_effort=reasoning_effort,
-        )
-        if cache_result:
-            return cache_result
-
-        try:
-            # First try with Anthropic
-            reasoning_effort = vendor_params.get("reasoning_effort", reasoning_effort)
-            if "claude-3-7" in model:
-
-                #if reasoning_effort in ["high", "medium"]:
-                budgets = sonnet_37_budgets
-                budget = budgets[reasoning_effort]
-                max_tokens = budget+4096
-                temperature = 1
-
-                response = await self.async_client.messages.create(
-                    system=messages[0]["content"],
-                    messages=messages[1:],
-                    model=model,
-                    max_tokens=max_tokens,
-                    thinking={"type": "enabled", "budget_tokens": budget},
-                    temperature=temperature,
-                )
-            else:
-                response = await self.async_client.messages.create(
-                    system=messages[0]["content"],
-                    messages=messages[1:],
-                    model=model,
-                    max_tokens=max_tokens,
-                    temperature=temperature,
-                )
-            result = response.content[0].text
-            parsed = json.loads(result)
-            lm_response = BaseLMResponse(
-                raw_response="",
-                structured_output=response_model(**parsed),
-                tool_calls=None,
-            )
-            used_cache_handler.add_to_managed_cache(
-                model=model,
-                messages=messages,
-                lm_config=lm_config,
-                output=lm_response,
-                reasoning_effort=reasoning_effort,
-            )
-            return lm_response
-        except (json.JSONDecodeError, pydantic.ValidationError):
-            # If Anthropic fails, fallback to OpenAI
-            if self._openai_fallback is None:
-                self._openai_fallback = OpenAIStructuredOutputClient()
-            return await self._openai_fallback._hit_api_async_structured_output(
-                model="gpt-4o",  # Fallback to GPT-4
-                messages=messages,
-                response_model=response_model,
-                temperature=temperature,
-                use_ephemeral_cache_only=use_ephemeral_cache_only,
-            )
-
-    def _hit_api_sync_structured_output(
-        self,
-        model: str,
-        messages: List[Dict[str, Any]],
-        response_model: BaseModel,
-        temperature: float,
-        use_ephemeral_cache_only: bool = False,
-        reasoning_effort: str = "high",
-        **vendor_params: Dict[str, Any],
-    ) -> BaseLMResponse:
-        used_cache_handler = get_cache_handler(use_ephemeral_cache_only)
-        lm_config = {"temperature": temperature, "response_model": response_model}
-        cache_result = used_cache_handler.hit_managed_cache(
-            model=model,
-            messages=messages,
-            lm_config=lm_config,
-            reasoning_effort=reasoning_effort,
-        )
-        if cache_result:
-            return cache_result
-
-        try:
-            # First try with Anthropic
-            reasoning_effort = vendor_params.get("reasoning_effort", reasoning_effort)
-            import time
-
-            if "claude-3-7" in model:
-                if reasoning_effort in ["high", "medium"]:
-                    budgets = sonnet_37_budgets
-                    budget = budgets[reasoning_effort]
-                    max_tokens = budget+4096
-                    temperature = 1
-                response = self.sync_client.messages.create(
-                    system=messages[0]["content"],
-                    messages=messages[1:],
-                    model=model,
-                    max_tokens=max_tokens,
-                    temperature=temperature,
-                    thinking={"type": "enabled", "budget_tokens": budget},
-                )
-            else:
-                response = self.sync_client.messages.create(
-                    system=messages[0]["content"],
-                    messages=messages[1:],
-                    model=model,
-                    max_tokens=max_tokens,
-                    temperature=temperature,
-                )
-            # print("Time taken for API call", time.time() - t)
-            result = response.content[0].text
-            # Try to parse the result as JSON
-            parsed = json.loads(result)
-            lm_response = BaseLMResponse(
-                raw_response="",
-                structured_output=response_model(**parsed),
-                tool_calls=None,
-            )
-            used_cache_handler.add_to_managed_cache(
-                model=model,
-                messages=messages,
-                lm_config=lm_config,
-                output=lm_response,
-                reasoning_effort=reasoning_effort,
-            )
-            return lm_response
-        except (json.JSONDecodeError, pydantic.ValidationError):
-            # If Anthropic fails, fallback to OpenAI
-            print("WARNING - Falling back to OpenAI - THIS IS SLOW")
-            if self._openai_fallback is None:
-                self._openai_fallback = OpenAIStructuredOutputClient()
-            return self._openai_fallback._hit_api_sync_structured_output(
-                model="gpt-4o",  # Fallback to GPT-4
-                messages=messages,
-                response_model=response_model,
-                temperature=temperature,
-                use_ephemeral_cache_only=use_ephemeral_cache_only,
-            )
-
-    async def _process_call_async(
-        self,
-        messages: List[Dict[str, Any]],
-        model: str,
-        response_model: BaseModel,
-        api_call_method,
-        temperature: float = 0.0,
-        use_ephemeral_cache_only: bool = False,
-        vendor_params: Dict[str, Any] = None,
-    ) -> BaseModel:
-        vendor_params = vendor_params or {}
-        # Each vendor can filter parameters they support
-        return await api_call_method(
-            messages=messages,
-            model=model,
-            temperature=temperature,
-            use_ephemeral_cache_only=use_ephemeral_cache_only,
-            **vendor_params,  # Pass all vendor-specific params
-        )