amsdal_ml 0.1.4__py3-none-any.whl → 0.2.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (62)
  1. amsdal_ml/Third-Party Materials - AMSDAL Dependencies - License Notices.md +617 -0
  2. amsdal_ml/__about__.py +1 -1
  3. amsdal_ml/agents/__init__.py +13 -0
  4. amsdal_ml/agents/agent.py +5 -7
  5. amsdal_ml/agents/default_qa_agent.py +108 -143
  6. amsdal_ml/agents/functional_calling_agent.py +233 -0
  7. amsdal_ml/agents/mcp_client_tool.py +46 -0
  8. amsdal_ml/agents/python_tool.py +86 -0
  9. amsdal_ml/agents/retriever_tool.py +5 -6
  10. amsdal_ml/agents/tool_adapters.py +98 -0
  11. amsdal_ml/fileio/base_loader.py +7 -5
  12. amsdal_ml/fileio/openai_loader.py +16 -17
  13. amsdal_ml/mcp_client/base.py +2 -0
  14. amsdal_ml/mcp_client/http_client.py +7 -1
  15. amsdal_ml/mcp_client/stdio_client.py +19 -16
  16. amsdal_ml/mcp_server/server_retriever_stdio.py +8 -11
  17. amsdal_ml/ml_ingesting/__init__.py +29 -0
  18. amsdal_ml/ml_ingesting/default_ingesting.py +49 -51
  19. amsdal_ml/ml_ingesting/embedders/__init__.py +4 -0
  20. amsdal_ml/ml_ingesting/embedders/embedder.py +12 -0
  21. amsdal_ml/ml_ingesting/embedders/openai_embedder.py +30 -0
  22. amsdal_ml/ml_ingesting/embedding_data.py +3 -0
  23. amsdal_ml/ml_ingesting/loaders/__init__.py +6 -0
  24. amsdal_ml/ml_ingesting/loaders/folder_loader.py +52 -0
  25. amsdal_ml/ml_ingesting/loaders/loader.py +28 -0
  26. amsdal_ml/ml_ingesting/loaders/pdf_loader.py +136 -0
  27. amsdal_ml/ml_ingesting/loaders/text_loader.py +44 -0
  28. amsdal_ml/ml_ingesting/model_ingester.py +278 -0
  29. amsdal_ml/ml_ingesting/pipeline.py +131 -0
  30. amsdal_ml/ml_ingesting/pipeline_interface.py +31 -0
  31. amsdal_ml/ml_ingesting/processors/__init__.py +4 -0
  32. amsdal_ml/ml_ingesting/processors/cleaner.py +14 -0
  33. amsdal_ml/ml_ingesting/processors/text_cleaner.py +42 -0
  34. amsdal_ml/ml_ingesting/splitters/__init__.py +4 -0
  35. amsdal_ml/ml_ingesting/splitters/splitter.py +15 -0
  36. amsdal_ml/ml_ingesting/splitters/token_splitter.py +85 -0
  37. amsdal_ml/ml_ingesting/stores/__init__.py +4 -0
  38. amsdal_ml/ml_ingesting/stores/embedding_data.py +63 -0
  39. amsdal_ml/ml_ingesting/stores/store.py +22 -0
  40. amsdal_ml/ml_ingesting/types.py +40 -0
  41. amsdal_ml/ml_models/models.py +96 -4
  42. amsdal_ml/ml_models/openai_model.py +430 -122
  43. amsdal_ml/ml_models/utils.py +7 -0
  44. amsdal_ml/ml_retrievers/__init__.py +17 -0
  45. amsdal_ml/ml_retrievers/adapters.py +93 -0
  46. amsdal_ml/ml_retrievers/default_retriever.py +11 -1
  47. amsdal_ml/ml_retrievers/openai_retriever.py +27 -7
  48. amsdal_ml/ml_retrievers/query_retriever.py +487 -0
  49. amsdal_ml/ml_retrievers/retriever.py +12 -0
  50. amsdal_ml/models/embedding_model.py +7 -7
  51. amsdal_ml/prompts/__init__.py +77 -0
  52. amsdal_ml/prompts/database_query_agent.prompt +14 -0
  53. amsdal_ml/prompts/functional_calling_agent_base.prompt +9 -0
  54. amsdal_ml/prompts/nl_query_filter.prompt +318 -0
  55. amsdal_ml/{agents/promts → prompts}/react_chat.prompt +17 -8
  56. amsdal_ml/utils/__init__.py +5 -0
  57. amsdal_ml/utils/query_utils.py +189 -0
  58. {amsdal_ml-0.1.4.dist-info → amsdal_ml-0.2.0.dist-info}/METADATA +59 -1
  59. amsdal_ml-0.2.0.dist-info/RECORD +72 -0
  60. {amsdal_ml-0.1.4.dist-info → amsdal_ml-0.2.0.dist-info}/WHEEL +1 -1
  61. amsdal_ml/agents/promts/__init__.py +0 -58
  62. amsdal_ml-0.1.4.dist-info/RECORD +0 -39

amsdal_ml/ml_models/openai_model.py
@@ -2,8 +2,10 @@ from __future__ import annotations

 import asyncio
 import os
+import warnings
 from collections.abc import AsyncIterator
 from collections.abc import Iterator
+from collections.abc import Sequence
 from typing import Any
 from typing import Optional
 from typing import cast
@@ -18,29 +20,91 @@ from amsdal_ml.fileio.base_loader import FILE_ID
 from amsdal_ml.fileio.base_loader import PLAIN_TEXT
 from amsdal_ml.fileio.base_loader import FileAttachment
 from amsdal_ml.ml_config import ml_config
+from amsdal_ml.ml_models.models import LLModelInput
 from amsdal_ml.ml_models.models import MLModel
 from amsdal_ml.ml_models.models import ModelAPIError
 from amsdal_ml.ml_models.models import ModelConnectionError
 from amsdal_ml.ml_models.models import ModelError
 from amsdal_ml.ml_models.models import ModelRateLimitError
+from amsdal_ml.ml_models.models import StructuredMessage
+from amsdal_ml.ml_models.utils import ResponseFormat


 class OpenAIModel(MLModel):
     """OpenAI LLM wrapper using a single Responses API pathway for all modes."""

-    def __init__(self) -> None:
+    def __init__(
+        self,
+        *,
+        model_name: Optional[str] = None,
+        temperature: Optional[float] = None,
+    ) -> None:
         self.client: Optional[OpenAI | AsyncOpenAI] = None
         self.async_mode: bool = bool(ml_config.async_mode)
-        self.model_name: str = ml_config.llm_model_name
-        self.temperature: float = ml_config.llm_temperature
+        self.model_name: str = model_name or ml_config.llm_model_name
+        self.temperature: float = (
+            temperature if temperature is not None else ml_config.llm_temperature
+        )
         self._api_key: Optional[str] = None

-    # ---------- Public sync API ----------
+    @property
+    def supported_formats(self) -> set[ResponseFormat]:
+        """OpenAI supports PLAIN_TEXT, JSON_OBJECT and JSON_SCHEMA formats."""
+        return {
+            ResponseFormat.PLAIN_TEXT,
+            ResponseFormat.JSON_OBJECT,
+            ResponseFormat.JSON_SCHEMA,
+        }
+
+    @property
+    def input_role(self) -> str:
+        """Return 'user' for OpenAI."""
+        return "user"
+
+    @property
+    def output_role(self) -> str:
+        """Return 'assistant' for OpenAI."""
+        return "assistant"
+
+    @property
+    def tool_role(self) -> str:
+        """Return 'tool' for OpenAI."""
+        return "tool"
+
+    @property
+    def system_role(self) -> str:
+        """Return 'system' for OpenAI."""
+        return "system"
+
+    @property
+    def content_field(self) -> str:
+        """Return 'content' for OpenAI."""
+        return "content"
+
+    @property
+    def role_field(self) -> str:
+        """Return 'role' for OpenAI."""
+        return "role"
+
+    @property
+    def tool_call_id_field(self) -> str:
+        """Return 'tool_call_id' for OpenAI."""
+        return "tool_call_id"
+
+    @property
+    def tool_name_field(self) -> str:
+        """Return 'name' for OpenAI."""
+        return "name"
+
     def invoke(
         self,
-        prompt: str,
+        input: LLModelInput,  # noqa: A002
         *,
         attachments: list[FileAttachment] | None = None,
+        response_format: ResponseFormat | None = None,
+        schema: dict[str, Any] | None = None,
+        tools: list[dict[str, Any]] | None = None,
+        tool_choice: str | dict[str, Any] | None = None,
     ) -> str:
         if self.async_mode:
             msg = "Async mode is enabled. Use 'ainvoke' instead."
@@ -50,18 +114,44 @@ class OpenAIModel(MLModel):
             raise RuntimeError(msg)

         atts = self._validate_attachments(attachments)
+        api_response_format = self._map_response_format(response_format, schema)
+
         if self._has_file_ids(atts):
-            input_content = self._build_input_content(prompt, atts)
-            return self._call_responses(input_content)
+            input_content = self._build_input_content(input, atts)
+            return self._call_responses(
+                input_content, response_format=api_response_format
+            )

-        final_prompt = self._merge_plain_text(prompt, atts)
-        return self._call_chat(final_prompt)
+        if isinstance(input, str):
+            final_prompt = self._merge_plain_text(input, atts)
+            return self._call_chat(
+                [{"role": "user", "content": final_prompt}],
+                response_format=api_response_format,
+                tools=tools,
+                tool_choice=tool_choice,
+            )
+
+        messages = list(input)
+        attachments_text = self._merge_plain_text("", atts)
+        if attachments_text:
+            messages.append({"role": "user", "content": attachments_text})
+
+        return self._call_chat(
+            messages,
+            response_format=api_response_format,
+            tools=tools,
+            tool_choice=tool_choice,
+        )

     def stream(
         self,
-        prompt: str,
+        input: LLModelInput,  # noqa: A002
         *,
         attachments: list[FileAttachment] | None = None,
+        response_format: ResponseFormat | None = None,
+        schema: dict[str, Any] | None = None,
+        tools: list[dict[str, Any]] | None = None,
+        tool_choice: str | dict[str, Any] | None = None,
     ) -> Iterator[str]:
         if self.async_mode:
             msg = "Async mode is enabled. Use 'astream' instead."
@@ -71,22 +161,50 @@ class OpenAIModel(MLModel):
             raise RuntimeError(msg)

         atts = self._validate_attachments(attachments)
+        api_response_format = self._map_response_format(response_format, schema)
+
         if self._has_file_ids(atts):
-            input_content = self._build_input_content(prompt, atts)
-            for chunk in self._call_responses_stream(input_content):
+            input_content = self._build_input_content(input, atts)
+            for chunk in self._call_responses_stream(
+                input_content, response_format=api_response_format
+            ):
                 yield chunk
             return

-        final_prompt = self._merge_plain_text(prompt, atts)
-        for chunk in self._call_chat_stream(final_prompt):
+        if isinstance(input, str):
+            final_prompt = self._merge_plain_text(input, atts)
+            for chunk in self._call_chat_stream(
+                [{"role": "user", "content": final_prompt}],
+                response_format=api_response_format,
+                tools=tools,
+                tool_choice=tool_choice,
+            ):
+                yield chunk
+            return
+
+        messages = list(input)
+        attachments_text = self._merge_plain_text("", atts)
+        if attachments_text:
+            messages.append({"role": "user", "content": attachments_text})
+
+        for chunk in self._call_chat_stream(
+            messages,
+            response_format=api_response_format,
+            tools=tools,
+            tool_choice=tool_choice,
+        ):
             yield chunk

     # ---------- Public async API ----------
     async def ainvoke(
         self,
-        prompt: str,
+        input: LLModelInput,  # noqa: A002
         *,
         attachments: list[FileAttachment] | None = None,
+        response_format: ResponseFormat | None = None,
+        schema: dict[str, Any] | None = None,
+        tools: list[dict[str, Any]] | None = None,
+        tool_choice: str | dict[str, Any] | None = None,
     ) -> str:
         if not self.async_mode:
             msg = "Async mode is disabled. Use 'invoke' instead."
@@ -97,18 +215,44 @@ class OpenAIModel(MLModel):
             raise RuntimeError(msg)

         atts = self._validate_attachments(attachments)
+        api_response_format = self._map_response_format(response_format, schema)
+
         if self._has_file_ids(atts):
-            input_content = self._build_input_content(prompt, atts)
-            return await self._acall_responses(input_content)
+            input_content = self._build_input_content(input, atts)
+            return await self._acall_responses(
+                input_content, response_format=api_response_format
+            )

-        final_prompt = self._merge_plain_text(prompt, atts)
-        return await self._acall_chat(final_prompt)
+        if isinstance(input, str):
+            final_prompt = self._merge_plain_text(input, atts)
+            return await self._acall_chat(
+                [{"role": "user", "content": final_prompt}],
+                response_format=api_response_format,
+                tools=tools,
+                tool_choice=tool_choice,
+            )
+
+        messages = list(input)
+        attachments_text = self._merge_plain_text("", atts)
+        if attachments_text:
+            messages.append({"role": "user", "content": attachments_text})
+
+        return await self._acall_chat(
+            messages,
+            response_format=api_response_format,
+            tools=tools,
+            tool_choice=tool_choice,
+        )

     async def astream(
         self,
-        prompt: str,
+        input: LLModelInput,  # noqa: A002
         *,
         attachments: list[FileAttachment] | None = None,
+        response_format: ResponseFormat | None = None,
+        schema: dict[str, Any] | None = None,
+        tools: list[dict[str, Any]] | None = None,
+        tool_choice: str | dict[str, Any] | None = None,
     ) -> AsyncIterator[str]:
         if not self.async_mode:
             msg = "Async mode is disabled. Use 'stream' instead."
@@ -119,30 +263,50 @@ class OpenAIModel(MLModel):
             raise RuntimeError(msg)

         atts = self._validate_attachments(attachments)
+        api_response_format = self._map_response_format(response_format, schema)
+
         if self._has_file_ids(atts):
-            input_content = self._build_input_content(prompt, atts)
-            async for chunk in self._acall_responses_stream(input_content):
+            input_content = self._build_input_content(input, atts)
+            async for chunk in self._acall_responses_stream(
+                input_content, response_format=api_response_format
+            ):
                 yield chunk
             return

-        final_prompt = self._merge_plain_text(prompt, atts)
-        async for chunk in self._acall_chat_stream(final_prompt):
+        if isinstance(input, str):
+            final_prompt = self._merge_plain_text(input, atts)
+            async for chunk in self._acall_chat_stream(
+                [{"role": "user", "content": final_prompt}],
+                response_format=api_response_format,
+                tools=tools,
+                tool_choice=tool_choice,
+            ):
+                yield chunk
+            return
+
+        messages = list(input)
+        attachments_text = self._merge_plain_text("", atts)
+        if attachments_text:
+            messages.append({"role": "user", "content": attachments_text})
+
+        async for chunk in self._acall_chat_stream(
+            messages,
+            response_format=api_response_format,
+            tools=tools,
+            tool_choice=tool_choice,
+        ):
             yield chunk

     # ---------- lifecycle ----------
     def setup(self) -> None:
         api_key = os.getenv("OPENAI_API_KEY") or ml_config.resolved_openai_key
         if not api_key:
-            msg = (
-                "OPENAI_API_KEY is required. "
-                "Set it via env or ml_config.api_keys.openai."
-            )
+            msg = "OPENAI_API_KEY is required. Set it via env or ml_config.api_keys.openai."
             raise RuntimeError(msg)
         self._api_key = api_key

         try:
             if self.async_mode:
-                # Only create async client if loop is running; otherwise defer.
                 try:
                     asyncio.get_running_loop()
                     self._ensure_async_client()
@@ -153,6 +317,40 @@ class OpenAIModel(MLModel):
         except Exception as e:  # pragma: no cover
             raise self._map_openai_error(e) from e

+    def _map_response_format(
+        self, response_format: ResponseFormat | None, schema: dict[str, Any] | None
+    ) -> dict[str, Any] | None:
+        if response_format is None or response_format == ResponseFormat.PLAIN_TEXT:
+            return None
+
+        if response_format == ResponseFormat.JSON_OBJECT:
+            return {"type": "json_object"}
+
+        if response_format == ResponseFormat.JSON_SCHEMA:
+            if self.model_name and self.model_name in [
+                'gpt-4', 'gpt-4-0613', 'gpt-4-0314', 'gpt-3.5-turbo',
+                'gpt-3.5-turbo-0125', 'gpt-3.5-turbo-1106', 'gpt-3.5-turbo-instruct',
+                'gpt-4-0125-preview', 'gpt-4-1106-vision-preview', 'chatgpt-4o-latest',
+                'gpt-4-turbo', 'gpt-4-turbo-2024-04-09', 'gpt-4-turbo-preview',
+                'gpt-4-0125-preview', 'gpt-4-1106-vision-preview'
+            ]:
+                warnings.warn(
+                    f"Model '{self.model_name}' may not support the JSON Schema format. "
+                    "Consider using a newer model like 'gpt-4o' for guaranteed compatibility.",
+                    UserWarning,
+                    stacklevel=2
+                )
+                return None
+            if not schema:
+                msg = "`schema` is required for `JSON_SCHEMA` format."
+                raise ValueError(msg)
+            return {
+                "type": "json_schema",
+                "json_schema": schema
+            }
+
+        return None
+
     def _ensure_async_client(self) -> None:
         if self.client is None:
             try:
@@ -187,20 +385,19 @@ class OpenAIModel(MLModel):
         kinds = {a.type for a in atts}
         unsupported = kinds - self.supported_attachments()
         if unsupported:
-            msg = (
-                f"{self.__class__.__name__} does not support attachments: "
-                f"{', '.join(sorted(unsupported))}"
-            )
+            msg = f'{self.__class__.__name__} does not support attachments: {", ".join(sorted(unsupported))}'
             raise ModelAPIError(msg)

         foreign = [
-            a for a in atts if a.type == FILE_ID and (a.metadata or {}).get("provider") != "openai"
+            a
+            for a in atts
+            if a.type == FILE_ID and (a.metadata or {}).get("provider") != "openai"
         ]
         if foreign:
             provs = {(a.metadata or {}).get("provider", "unknown") for a in foreign}
             msg = (
                 f"{self.__class__.__name__} only supports FILE_ID with provider='openai'. "
-                f"Got providers: {', '.join(sorted(provs))}"
+                f'Got providers: {", ".join(sorted(provs))}'
             )
             raise ModelAPIError(msg)

@@ -210,14 +407,30 @@ class OpenAIModel(MLModel):
     def _has_file_ids(atts: list[FileAttachment]) -> bool:
         return any(a.type == FILE_ID for a in atts)

-    def _build_input_content(self, prompt: str, atts: list[FileAttachment]) -> list[dict[str, Any]]:
-        parts: list[dict[str, Any]] = [{"type": "input_text", "text": prompt}]
+    def _build_input_content(
+        self, input: LLModelInput, atts: list[FileAttachment],  # noqa: A002
+    ) -> list[StructuredMessage]:
+        if isinstance(input, str):
+            parts: list[dict[str, Any]] = [{"type": "input_text", "text": input}]
+            for a in atts:
+                if a.type == PLAIN_TEXT:
+                    parts.append({"type": "input_text", "text": str(a.content)})
+                elif a.type == FILE_ID:
+                    parts.append({"type": "input_file", "file_id": str(a.content)})
+            return [{"role": "user", "content": parts}]
+
+        messages = cast(list[StructuredMessage], [dict(msg) for msg in input])
+        parts = []
         for a in atts:
             if a.type == PLAIN_TEXT:
                 parts.append({"type": "input_text", "text": str(a.content)})
             elif a.type == FILE_ID:
                 parts.append({"type": "input_file", "file_id": str(a.content)})
-        return [{"role": "user", "content": parts}]
+
+        if parts:
+            messages.append({"role": "user", "content": parts})
+
+        return messages

     def _merge_plain_text(self, prompt: str, atts: list[FileAttachment]) -> str:
         extras = [str(a.content) for a in atts if a.type == PLAIN_TEXT]
@@ -240,132 +453,227 @@ class OpenAIModel(MLModel):
                 payload_repr = resp.json() if resp is not None else None
             except Exception:
                 payload_repr = None
-            return ModelAPIError(f"OpenAI API status error ({status}). payload={payload_repr!r}")
+            return ModelAPIError(
+                f"OpenAI API status error ({status}). payload={payload_repr!r}"
+            )
         if isinstance(err, openai.APIError):
             return ModelAPIError(str(err))
         return ModelAPIError(str(err))

     # ---------- Sync core callers ----------
-    def _call_chat(self, prompt: str) -> str:
+    def _call_chat(
+        self,
+        messages: Sequence[StructuredMessage],
+        response_format: dict[str, Any] | None = None,
+        tools: list[dict[str, Any]] | None = None,
+        tool_choice: str | dict[str, Any] | None = None,
+    ) -> str:
         client = self._require_sync_client()
+        kwargs: dict[str, Any] = {
+            "model": self.model_name,
+            "messages": messages,
+            "temperature": self.temperature,
+        }
+        if response_format:
+            kwargs["response_format"] = response_format
+        if tools:
+            kwargs["tools"] = tools
+        if tool_choice:
+            kwargs["tool_choice"] = tool_choice
+
         try:
-            resp = client.chat.completions.create(
-                model=self.model_name,
-                messages=[{"role": "user", "content": prompt}],
-                temperature=self.temperature,
-            )
-            return resp.choices[0].message.content or ""
+            resp = client.chat.completions.create(**kwargs)
         except Exception as e:
             raise self._map_openai_error(e) from e

-    def _call_chat_stream(self, prompt: str) -> Iterator[str]:
+        if tools:
+            return resp.choices[0].message.model_dump_json()
+
+        return resp.choices[0].message.content or ""
+
+    def _call_chat_stream(
+        self,
+        messages: Sequence[StructuredMessage],
+        response_format: dict[str, Any] | None = None,
+        tools: list[dict[str, Any]] | None = None,
+        tool_choice: str | dict[str, Any] | None = None,
+    ) -> Iterator[str]:
         client = self._require_sync_client()
+        kwargs: dict[str, Any] = {
+            "model": self.model_name,
+            "messages": messages,
+            "temperature": self.temperature,
+            "stream": True,
+        }
+        if response_format:
+            kwargs["response_format"] = response_format
+        if tools:
+            kwargs["tools"] = tools
+        if tool_choice:
+            kwargs["tool_choice"] = tool_choice
+
         try:
-            stream = client.chat.completions.create(
-                model=self.model_name,
-                messages=[{"role": "user", "content": prompt}],
-                temperature=self.temperature,
-                stream=True,
-            )
-            for chunk in stream:
-                delta = chunk.choices[0].delta
-                if delta and delta.content:
-                    yield delta.content
+            stream = client.chat.completions.create(**kwargs)
         except Exception as e:
             raise self._map_openai_error(e) from e

-    def _call_responses(self, input_content: list[dict[str, Any]]) -> str:
+        for chunk in stream:
+            delta = chunk.choices[0].delta
+            if delta and delta.content:
+                yield delta.content
+
+    def _call_responses(
+        self, input_content: Sequence[StructuredMessage], response_format: dict[str, Any] | None = None
+    ) -> str:
         client = self._require_sync_client()
+        kwargs: dict[str, Any] = {
+            "model": self.model_name,
+            "input": cast(Any, input_content),
+            "temperature": self.temperature,
+        }
+        if response_format:
+            kwargs["response_format"] = response_format
+
         try:
-            resp: Any = client.responses.create(
-                model=self.model_name,
-                input=cast(Any, input_content),
-                temperature=self.temperature,
-            )
-            return (getattr(resp, "output_text", None) or "").strip()
+            resp: Any = client.responses.create(**kwargs)
         except Exception as e:
             raise self._map_openai_error(e) from e

-    def _call_responses_stream(self, input_content: list[dict[str, Any]]) -> Iterator[str]:
+        return (getattr(resp, "output_text", None) or "").strip()
+
+    def _call_responses_stream(
+        self, input_content: Sequence[StructuredMessage], response_format: dict[str, Any] | None = None
+    ) -> Iterator[str]:
         client = self._require_sync_client()
+        kwargs: dict[str, Any] = {
+            "model": self.model_name,
+            "input": cast(Any, input_content),
+            "temperature": self.temperature,
+            "stream": True,
+        }
+        if response_format:
+            kwargs["response_format"] = response_format
+
         try:
-            stream_or_resp = client.responses.create(
-                model=self.model_name,
-                input=cast(Any, input_content),
-                temperature=self.temperature,
-                stream=True,
-            )
-            if isinstance(stream_or_resp, Stream):
-                for ev in stream_or_resp:
-                    delta = getattr(getattr(ev, "delta", None), "content", None)
-                    if delta:
-                        yield delta
-            else:
-                text = (getattr(stream_or_resp, "output_text", None) or "").strip()
-                if text:
-                    yield text
+            stream_or_resp = client.responses.create(**kwargs)
         except Exception as e:
             raise self._map_openai_error(e) from e

+        if isinstance(stream_or_resp, Stream):
+            for ev in stream_or_resp:
+                delta = getattr(getattr(ev, "delta", None), "content", None)
+                if delta:
+                    yield delta
+        else:
+            text = (getattr(stream_or_resp, "output_text", None) or "").strip()
+            if text:
+                yield text
+
     # ---------- Async core callers ----------
  # ---------- Async core callers ----------
311
- async def _acall_chat(self, prompt: str) -> str:
573
+ async def _acall_chat(
574
+ self,
575
+ messages: Sequence[StructuredMessage],
576
+ response_format: dict[str, Any] | None = None,
577
+ tools: list[dict[str, Any]] | None = None,
578
+ tool_choice: str | dict[str, Any] | None = None,
579
+ ) -> str:
312
580
  client = self._require_async_client()
313
- print("acall_chat:", prompt) # noqa: T201
581
+ kwargs: dict[str, Any] = {
582
+ "model": self.model_name,
583
+ "messages": messages,
584
+ "temperature": self.temperature,
585
+ }
586
+ if response_format:
587
+ kwargs["response_format"] = response_format
588
+ if tools:
589
+ kwargs["tools"] = tools
590
+ if tool_choice:
591
+ kwargs["tool_choice"] = tool_choice
592
+
314
593
  try:
315
- resp = await client.chat.completions.create(
316
- model=self.model_name,
317
- messages=[{"role": "user", "content": prompt}],
318
- temperature=self.temperature,
319
- )
320
- return resp.choices[0].message.content or ""
594
+ resp = await client.chat.completions.create(**kwargs)
321
595
  except Exception as e:
322
596
  raise self._map_openai_error(e) from e
323
597
 
324
- async def _acall_chat_stream(self, prompt: str) -> AsyncIterator[str]:
598
+ if tools:
599
+ return resp.choices[0].message.model_dump_json()
600
+
601
+ return resp.choices[0].message.content or ""
602
+
603
+ async def _acall_chat_stream(
604
+ self,
605
+ messages: Sequence[StructuredMessage],
606
+ response_format: dict[str, Any] | None = None,
607
+ tools: list[dict[str, Any]] | None = None,
608
+ tool_choice: str | dict[str, Any] | None = None,
609
+ ) -> AsyncIterator[str]:
325
610
  client = self._require_async_client()
611
+ kwargs: dict[str, Any] = {
612
+ "model": self.model_name,
613
+ "messages": messages,
614
+ "temperature": self.temperature,
615
+ "stream": True,
616
+ }
617
+ if response_format:
618
+ kwargs["response_format"] = response_format
619
+ if tools:
620
+ kwargs["tools"] = tools
621
+ if tool_choice:
622
+ kwargs["tool_choice"] = tool_choice
623
+
326
624
  try:
327
- stream = await client.chat.completions.create(
328
- model=self.model_name,
329
- messages=[{"role": "user", "content": prompt}],
330
- temperature=self.temperature,
331
- stream=True,
332
- )
333
- async for chunk in stream:
334
- delta = chunk.choices[0].delta
335
- if delta and delta.content:
336
- yield delta.content
625
+ stream = await client.chat.completions.create(**kwargs)
337
626
  except Exception as e:
338
627
  raise self._map_openai_error(e) from e
339
628
 
340
- async def _acall_responses(self, input_content: list[dict[str, Any]]) -> str:
629
+ async for chunk in stream:
630
+ delta = chunk.choices[0].delta
631
+ if delta and delta.content:
632
+ yield delta.content
633
+
634
+ async def _acall_responses(
635
+ self, input_content: Sequence[StructuredMessage], response_format: dict[str, Any] | None = None
636
+ ) -> str:
341
637
  client = self._require_async_client()
638
+ kwargs: dict[str, Any] = {
639
+ "model": self.model_name,
640
+ "input": cast(Any, input_content),
641
+ "temperature": self.temperature,
642
+ }
643
+ if response_format:
644
+ kwargs["response_format"] = response_format
645
+
342
646
  try:
343
- resp: Any = await client.responses.create(
344
- model=self.model_name,
345
- input=cast(Any, input_content),
346
- temperature=self.temperature,
347
- )
348
- return (getattr(resp, "output_text", None) or "").strip()
647
+ resp: Any = await client.responses.create(**kwargs)
349
648
  except Exception as e:
350
649
  raise self._map_openai_error(e) from e
351
650
 
352
- async def _acall_responses_stream(self, input_content: list[dict[str, Any]]) -> AsyncIterator[str]:
651
+ return (getattr(resp, "output_text", None) or "").strip()
652
+
653
+ async def _acall_responses_stream(
654
+ self, input_content: Sequence[StructuredMessage], response_format: dict[str, Any] | None = None
655
+ ) -> AsyncIterator[str]:
353
656
  client = self._require_async_client()
657
+ kwargs: dict[str, Any] = {
658
+ "model": self.model_name,
659
+ "input": cast(Any, input_content),
660
+ "temperature": self.temperature,
661
+ "stream": True,
662
+ }
663
+ if response_format:
664
+ kwargs["response_format"] = response_format
665
+
354
666
  try:
355
- stream_or_resp = await client.responses.create(
356
- model=self.model_name,
357
- input=cast(Any, input_content),
358
- temperature=self.temperature,
359
- stream=True,
360
- )
361
- if isinstance(stream_or_resp, AsyncStream):
362
- async for ev in stream_or_resp:
363
- delta = getattr(getattr(ev, "delta", None), "content", None)
364
- if delta:
365
- yield delta
366
- else:
367
- text = (getattr(stream_or_resp, "output_text", None) or "").strip()
368
- if text:
369
- yield text
667
+ stream_or_resp = await client.responses.create(**kwargs)
370
668
  except Exception as e:
371
669
  raise self._map_openai_error(e) from e
670
+
671
+ if isinstance(stream_or_resp, AsyncStream):
672
+ async for ev in stream_or_resp:
673
+ delta = getattr(getattr(ev, "delta", None), "content", None)
674
+ if delta:
675
+ yield delta
676
+ else:
677
+ text = (getattr(stream_or_resp, "output_text", None) or "").strip()
678
+ if text:
679
+ yield text
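
For orientation, the reworked OpenAIModel API shown in the diff accepts either a plain prompt string or a list of role/content messages, plus optional response_format, schema, tools, and tool_choice arguments; when tools are passed, _call_chat returns the full assistant message serialized as JSON. A minimal synchronous usage sketch based only on the diff above follows; the schema payload and tool definition are illustrative assumptions, not taken from the package, and it assumes ml_config.async_mode is disabled:

from amsdal_ml.ml_models.openai_model import OpenAIModel
from amsdal_ml.ml_models.utils import ResponseFormat

# Requires OPENAI_API_KEY in the environment or ml_config.api_keys.openai.
model = OpenAIModel(model_name="gpt-4o", temperature=0.0)
model.setup()

# String input with structured output: `schema` is passed through as the
# "json_schema" payload, so it follows OpenAI's {"name": ..., "schema": ...} shape.
answer = model.invoke(
    "Summarize the ticket in one sentence and rate its urgency 1-5.",
    response_format=ResponseFormat.JSON_SCHEMA,
    schema={
        "name": "ticket_summary",  # illustrative schema, not from the package
        "schema": {
            "type": "object",
            "properties": {
                "summary": {"type": "string"},
                "urgency": {"type": "integer"},
            },
            "required": ["summary", "urgency"],
        },
    },
)

# Message-list input with tool calling: the return value is the assistant
# message dumped as JSON (see the `if tools:` branch in _call_chat above).
raw_message = model.invoke(
    [
        {"role": "system", "content": "You are a helpful assistant."},
        {"role": "user", "content": "What is the weather in Kyiv?"},
    ],
    tools=[
        {  # illustrative tool in OpenAI function-calling format
            "type": "function",
            "function": {
                "name": "get_weather",
                "description": "Look up current weather for a city.",
                "parameters": {
                    "type": "object",
                    "properties": {"city": {"type": "string"}},
                    "required": ["city"],
                },
            },
        }
    ],
    tool_choice="auto",
)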