hammad-python 0.0.19__py3-none-any.whl → 0.0.20__py3-none-any.whl
This diff shows the changes between two publicly released versions of the package, as published to a supported registry. It is provided for informational purposes only.
- hammad/__init__.py +7 -137
- hammad/_internal.py +1 -0
- hammad/cli/_runner.py +8 -8
- hammad/cli/plugins.py +55 -26
- hammad/cli/styles/utils.py +16 -8
- hammad/data/__init__.py +1 -5
- hammad/data/collections/__init__.py +2 -3
- hammad/data/collections/collection.py +41 -22
- hammad/data/collections/indexes/__init__.py +1 -1
- hammad/data/collections/indexes/qdrant/__init__.py +1 -1
- hammad/data/collections/indexes/qdrant/index.py +106 -118
- hammad/data/collections/indexes/qdrant/settings.py +14 -14
- hammad/data/collections/indexes/qdrant/utils.py +28 -38
- hammad/data/collections/indexes/tantivy/__init__.py +1 -1
- hammad/data/collections/indexes/tantivy/index.py +57 -59
- hammad/data/collections/indexes/tantivy/settings.py +8 -19
- hammad/data/collections/indexes/tantivy/utils.py +28 -52
- hammad/data/models/__init__.py +2 -7
- hammad/data/sql/__init__.py +1 -1
- hammad/data/sql/database.py +71 -73
- hammad/data/sql/types.py +37 -51
- hammad/formatting/__init__.py +2 -1
- hammad/formatting/json/converters.py +2 -2
- hammad/genai/__init__.py +96 -36
- hammad/genai/agents/__init__.py +47 -1
- hammad/genai/agents/agent.py +1022 -0
- hammad/genai/agents/run.py +615 -0
- hammad/genai/agents/types/__init__.py +29 -22
- hammad/genai/agents/types/agent_context.py +13 -0
- hammad/genai/agents/types/agent_event.py +128 -0
- hammad/genai/agents/types/agent_hooks.py +220 -0
- hammad/genai/agents/types/agent_messages.py +31 -0
- hammad/genai/agents/types/agent_response.py +90 -0
- hammad/genai/agents/types/agent_stream.py +242 -0
- hammad/genai/models/__init__.py +1 -0
- hammad/genai/models/embeddings/__init__.py +39 -0
- hammad/genai/{embedding_models/embedding_model.py → models/embeddings/model.py} +45 -41
- hammad/genai/{embedding_models → models/embeddings}/run.py +10 -8
- hammad/genai/models/embeddings/types/__init__.py +37 -0
- hammad/genai/{embedding_models → models/embeddings/types}/embedding_model_name.py +2 -4
- hammad/genai/{embedding_models → models/embeddings/types}/embedding_model_response.py +11 -4
- hammad/genai/{embedding_models/embedding_model_request.py → models/embeddings/types/embedding_model_run_params.py} +4 -3
- hammad/genai/models/embeddings/types/embedding_model_settings.py +47 -0
- hammad/genai/models/language/__init__.py +48 -0
- hammad/genai/{language_models/language_model.py → models/language/model.py} +481 -204
- hammad/genai/{language_models → models/language}/run.py +80 -57
- hammad/genai/models/language/types/__init__.py +40 -0
- hammad/genai/models/language/types/language_model_instructor_mode.py +47 -0
- hammad/genai/models/language/types/language_model_messages.py +28 -0
- hammad/genai/{language_models/_types.py → models/language/types/language_model_name.py} +3 -40
- hammad/genai/{language_models → models/language/types}/language_model_request.py +17 -25
- hammad/genai/{language_models → models/language/types}/language_model_response.py +61 -68
- hammad/genai/{language_models → models/language/types}/language_model_response_chunk.py +8 -5
- hammad/genai/models/language/types/language_model_settings.py +89 -0
- hammad/genai/{language_models/_streaming.py → models/language/types/language_model_stream.py} +221 -243
- hammad/genai/{language_models/_utils → models/language/utils}/__init__.py +8 -11
- hammad/genai/models/language/utils/requests.py +421 -0
- hammad/genai/{language_models/_utils/_structured_outputs.py → models/language/utils/structured_outputs.py} +31 -20
- hammad/genai/models/model_provider.py +4 -0
- hammad/genai/{multimodal_models.py → models/multimodal.py} +4 -5
- hammad/genai/models/reranking.py +26 -0
- hammad/genai/types/__init__.py +1 -0
- hammad/genai/types/base.py +215 -0
- hammad/genai/{agents/types → types}/history.py +101 -88
- hammad/genai/{agents/types/tool.py → types/tools.py} +156 -141
- hammad/logging/logger.py +1 -1
- hammad/mcp/client/__init__.py +2 -3
- hammad/mcp/client/client.py +10 -10
- hammad/mcp/servers/__init__.py +2 -1
- hammad/service/decorators.py +1 -3
- hammad/web/models.py +1 -3
- hammad/web/search/client.py +10 -22
- {hammad_python-0.0.19.dist-info → hammad_python-0.0.20.dist-info}/METADATA +10 -2
- hammad_python-0.0.20.dist-info/RECORD +127 -0
- hammad/genai/embedding_models/__init__.py +0 -41
- hammad/genai/language_models/__init__.py +0 -35
- hammad/genai/language_models/_utils/_completions.py +0 -131
- hammad/genai/language_models/_utils/_messages.py +0 -89
- hammad/genai/language_models/_utils/_requests.py +0 -202
- hammad/genai/rerank_models.py +0 -26
- hammad_python-0.0.19.dist-info/RECORD +0 -111
- {hammad_python-0.0.19.dist-info → hammad_python-0.0.20.dist-info}/WHEEL +0 -0
- {hammad_python-0.0.19.dist-info → hammad_python-0.0.20.dist-info}/licenses/LICENSE +0 -0
hammad/genai/{language_models/_streaming.py → models/language/types/language_model_stream.py}
RENAMED
@@ -1,5 +1,6 @@
-"""hammad.genai.
+"""hammad.genai.models.language.types.language_model_stream"""
 
+import asyncio
 from typing import (
     List,
     Type,
@@ -11,16 +12,17 @@ from typing import (
     Any,
     Callable,
     Dict,
+    Union,
 )
 
-from
+from .....typing import get_origin, get_args
+from ....types.base import BaseGenAIModelStream
 
 from .language_model_response import LanguageModelResponse
 from .language_model_response_chunk import LanguageModelResponseChunk
 
 __all__ = [
-    "
-    "AsyncStream",
+    "LanguageModelStream",
     "InstructorStreamCollector",
     "InstructorStreamWrapper",
     "AsyncInstructorStreamWrapper",
@@ -32,86 +34,89 @@ T = TypeVar("T")
 
 class InstructorStreamCollector:
     """Collector for instructor streaming responses using hooks."""
-
+
     def __init__(self):
         self.raw_chunks = []
         self.completion_responses = []
         self.last_response = None
         self.error = None
-
+
     def on_completion_response(self, response):
         """Hook handler for completion responses."""
         self.completion_responses.append(response)
-
+
     def on_completion_error(self, error):
         """Hook handler for completion errors."""
         self.error = error
-
+
     def add_chunk(self, chunk):
         """Add a raw chunk to the collector."""
         self.raw_chunks.append(chunk)
-
+
     def get_raw_content(self):
         """Get raw content from completion responses."""
         if self.completion_responses:
             last_response = self.completion_responses[-1]
-            if hasattr(last_response,
+            if hasattr(last_response, "choices") and last_response.choices:
                 choice = last_response.choices[0]
-                if hasattr(choice,
-                    return getattr(choice.message,
+                if hasattr(choice, "message"):
+                    return getattr(choice.message, "content", None)
         return None
-
+
     def get_raw_completion(self):
         """Get the raw completion object."""
         return self.completion_responses[-1] if self.completion_responses else None
-
+
     def get_tool_calls(self):
         """Get tool calls from completion responses."""
         if self.completion_responses:
             last_response = self.completion_responses[-1]
-            if hasattr(last_response,
+            if hasattr(last_response, "choices") and last_response.choices:
                 choice = last_response.choices[0]
-                if hasattr(choice,
-                    return getattr(choice.message,
+                if hasattr(choice, "message"):
+                    return getattr(choice.message, "tool_calls", None)
         return None
 
 
 class StreamingChunkProcessor:
     """Process streaming chunks to extract only new content."""
-
+
     def __init__(self, output_type: Type[T], response_field_name: Optional[str] = None):
         self.output_type = output_type
         self.response_field_name = response_field_name
         self.previous_chunk = None
         self.previous_content = ""
-
+
     def process_chunk(self, chunk: Any) -> Optional[str]:
         """Process a chunk and return only the new content."""
         # Handle list types (e.g., list[str])
-        from
+        from .....typing import get_origin
+
         origin = get_origin(self.output_type)
-
+
         if origin is list:
             return self._process_list_chunk(chunk)
         elif self.response_field_name and hasattr(chunk, self.response_field_name):
             return self._process_field_chunk(chunk)
         else:
             return self._process_simple_chunk(chunk)
-
+
     def _process_list_chunk(self, chunk: Any) -> Optional[str]:
         """Process chunks for list types."""
         current_list = []
-
+
         if isinstance(chunk, list):
             current_list = chunk
-        elif hasattr(chunk,
+        elif hasattr(chunk, "value") and isinstance(chunk.value, list):
             current_list = chunk.value
-        elif hasattr(chunk, self.response_field_name) and isinstance(
+        elif hasattr(chunk, self.response_field_name) and isinstance(
+            getattr(chunk, self.response_field_name), list
+        ):
             current_list = getattr(chunk, self.response_field_name)
-
+
         if not current_list:
             return None
-
+
         # For list types, return only new items
         if self.previous_chunk is None:
             # First chunk - return the last item
@@ -120,24 +125,26 @@ class StreamingChunkProcessor:
             return str(current_list[-1])
         else:
             # Subsequent chunks - return only new items
-            prev_list =
+            prev_list = (
+                self.previous_chunk if isinstance(self.previous_chunk, list) else []
+            )
             prev_len = len(prev_list)
-
+
             if len(current_list) > prev_len:
                 new_items = current_list[prev_len:]
                 self.previous_chunk = current_list
                 if new_items:
                     return str(new_items[-1])
-
+
         return None
-
+
     def _process_field_chunk(self, chunk: Any) -> Optional[str]:
         """Process chunks with a specific response field."""
         if not hasattr(chunk, self.response_field_name):
             return None
-
+
         field_value = getattr(chunk, self.response_field_name)
-
+
         if isinstance(field_value, str):
             # For string fields, return only new content
             if self.previous_chunk is None:
@@ -147,9 +154,9 @@ class StreamingChunkProcessor:
             else:
                 prev_value = self.previous_content
                 current_value = field_value
-
+
                 if current_value.startswith(prev_value):
-                    new_content = current_value[len(prev_value):]
+                    new_content = current_value[len(prev_value) :]
                     self.previous_chunk = chunk
                     self.previous_content = current_value
                     return new_content if new_content else None
@@ -166,23 +173,23 @@ class StreamingChunkProcessor:
             else:
                 prev_field = getattr(self.previous_chunk, self.response_field_name, [])
                 prev_len = len(prev_field) if isinstance(prev_field, list) else 0
-
+
             if len(field_value) > prev_len:
                 new_items = field_value[prev_len:]
                 self.previous_chunk = chunk
                 if new_items:
                     return str(new_items[-1])
-
+
         return None
-
+
     def _process_simple_chunk(self, chunk: Any) -> Optional[str]:
         """Process simple chunks without response fields."""
-        if hasattr(chunk,
+        if hasattr(chunk, "value"):
             value = chunk.value
             if isinstance(value, str):
                 if self.previous_content:
                     if value.startswith(self.previous_content):
-                        new_content = value[len(self.previous_content):]
+                        new_content = value[len(self.previous_content) :]
                         self.previous_content = value
                         return new_content if new_content else None
                     else:
@@ -194,7 +201,7 @@ class StreamingChunkProcessor:
         elif isinstance(chunk, str):
             if self.previous_content:
                 if chunk.startswith(self.previous_content):
-                    new_content = chunk[len(self.previous_content):]
+                    new_content = chunk[len(self.previous_content) :]
                     self.previous_content = chunk
                     return new_content if new_content else None
                 else:
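The `StreamingChunkProcessor` hunks above are mostly formatting-only, but they show the technique the class relies on: instructor emits cumulative partial values, and the processor recovers the per-chunk delta by comparing each value against the previously seen prefix. A minimal, self-contained sketch of that idea (the function name and structure below are illustrative, not part of the hammad API):

```python
# Sketch: derive per-chunk deltas from cumulative partial strings,
# mirroring the prefix comparison used by StreamingChunkProcessor.
from typing import Iterator, Optional


def extract_deltas(partials: Iterator[str]) -> Iterator[str]:
    previous = ""
    for current in partials:
        if current.startswith(previous):
            # Normal case: the new value extends the old one.
            delta: Optional[str] = current[len(previous):] or None
        else:
            # Value changed shape; emit it whole.
            delta = current
        previous = current
        if delta:
            yield delta


# Cumulative partials like an instructor stream would produce:
print(list(extract_deltas(["He", "Hell", "Hello!"])))  # ['He', 'll', 'o!']
```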
@@ -206,83 +213,95 @@ class StreamingChunkProcessor:
         elif self.output_type in (int, float, bool):
             # For primitive types, return string representation
             return str(chunk)
-
+
         return None
 
 
 class InstructorStreamWrapper:
     """Wrapper for instructor streams that collects raw responses via hooks."""
-
+
     def __init__(self, stream: Iterator[Any], collector: InstructorStreamCollector):
         self._stream = stream
         self.collector = collector
-
+
     def __iter__(self):
         return self
-
+
     def __next__(self):
         chunk = next(self._stream)
         self.collector.add_chunk(chunk)
         return chunk
-
+
     def get_raw_content(self):
         return self.collector.get_raw_content()
-
+
     def get_raw_completion(self):
         return self.collector.get_raw_completion()
-
+
     def get_tool_calls(self):
         return self.collector.get_tool_calls()
 
 
 class AsyncInstructorStreamWrapper:
     """Async wrapper for instructor streams that collects raw responses via hooks."""
-
-    def __init__(
+
+    def __init__(
+        self, stream: AsyncIterator[Any], collector: InstructorStreamCollector
+    ):
         self._stream = stream
         self.collector = collector
-
+
     def __aiter__(self):
         return self
-
+
     async def __anext__(self):
         chunk = await self._stream.__anext__()
         self.collector.add_chunk(chunk)
         return chunk
-
+
     def get_raw_content(self):
         return self.collector.get_raw_content()
-
+
     def get_raw_completion(self):
         return self.collector.get_raw_completion()
-
+
     def get_tool_calls(self):
         return self.collector.get_tool_calls()
 
 
-class
-
+class LanguageModelStream(
+    BaseGenAIModelStream[LanguageModelResponseChunk[T]], Generic[T]
+):
+    """Unified stream wrapper for language model streaming.
 
-    This class provides a unified interface for streaming responses
-    from both LiteLLM and Instructor, handling the different chunk
-
+    This class provides a unified interface for both sync and async streaming responses
+    from both LiteLLM and Instructor, handling the different chunk formats and providing
+    consistent access patterns. It inherits from BaseGenAIModelStream and manages
+    both sync and async streaming in a single class.
     """
 
     def __init__(
         self,
-        stream: Iterator[Any],
+        stream: Union[Iterator[Any], AsyncIterator[Any]],
         output_type: Type[T] = str,
         model: Optional[str] = None,
         response_field_name: Optional[str] = None,
     ):
         """Initialize the stream.
-
+
         Args:
-            stream: The underlying stream iterator
+            stream: The underlying stream iterator (sync or async)
             output_type: The expected output type
             model: The model name
             response_field_name: The field name for structured outputs
         """
+        # Initialize base class
+        super().__init__(
+            type="language_model",
+            model=model or "unknown",
+            stream=stream,
+        )
+
         self._stream = stream
         self._output_type = output_type
         self._model = model
@@ -292,9 +311,31 @@ class Stream(Generic[T]):
         self._is_instructor = output_type != str
         self._is_consumed = False
         self._previous_chunk_output = None
+        self._is_async = hasattr(stream, "__anext__")
+        self._full_content = ""
 
     def __iter__(self) -> Iterator[LanguageModelResponseChunk[T]]:
-        """Iterate over response chunks."""
+        """Iterate over response chunks (sync mode)."""
+        if self._is_async:
+            # This is a workaround to allow sync iteration over an async stream
+            # It's not ideal, but it works for simple cases.
+            # A better solution would be to use a dedicated sync entrypoint
+            # if this is a common use case.
+            try:
+                loop = asyncio.get_running_loop()
+            except RuntimeError:
+                loop = asyncio.new_event_loop()
+                asyncio.set_event_loop(loop)
+
+            async_iter = self.__aiter__()
+            while True:
+                try:
+                    # We are calling the async __anext__ which returns a processed chunk
+                    yield loop.run_until_complete(async_iter.__anext__())
+                except StopAsyncIteration:
+                    break
+            return
+
         for chunk in self._stream:
             response_chunk = self._process_chunk(chunk)
             if response_chunk:
@@ -302,18 +343,46 @@ class Stream(Generic[T]):
                 yield response_chunk
         self._is_consumed = True
 
+    def __aiter__(self) -> AsyncIterator[LanguageModelResponseChunk[T]]:
+        """Async iterate over response chunks (async mode)."""
+        if not self._is_async:
+            raise RuntimeError(
+                "Cannot use async iteration on sync stream. Use regular for loop instead."
+            )
+        return self
+
+    async def __anext__(self) -> LanguageModelResponseChunk[T]:
+        """Get the next response chunk (async mode)."""
+        if not self._is_async:
+            raise RuntimeError(
+                "Cannot use async iteration on sync stream. Use regular for loop instead."
+            )
+
+        try:
+            chunk = await self._stream.__anext__()
+            response_chunk = self._process_chunk(chunk)
+            if response_chunk:
+                self._chunks.append(response_chunk)
+                return response_chunk
+            else:
+                return await self.__anext__()  # Skip empty chunks
+        except StopAsyncIteration:
+            self._is_consumed = True
+            raise StopAsyncIteration
+
     def _process_chunk(self, chunk: Any) -> Optional[LanguageModelResponseChunk[T]]:
         """Process a raw chunk into a LanguageModelResponseChunk."""
         if self._is_instructor:
             # Handle instructor streaming (Partial/Iterable)
-
-
+
             # Use the chunk processor to get only new content
-            if not hasattr(self,
-                self._chunk_processor = StreamingChunkProcessor(
-
+            if not hasattr(self, "_chunk_processor"):
+                self._chunk_processor = StreamingChunkProcessor(
+                    self._output_type, self._response_field_name
+                )
+
             content = self._chunk_processor.process_chunk(chunk)
-
+
             # Extract the proper output value
             if self._response_field_name and hasattr(chunk, self._response_field_name):
                 output_value = getattr(chunk, self._response_field_name)
@@ -335,9 +404,12 @@ class Stream(Generic[T]):
             if hasattr(choice, "delta") and choice.delta:
                 content = getattr(choice.delta, "content", None)
 
+            if content is not None:
+                self._full_content += content
+
             return LanguageModelResponseChunk(
                 content=content,
-                output=
+                output=self._full_content,
                 model=getattr(chunk, "model", self._model),
                 finish_reason=getattr(choice, "finish_reason", None),
                 chunk=chunk,
@@ -346,11 +418,34 @@ class Stream(Generic[T]):
         return None
 
     def collect(self) -> LanguageModelResponse[T]:
-        """Collect all chunks and return a complete LanguageModelResponse object."""
+        """Collect all chunks and return a complete LanguageModelResponse object (sync mode)."""
+        if self._is_async:
+            raise RuntimeError(
+                "Cannot use sync collect() on async stream. Use async collect() instead."
+            )
+
         if not self._chunks:
             # Consume the stream if not already consumed
             list(self)
 
+        return self._build_response()
+
+    async def async_collect(self) -> LanguageModelResponse[T]:
+        """Collect all chunks and return a complete LanguageModelResponse object (async mode)."""
+        if not self._is_async:
+            raise RuntimeError(
+                "Cannot use async collect() on sync stream. Use sync collect() instead."
+            )
+
+        if not self._chunks:
+            # Consume the stream if not already consumed
+            async for _ in self:
+                pass
+
+        return self._build_response()
+
+    def _build_response(self) -> LanguageModelResponse[T]:
+        """Build the final LanguageModelResponse from collected chunks."""
         if self._is_instructor and self._chunks:
             # For instructor, the final chunk contains the complete object
             final_chunk = self._chunks[-1]
@@ -359,7 +454,7 @@ class Stream(Generic[T]):
             raw_content = None
             raw_completion = None
             tool_calls = None
-
+
             if hasattr(self._stream, "collector"):
                 collector = self._stream.collector
                 raw_content = collector.get_raw_content()
@@ -367,8 +462,16 @@ class Stream(Generic[T]):
                 tool_calls = collector.get_tool_calls()
             elif hasattr(self._stream, "get_raw_content"):
                 raw_content = self._stream.get_raw_content()
-                raw_completion =
-
+                raw_completion = (
+                    self._stream.get_raw_completion()
+                    if hasattr(self._stream, "get_raw_completion")
+                    else None
+                )
+                tool_calls = (
+                    self._stream.get_tool_calls()
+                    if hasattr(self._stream, "get_tool_calls")
+                    else None
+                )
 
             return LanguageModelResponse(
                 output=final_chunk.output,
@@ -395,7 +498,7 @@ class Stream(Generic[T]):
             )
 
     def to_response(self) -> LanguageModelResponse[T]:
-        """Convert the stream to a LanguageModelResponse object.
+        """Convert the stream to a LanguageModelResponse object (sync mode).
 
         This method can only be called after the stream has been fully consumed.
         It's an alias for collect() with a check for consumption state.
@@ -404,8 +507,13 @@ class Stream(Generic[T]):
             LanguageModelResponse[T]: The complete response object
 
         Raises:
-            RuntimeError: If the stream has not been fully consumed
+            RuntimeError: If the stream has not been fully consumed or is async
         """
+        if self._is_async:
+            raise RuntimeError(
+                "Cannot use sync to_response() on async stream. Use async to_response() instead."
+            )
+
         if not self._is_consumed and not self._chunks:
             raise RuntimeError(
                 "Stream must be fully consumed before converting to response. "
@@ -414,194 +522,59 @@ class Stream(Generic[T]):
 
         return self.collect()
 
-    def
-        """Convert the stream to a
+    async def async_to_response(self) -> LanguageModelResponse[T]:
+        """Convert the stream to a LanguageModelResponse object (async mode).
 
         This method can only be called after the stream has been fully consumed.
-        It
+        It's an alias for async_collect() with a check for consumption state.
 
         Returns:
-
+            LanguageModelResponse[T]: The complete response object
 
         Raises:
-            RuntimeError: If the stream has not been fully consumed
+            RuntimeError: If the stream has not been fully consumed or is sync
         """
-        if not self.
+        if not self._is_async:
             raise RuntimeError(
-                "
-                "Use collect() or iterate through the stream first."
+                "Cannot use async to_response() on sync stream. Use sync to_response() instead."
             )
 
-
-
-
-
-class AsyncStream(Generic[T]):
-    """Asynchronous stream wrapper for language model streaming.
-
-    This class provides a unified interface for async streaming responses
-    from both LiteLLM and Instructor, handling the different chunk
-    formats and providing consistent access patterns.
-    """
-
-    def __init__(
-        self,
-        stream: AsyncIterator[Any],
-        output_type: Type[T] = str,
-        model: Optional[str] = None,
-        response_field_name: Optional[str] = None,
-    ):
-        """Initialize the async stream.
-
-        Args:
-            stream: The underlying async stream iterator
-            output_type: The expected output type
-            model: The model name
-            response_field_name: The field name for structured outputs
-        """
-        self._stream = stream
-        self._output_type = output_type
-        self._model = model
-        self._response_field_name = response_field_name
-        self._chunks: List[LanguageModelResponseChunk[T]] = []
-        self._final_output: Optional[T] = None
-        self._is_instructor = output_type != str
-        self._is_consumed = False
-        self._previous_chunk_output = None
-
-    def __aiter__(self) -> AsyncIterator[LanguageModelResponseChunk[T]]:
-        """Async iterate over response chunks."""
-        return self
-
-    async def __anext__(self) -> LanguageModelResponseChunk[T]:
-        """Get the next response chunk."""
-        try:
-            chunk = await self._stream.__anext__()
-            response_chunk = self._process_chunk(chunk)
-            if response_chunk:
-                self._chunks.append(response_chunk)
-                return response_chunk
-            else:
-                return await self.__anext__()  # Skip empty chunks
-        except StopAsyncIteration:
-            self._is_consumed = True
-            raise StopAsyncIteration
-
-    def _process_chunk(self, chunk: Any) -> Optional[LanguageModelResponseChunk[T]]:
-        """Process a raw chunk into a LanguageModelResponseChunk."""
-        if self._is_instructor:
-            # Handle instructor streaming (Partial/Iterable)
-            output = chunk
-
-            # Use the chunk processor to get only new content
-            if not hasattr(self, '_chunk_processor'):
-                self._chunk_processor = StreamingChunkProcessor(self._output_type, self._response_field_name)
-
-            content = self._chunk_processor.process_chunk(chunk)
-
-            # Extract the proper output value
-            if self._response_field_name and hasattr(chunk, self._response_field_name):
-                output_value = getattr(chunk, self._response_field_name)
-            else:
-                output_value = chunk
-
-            return LanguageModelResponseChunk(
-                output=output_value,
-                content=content,
-                model=self._model,
-                chunk=chunk,
-                is_final=hasattr(chunk, "_is_final") and chunk._is_final,
-            )
-        else:
-            # Handle LiteLLM streaming (ChatCompletionChunk)
-            if hasattr(chunk, "choices") and chunk.choices:
-                choice = chunk.choices[0]
-                content = None
-                if hasattr(choice, "delta") and choice.delta:
-                    content = getattr(choice.delta, "content", None)
-
-                return LanguageModelResponseChunk(
-                    content=content,
-                    output=content,
-                    model=getattr(chunk, "model", self._model),
-                    finish_reason=getattr(choice, "finish_reason", None),
-                    chunk=chunk,
-                    is_final=getattr(choice, "finish_reason", None) is not None,
-                )
-            return None
-
-    async def collect(self) -> LanguageModelResponse[T]:
-        """Collect all chunks and return a complete LanguageModelResponse object."""
-        if not self._chunks:
-            # Consume the stream if not already consumed
-            async for _ in self:
-                pass
-
-        if self._is_instructor and self._chunks:
-            # For instructor, the final chunk contains the complete object
-            final_chunk = self._chunks[-1]
-
-            # Check if stream collector is available for raw content
-            raw_content = None
-            raw_completion = None
-            tool_calls = None
-
-            if hasattr(self._stream, "collector"):
-                collector = self._stream.collector
-                raw_content = collector.get_raw_content()
-                raw_completion = collector.get_raw_completion()
-                tool_calls = collector.get_tool_calls()
-            elif hasattr(self._stream, "get_raw_content"):
-                raw_content = self._stream.get_raw_content()
-                raw_completion = self._stream.get_raw_completion() if hasattr(self._stream, "get_raw_completion") else None
-                tool_calls = self._stream.get_tool_calls() if hasattr(self._stream, "get_tool_calls") else None
-
-            return LanguageModelResponse(
-                output=final_chunk.output,
-                model=final_chunk.model or self._model or "unknown",
-                completion=raw_completion,
-                content=raw_content,
-                tool_calls=tool_calls,
+        if not self._is_consumed and not self._chunks:
+            raise RuntimeError(
+                "Stream must be fully consumed before converting to response. "
+                "Use async_collect() or iterate through the stream first."
             )
-        else:
-            # For LiteLLM, combine content from all chunks
-            content_parts = [chunk.content for chunk in self._chunks if chunk.content]
-            combined_content = "".join(content_parts)
 
-
-            mock_completion = None
-            if self._chunks:
-                mock_completion = self._chunks[-1].chunk
+        return await self.async_collect()
 
-
-
-                model=self._model or "unknown",
-                completion=mock_completion,
-                content=combined_content,
-            )
-
-    async def to_response(self) -> LanguageModelResponse[T]:
-        """Convert the stream to a LanguageModelResponse object.
+    def to_message(self) -> Any:
+        """Convert the stream to a ChatCompletionMessageParam (sync mode).
 
         This method can only be called after the stream has been fully consumed.
-        It
+        It converts the final response to a message format.
 
         Returns:
-
+            ChatCompletionMessageParam: The response as a chat message
 
         Raises:
-            RuntimeError: If the stream has not been fully consumed
+            RuntimeError: If the stream has not been fully consumed or is async
         """
+        if self._is_async:
+            raise RuntimeError(
+                "Cannot use sync to_message() on async stream. Use async to_message() instead."
+            )
+
         if not self._is_consumed and not self._chunks:
             raise RuntimeError(
-                "Stream must be fully consumed before converting to
+                "Stream must be fully consumed before converting to message. "
                 "Use collect() or iterate through the stream first."
             )
 
-
+        response = self.collect()
+        return response.to_message()
 
-    async def
-        """Convert the stream to a ChatCompletionMessageParam.
+    async def async_to_message(self) -> Any:
+        """Convert the stream to a ChatCompletionMessageParam (async mode).
 
         This method can only be called after the stream has been fully consumed.
         It converts the final response to a message format.
@@ -610,13 +583,18 @@ class AsyncStream(Generic[T]):
             ChatCompletionMessageParam: The response as a chat message
 
         Raises:
-            RuntimeError: If the stream has not been fully consumed
+            RuntimeError: If the stream has not been fully consumed or is sync
         """
+        if not self._is_async:
+            raise RuntimeError(
+                "Cannot use async to_message() on sync stream. Use sync to_message() instead."
+            )
+
         if not self._is_consumed and not self._chunks:
             raise RuntimeError(
                 "Stream must be fully consumed before converting to message. "
-                "Use
+                "Use async_collect() or iterate through the stream first."
             )
 
-        response = await self.
-        return response.to_message()
+        response = await self.async_collect()
+        return response.to_message()