vectorvein 0.1.77__py3-none-any.whl → 0.1.78__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -21,6 +21,7 @@ from .moonshot_client import MoonshotChatClient, AsyncMoonshotChatClient
 from .deepseek_client import DeepSeekChatClient, AsyncDeepSeekChatClient
 
 from ..types import defaults as defs
+from ..types.llm_parameters import NOT_GIVEN, NotGiven
 from ..types.enums import BackendType, ContextLengthControlType
 from .anthropic_client import AnthropicChatClient, AsyncAnthropicChatClient
 from .utils import format_messages, get_token_counts, get_message_token_counts, ToolCallContentProcessor
@@ -69,7 +70,7 @@ def create_chat_client(
     backend: Literal[BackendType.Anthropic],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -83,7 +84,7 @@ def create_chat_client(
     backend: Literal[BackendType.DeepSeek],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -97,7 +98,7 @@ def create_chat_client(
    backend: Literal[BackendType.Gemini],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -111,7 +112,7 @@ def create_chat_client(
     backend: Literal[BackendType.Groq],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -125,7 +126,7 @@ def create_chat_client(
     backend: Literal[BackendType.Local],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -139,7 +140,7 @@ def create_chat_client(
     backend: Literal[BackendType.MiniMax],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -153,7 +154,7 @@ def create_chat_client(
     backend: Literal[BackendType.Mistral],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -167,7 +168,7 @@ def create_chat_client(
     backend: Literal[BackendType.Moonshot],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -181,7 +182,7 @@ def create_chat_client(
     backend: Literal[BackendType.OpenAI],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -195,7 +196,7 @@ def create_chat_client(
     backend: Literal[BackendType.Qwen],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -209,7 +210,7 @@ def create_chat_client(
     backend: Literal[BackendType.Yi],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -223,7 +224,7 @@ def create_chat_client(
     backend: Literal[BackendType.ZhiPuAI],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -237,7 +238,7 @@ def create_chat_client(
     backend: Literal[BackendType.Baichuan],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -251,7 +252,7 @@ def create_chat_client(
     backend: Literal[BackendType.StepFun],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -265,7 +266,7 @@ def create_chat_client(
     backend: Literal[BackendType.XAI],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -279,7 +280,7 @@ def create_chat_client(
     backend: BackendType,
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -292,7 +293,7 @@ def create_chat_client(
     backend: BackendType,
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -322,7 +323,7 @@ def create_async_chat_client(
     backend: Literal[BackendType.Anthropic],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -336,7 +337,7 @@ def create_async_chat_client(
     backend: Literal[BackendType.DeepSeek],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -350,7 +351,7 @@ def create_async_chat_client(
     backend: Literal[BackendType.Gemini],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -364,7 +365,7 @@ def create_async_chat_client(
     backend: Literal[BackendType.Groq],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -378,7 +379,7 @@ def create_async_chat_client(
     backend: Literal[BackendType.Local],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -392,7 +393,7 @@ def create_async_chat_client(
     backend: Literal[BackendType.MiniMax],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -406,7 +407,7 @@ def create_async_chat_client(
     backend: Literal[BackendType.Mistral],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -420,7 +421,7 @@ def create_async_chat_client(
     backend: Literal[BackendType.Moonshot],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -434,7 +435,7 @@ def create_async_chat_client(
     backend: Literal[BackendType.OpenAI],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -448,7 +449,7 @@ def create_async_chat_client(
     backend: Literal[BackendType.Qwen],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -462,7 +463,7 @@ def create_async_chat_client(
     backend: Literal[BackendType.Yi],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -476,7 +477,7 @@ def create_async_chat_client(
     backend: Literal[BackendType.ZhiPuAI],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -490,7 +491,7 @@ def create_async_chat_client(
     backend: Literal[BackendType.Baichuan],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -504,7 +505,7 @@ def create_async_chat_client(
     backend: Literal[BackendType.StepFun],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -518,7 +519,7 @@ def create_async_chat_client(
     backend: Literal[BackendType.XAI],
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -532,7 +533,7 @@ def create_async_chat_client(
     backend: BackendType,
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
@@ -545,7 +546,7 @@ def create_async_chat_client(
     backend: BackendType,
     model: str | None = None,
     stream: bool = False,
-    temperature: float = 0.7,
+    temperature: float | None | NotGiven = NOT_GIVEN,
     context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
     random_endpoint: bool = True,
     endpoint_id: str = "",
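
In every create_chat_client / create_async_chat_client overload above, temperature changes from a hard-coded 0.7 default to the NOT_GIVEN sentinel, so a caller that omits it no longer forces 0.7 and the backend's own default applies. A minimal sketch of the calling side, assuming endpoints are already configured; the model name is a placeholder, not taken from this diff:

from vectorvein.chat_clients import create_chat_client
from vectorvein.types.enums import BackendType

# No temperature argument: it stays NOT_GIVEN and is simply omitted from
# the request instead of being sent as 0.7 (the 0.1.77 behaviour).
client = create_chat_client(backend=BackendType.OpenAI, model="gpt-4o", stream=False)

# An explicit float is still forwarded unchanged.
warm_client = create_chat_client(backend=BackendType.OpenAI, model="gpt-4o", temperature=0.9)
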
@@ -157,7 +157,7 @@ class AnthropicChatClient(BaseChatClient):
         self,
         model: str = defs.ANTHROPIC_DEFAULT_MODEL,
         stream: bool = True,
-        temperature: float = 0.7,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
         random_endpoint: bool = True,
         endpoint_id: str = "",
@@ -253,7 +253,7 @@ class AnthropicChatClient(BaseChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[False] = False,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -272,7 +272,7 @@ class AnthropicChatClient(BaseChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[True],
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -291,7 +291,7 @@ class AnthropicChatClient(BaseChatClient):
         messages: list,
         model: str | None = None,
         stream: bool,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -309,7 +309,7 @@ class AnthropicChatClient(BaseChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[False] | Literal[True] = False,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -401,6 +401,8 @@ class AnthropicChatClient(BaseChatClient):
             tool_choice = NOT_GIVEN
         if isinstance(top_p, OpenAINotGiven) or top_p is None:
             top_p = NOT_GIVEN
+        if isinstance(self.temperature, NotGiven) or self.temperature is None:
+            self.temperature = NOT_GIVEN
 
         if messages[0].get("role") == "system":
             system_prompt: str = messages[0]["content"]
@@ -492,7 +494,13 @@ class AnthropicChatClient(BaseChatClient):
                 result["usage"]["total_tokens"] = (
                     result["usage"]["prompt_tokens"] + result["usage"]["completion_tokens"]
                 )
-                yield ChatCompletionDeltaMessage(usage=Usage(**result["usage"]))
+                yield ChatCompletionDeltaMessage(
+                    usage=Usage(
+                        prompt_tokens=result["usage"]["prompt_tokens"],
+                        completion_tokens=result["usage"]["completion_tokens"],
+                        total_tokens=result["usage"]["total_tokens"],
+                    )
+                )
 
             return generator()
         else:
@@ -538,7 +546,7 @@ class AsyncAnthropicChatClient(BaseAsyncChatClient):
         self,
         model: str = defs.ANTHROPIC_DEFAULT_MODEL,
         stream: bool = True,
-        temperature: float = 0.7,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
         random_endpoint: bool = True,
         endpoint_id: str = "",
@@ -633,7 +641,7 @@ class AsyncAnthropicChatClient(BaseAsyncChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[False] = False,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -652,7 +660,7 @@ class AsyncAnthropicChatClient(BaseAsyncChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[True],
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -671,7 +679,7 @@ class AsyncAnthropicChatClient(BaseAsyncChatClient):
         messages: list,
         model: str | None = None,
         stream: bool,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -689,7 +697,7 @@ class AsyncAnthropicChatClient(BaseAsyncChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[False] | Literal[True] = False,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -783,6 +791,8 @@ class AsyncAnthropicChatClient(BaseAsyncChatClient):
             tool_choice = NOT_GIVEN
         if isinstance(top_p, OpenAINotGiven) or top_p is None:
             top_p = NOT_GIVEN
+        if isinstance(self.temperature, NotGiven) or self.temperature is None:
+            self.temperature = NOT_GIVEN
 
         if messages[0].get("role") == "system":
             system_prompt = messages[0]["content"]
@@ -874,7 +884,13 @@ class AsyncAnthropicChatClient(BaseAsyncChatClient):
                 result["usage"]["total_tokens"] = (
                     result["usage"]["prompt_tokens"] + result["usage"]["completion_tokens"]
                 )
-                yield ChatCompletionDeltaMessage(usage=Usage(**result["usage"]))
+                yield ChatCompletionDeltaMessage(
+                    usage=Usage(
+                        prompt_tokens=result["usage"]["prompt_tokens"],
+                        completion_tokens=result["usage"]["completion_tokens"],
+                        total_tokens=result["usage"]["total_tokens"],
+                    )
+                )
 
             return generator()
         else:
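
The two-line additions in the @@ -401 and @@ -783 hunks normalize self.temperature so that both None and a NotGiven instance collapse to the NOT_GIVEN sentinel before the Anthropic request is assembled. The same idiom in isolation, as a sketch using the sentinel types re-exported by vectorvein.types.llm_parameters (the helper name is illustrative):

from vectorvein.types.llm_parameters import NOT_GIVEN, NotGiven

def normalize_temperature(value):
    # Treat "not provided" (a NotGiven instance) and an explicit None the
    # same way: return the sentinel so the field is dropped from the payload.
    if isinstance(value, NotGiven) or value is None:
        return NOT_GIVEN
    return value
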
@@ -9,8 +9,8 @@ import httpx
 from openai import OpenAI, AsyncOpenAI, AzureOpenAI, AsyncAzureOpenAI
 from anthropic import (
     Anthropic,
-    AnthropicVertex,
     AsyncAnthropic,
+    AnthropicVertex,
     AsyncAnthropicVertex,
     AnthropicBedrock,
     AsyncAnthropicBedrock,
@@ -39,7 +39,7 @@ class BaseChatClient(ABC):
         self,
         model: str = "",
         stream: bool = False,
-        temperature: float = 0.7,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
         random_endpoint: bool = True,
         endpoint_id: str = "",
@@ -108,7 +108,7 @@ class BaseChatClient(ABC):
         messages: list,
         model: str | None = None,
         stream: Literal[False] = False,
-        temperature: float = 0.7,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -128,7 +128,7 @@ class BaseChatClient(ABC):
         messages: list,
         model: str | None = None,
         stream: Literal[True],
-        temperature: float = 0.7,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -148,7 +148,7 @@ class BaseChatClient(ABC):
         messages: list,
         model: str | None = None,
         stream: bool,
-        temperature: float = 0.7,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -167,7 +167,7 @@ class BaseChatClient(ABC):
         messages: list,
         model: str | None = None,
         stream: Literal[False] | Literal[True] = False,
-        temperature: float = 0.7,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -184,7 +184,7 @@ class BaseChatClient(ABC):
         *,
         messages: list,
         model: str | None = None,
-        temperature: float = 0.7,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -216,7 +216,7 @@ class BaseAsyncChatClient(ABC):
         self,
         model: str = "",
         stream: bool = False,
-        temperature: float = 0.7,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
         random_endpoint: bool = True,
         endpoint_id: str = "",
@@ -293,7 +293,7 @@ class BaseAsyncChatClient(ABC):
         messages: list,
         model: str | None = None,
         stream: Literal[False] = False,
-        temperature: float = 0.7,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: list | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -313,7 +313,7 @@ class BaseAsyncChatClient(ABC):
         messages: list,
         model: str | None = None,
         stream: Literal[True],
-        temperature: float = 0.7,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: list | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -333,7 +333,7 @@ class BaseAsyncChatClient(ABC):
         messages: list,
         model: str | None = None,
         stream: bool,
-        temperature: float = 0.7,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: list | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -352,7 +352,7 @@ class BaseAsyncChatClient(ABC):
         messages: list,
         model: str | None = None,
         stream: Literal[False] | Literal[True] = False,
-        temperature: float = 0.7,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: list | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -369,7 +369,7 @@ class BaseAsyncChatClient(ABC):
         *,
         messages: list,
         model: str | None = None,
-        temperature: float = 0.7,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: list | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -29,7 +29,7 @@ class GeminiChatClient(BaseChatClient):
         self,
         model: str = defs.GEMINI_DEFAULT_MODEL,
         stream: bool = True,
-        temperature: float = 0.7,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
         random_endpoint: bool = True,
         endpoint_id: str = "",
@@ -63,7 +63,7 @@ class GeminiChatClient(BaseChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[False] = False,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -82,7 +82,7 @@ class GeminiChatClient(BaseChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[True],
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -101,7 +101,7 @@ class GeminiChatClient(BaseChatClient):
         messages: list,
         model: str | None = None,
         stream: bool,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -119,7 +119,7 @@ class GeminiChatClient(BaseChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[False] | Literal[True] = False,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -169,6 +169,10 @@ class GeminiChatClient(BaseChatClient):
         if top_p:
             top_p_params = {"top_p": top_p}
 
+        temperature_params = {}
+        if temperature:
+            temperature_params = {"temperature": temperature}
+
         request_body = {
             "contents": messages,
             "safetySettings": [
@@ -178,8 +182,8 @@ class GeminiChatClient(BaseChatClient):
                 }
             ],
             "generationConfig": {
-                "temperature": self.temperature,
                 "maxOutputTokens": max_tokens,
+                **temperature_params,
                 **top_p_params,
                 **response_format_params,
             },
@@ -277,7 +281,7 @@ class AsyncGeminiChatClient(BaseAsyncChatClient):
         self,
         model: str = defs.GEMINI_DEFAULT_MODEL,
         stream: bool = True,
-        temperature: float = 0.7,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
         random_endpoint: bool = True,
         endpoint_id: str = "",
@@ -311,7 +315,7 @@ class AsyncGeminiChatClient(BaseAsyncChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[False] = False,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -330,7 +334,7 @@ class AsyncGeminiChatClient(BaseAsyncChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[True],
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -349,7 +353,7 @@ class AsyncGeminiChatClient(BaseAsyncChatClient):
         messages: list,
         model: str | None = None,
         stream: bool,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -367,7 +371,7 @@ class AsyncGeminiChatClient(BaseAsyncChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[False] | Literal[True] = False,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -417,6 +421,10 @@ class AsyncGeminiChatClient(BaseAsyncChatClient):
         if top_p:
             top_p_params = {"top_p": top_p}
 
+        temperature_params = {}
+        if temperature:
+            temperature_params = {"temperature": temperature}
+
         request_body = {
             "contents": messages,
             "safetySettings": [
@@ -426,8 +434,8 @@ class AsyncGeminiChatClient(BaseAsyncChatClient):
                 }
             ],
             "generationConfig": {
-                "temperature": self.temperature,
                 "maxOutputTokens": max_tokens,
+                **temperature_params,
                 **top_p_params,
                 **response_format_params,
             },
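
With these hunks the Gemini clients (and the MiniMax clients below) only put temperature into the request when a value is actually set, instead of always sending self.temperature. The conditional-merge pattern on its own, with illustrative values:

temperature = None  # e.g. left unset by the caller
max_tokens = 1024
top_p_params = {}

temperature_params = {"temperature": temperature} if temperature else {}

generation_config = {
    "maxOutputTokens": max_tokens,
    **temperature_params,
    **top_p_params,
}
# -> {"maxOutputTokens": 1024}: no temperature key is included when it is unset
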
@@ -51,7 +51,7 @@ class MiniMaxChatClient(BaseChatClient):
         self,
         model: str = defs.MINIMAX_DEFAULT_MODEL,
         stream: bool = True,
-        temperature: float = 0.7,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
         random_endpoint: bool = True,
         endpoint_id: str = "",
@@ -85,7 +85,7 @@ class MiniMaxChatClient(BaseChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[False] = False,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -104,7 +104,7 @@ class MiniMaxChatClient(BaseChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[True],
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -123,7 +123,7 @@ class MiniMaxChatClient(BaseChatClient):
         messages: list,
         model: str | None = None,
         stream: bool,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -140,7 +140,7 @@ class MiniMaxChatClient(BaseChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[False] | Literal[True] = False,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -198,6 +198,10 @@ class MiniMaxChatClient(BaseChatClient):
         else:
             top_p_params = {}
 
+        temperature_params = {}
+        if temperature:
+            temperature_params = {"temperature": temperature}
+
         if max_tokens is None:
             max_output_tokens = self.model_setting.max_output_tokens
             if max_output_tokens is not None:
@@ -223,9 +227,9 @@ class MiniMaxChatClient(BaseChatClient):
             "model": self.model_id,
             "messages": messages,
             "max_tokens": max_tokens,
-            "temperature": self.temperature,
             "stream": self.stream,
             "mask_sensitive_info": False,
+            **temperature_params,
             **top_p_params,
             **tools_params,
             **kwargs,
@@ -298,7 +302,7 @@ class AsyncMiniMaxChatClient(BaseAsyncChatClient):
         self,
         model: str = defs.MINIMAX_DEFAULT_MODEL,
         stream: bool = True,
-        temperature: float = 0.7,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
         random_endpoint: bool = True,
         endpoint_id: str = "",
@@ -332,7 +336,7 @@ class AsyncMiniMaxChatClient(BaseAsyncChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[False] = False,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -351,7 +355,7 @@ class AsyncMiniMaxChatClient(BaseAsyncChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[True],
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -370,7 +374,7 @@ class AsyncMiniMaxChatClient(BaseAsyncChatClient):
         messages: list,
         model: str | None = None,
         stream: bool,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -388,7 +392,7 @@ class AsyncMiniMaxChatClient(BaseAsyncChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[False] | Literal[True] = False,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -444,6 +448,10 @@ class AsyncMiniMaxChatClient(BaseAsyncChatClient):
         else:
             top_p_params = {}
 
+        temperature_params = {}
+        if temperature:
+            temperature_params = {"temperature": temperature}
+
         if max_tokens is None:
             max_output_tokens = self.model_setting.max_output_tokens
             if max_output_tokens is not None:
@@ -469,9 +477,9 @@ class AsyncMiniMaxChatClient(BaseAsyncChatClient):
             "model": self.model_id,
             "messages": messages,
             "max_tokens": max_tokens,
-            "temperature": self.temperature,
             "stream": self.stream,
             "mask_sensitive_info": False,
+            **temperature_params,
             **top_p_params,
             **tools_params,
             **kwargs,
@@ -38,7 +38,7 @@ class OpenAICompatibleChatClient(BaseChatClient):
         self,
         model: str = "",
         stream: bool = True,
-        temperature: float = 0.7,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
         random_endpoint: bool = True,
         endpoint_id: str = "",
@@ -88,7 +88,7 @@ class OpenAICompatibleChatClient(BaseChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[False] = False,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -107,7 +107,7 @@ class OpenAICompatibleChatClient(BaseChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[True],
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -126,7 +126,7 @@ class OpenAICompatibleChatClient(BaseChatClient):
         messages: list,
         model: str | None = None,
         stream: bool,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -144,7 +144,7 @@ class OpenAICompatibleChatClient(BaseChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[False] | Literal[True] = False,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -158,6 +158,8 @@ class OpenAICompatibleChatClient(BaseChatClient):
             self.model = model
         if stream is not None:
             self.stream = stream
+        if isinstance(temperature, AnthropicNotGiven):
+            temperature = NOT_GIVEN
         if temperature is not None:
             self.temperature = temperature
         if isinstance(top_p, AnthropicNotGiven):
@@ -233,6 +235,8 @@ class OpenAICompatibleChatClient(BaseChatClient):
                         completion_tokens=chunk.usage.completion_tokens or 0,
                         prompt_tokens=chunk.usage.prompt_tokens or 0,
                         total_tokens=chunk.usage.total_tokens or 0,
+                        prompt_tokens_details=chunk.usage.prompt_tokens_details,
+                        completion_tokens_details=chunk.usage.completion_tokens_details,
                     )
 
                     if len(chunk.choices) == 0:
@@ -279,6 +283,7 @@ class OpenAICompatibleChatClient(BaseChatClient):
 
             result = {
                 "content": response.choices[0].message.content,
+                "reasoning_content": getattr(response.choices[0].message, "reasoning_content", None),
                 "usage": response.usage.model_dump() if response.usage else None,
             }
             if tools:
@@ -305,7 +310,7 @@ class AsyncOpenAICompatibleChatClient(BaseAsyncChatClient):
         self,
         model: str = "",
         stream: bool = True,
-        temperature: float = 0.7,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         context_length_control: ContextLengthControlType = defs.CONTEXT_LENGTH_CONTROL,
         random_endpoint: bool = True,
         endpoint_id: str = "",
@@ -355,7 +360,7 @@ class AsyncOpenAICompatibleChatClient(BaseAsyncChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[False] = False,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -374,7 +379,7 @@ class AsyncOpenAICompatibleChatClient(BaseAsyncChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[True],
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -393,7 +398,7 @@ class AsyncOpenAICompatibleChatClient(BaseAsyncChatClient):
         messages: list,
         model: str | None = None,
         stream: bool,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -411,7 +416,7 @@ class AsyncOpenAICompatibleChatClient(BaseAsyncChatClient):
         messages: list,
         model: str | None = None,
         stream: Literal[False] | Literal[True] = False,
-        temperature: float | None = None,
+        temperature: float | None | NotGiven = NOT_GIVEN,
         max_tokens: int | None = None,
         tools: Iterable[ToolParam] | NotGiven = NOT_GIVEN,
         tool_choice: ToolChoice | NotGiven = NOT_GIVEN,
@@ -425,6 +430,8 @@ class AsyncOpenAICompatibleChatClient(BaseAsyncChatClient):
             self.model = model
         if stream is not None:
             self.stream = stream
+        if isinstance(temperature, AnthropicNotGiven):
+            temperature = NOT_GIVEN
         if temperature is not None:
             self.temperature = temperature
         if isinstance(top_p, AnthropicNotGiven):
@@ -500,6 +507,8 @@ class AsyncOpenAICompatibleChatClient(BaseAsyncChatClient):
                         completion_tokens=chunk.usage.completion_tokens or 0,
                         prompt_tokens=chunk.usage.prompt_tokens or 0,
                         total_tokens=chunk.usage.total_tokens or 0,
+                        completion_tokens_details=chunk.usage.completion_tokens_details,
+                        prompt_tokens_details=chunk.usage.prompt_tokens_details,
                     )
 
                     if len(chunk.choices) == 0:
@@ -546,6 +555,7 @@ class AsyncOpenAICompatibleChatClient(BaseAsyncChatClient):
             )
             result = {
                 "content": response.choices[0].message.content,
+                "reasoning_content": getattr(response.choices[0].message, "reasoning_content", None),
                 "usage": response.usage.model_dump() if response.usage else None,
             }
             if tools:
@@ -39,11 +39,18 @@ MOONSHOT_DEFAULT_MODEL: Final[str] = "moonshot-v1-8k"
 DEEPSEEK_MODELS: Final[Dict[str, Dict[str, Any]]] = {
     "deepseek-chat": {
         "id": "deepseek-chat",
-        "context_length": 128000,
-        "max_output_tokens": 4096,
+        "context_length": 64000,
+        "max_output_tokens": 8192,
         "function_call_available": True,
         "response_format_available": True,
     },
+    "deepseek-reasoner": {
+        "id": "deepseek-reasoner",
+        "context_length": 64000,
+        "max_output_tokens": 8192,
+        "function_call_available": False,
+        "response_format_available": False,
+    },
 }
 DEEPSEEK_DEFAULT_MODEL: Final[str] = "deepseek-chat"
 
@@ -812,4 +819,17 @@ XAI_MODELS: Final[Dict[str, Dict[str, Any]]] = {
         "function_call_available": True,
         "response_format_available": True,
     },
+    "grok-2-latest": {
+        "id": "grok-2-latest",
+        "context_length": 131072,
+        "function_call_available": True,
+        "response_format_available": True,
+    },
+    "grok-2-vision-latest": {
+        "id": "grok-2-vision-latest",
+        "context_length": 32768,
+        "function_call_available": True,
+        "response_format_available": True,
+        "native_multimodal": True,
+    },
 }
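
defaults.py revises deepseek-chat to a 64,000-token context window with 8,192 output tokens, adds a deepseek-reasoner entry with tool calling and response_format disabled, and registers the grok-2-latest and grok-2-vision-latest aliases. A quick sanity check against the new tables, as an illustrative sketch:

from vectorvein.types import defaults as defs

reasoner = defs.DEEPSEEK_MODELS["deepseek-reasoner"]
assert reasoner["context_length"] == 64000
assert reasoner["max_output_tokens"] == 8192
assert reasoner["function_call_available"] is False

grok_vision = defs.XAI_MODELS["grok-2-vision-latest"]
assert grok_vision["native_multimodal"] is True
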
@@ -13,6 +13,7 @@ from openai._types import NotGiven as OpenAINotGiven
 from openai._types import NOT_GIVEN as OPENAI_NOT_GIVEN
 from openai.types.chat.chat_completion_chunk import ChoiceDeltaToolCall
 from openai.types.chat.chat_completion_tool_param import ChatCompletionToolParam
+from openai.types.completion_usage import CompletionTokensDetails, PromptTokensDetails
 from openai.types.chat.chat_completion_message_tool_call import ChatCompletionMessageToolCall
 from openai.types.chat.chat_completion_stream_options_param import ChatCompletionStreamOptionsParam
 from openai.types.chat.chat_completion_tool_choice_option_param import ChatCompletionToolChoiceOptionParam
@@ -80,13 +81,23 @@ class BackendSettings(BaseModel):
 
 class Usage(BaseModel):
     completion_tokens: int
+
     prompt_tokens: int
+
     total_tokens: int
 
+    completion_tokens_details: Optional[CompletionTokensDetails] = None
+    """Breakdown of tokens used in a completion."""
+
+    prompt_tokens_details: Optional[PromptTokensDetails] = None
+    """Breakdown of tokens used in the prompt."""
+
 
 class ChatCompletionMessage(BaseModel):
     content: Optional[str] = None
 
+    reasoning_content: Optional[str] = None
+
     tool_calls: Optional[List[ChatCompletionMessageToolCall]] = None
     """The tool calls generated by the model, such as function calls."""
 
@@ -98,6 +109,8 @@ class ChatCompletionMessage(BaseModel):
 class ChatCompletionDeltaMessage(BaseModel):
     content: Optional[str] = None
 
+    reasoning_content: Optional[str] = None
+
     tool_calls: Optional[List[ChoiceDeltaToolCall]] = None
     """The tool calls generated by the model, such as function calls."""
 
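llm_parameters.py extends Usage with the optional prompt_tokens_details / completion_tokens_details breakdowns from openai.types.completion_usage, and both message models gain an optional reasoning_content field so output from reasoning models (for example deepseek-reasoner) is preserved. An illustrative construction with made-up values:

from vectorvein.types.llm_parameters import ChatCompletionMessage, Usage

message = ChatCompletionMessage(
    content="Final answer.",
    reasoning_content="Intermediate reasoning text, when the backend returns it.",
)
usage = Usage(prompt_tokens=12, completion_tokens=30, total_tokens=42)

# The new detail fields default to None, so payloads from backends that do
# not report them keep validating exactly as before.
assert usage.prompt_tokens_details is None
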
@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: vectorvein
-Version: 0.1.77
+Version: 0.1.78
 Summary: VectorVein python SDK
 Author-Email: Anderson <andersonby@163.com>
 License: MIT
@@ -1,20 +1,20 @@
-vectorvein-0.1.77.dist-info/METADATA,sha256=EGx61L2VDmmghx_inG3CK2RuFi3tp8H2VOprx_XuqSE,641
-vectorvein-0.1.77.dist-info/WHEEL,sha256=thaaA2w1JzcGC48WYufAs8nrYZjJm8LqNfnXFOFyCC4,90
-vectorvein-0.1.77.dist-info/entry_points.txt,sha256=6OYgBcLyFCUgeqLgnvMyOJxPCWzgy7se4rLPKtNonMs,34
+vectorvein-0.1.78.dist-info/METADATA,sha256=zoS7DULHUtC0Tygj-G517o8MD0QL8wLMoagcHU8qS7Q,641
+vectorvein-0.1.78.dist-info/WHEEL,sha256=thaaA2w1JzcGC48WYufAs8nrYZjJm8LqNfnXFOFyCC4,90
+vectorvein-0.1.78.dist-info/entry_points.txt,sha256=6OYgBcLyFCUgeqLgnvMyOJxPCWzgy7se4rLPKtNonMs,34
 vectorvein/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-vectorvein/chat_clients/__init__.py,sha256=Oev7Lv1DIEWCMD-2Pm7e2cwzX7JFQTnIK-j6o4iUuyQ,17725
-vectorvein/chat_clients/anthropic_client.py,sha256=Uy9E8t6hrYymNobRsPRCX5W-KsBXRun-8rAiRsN8M00,37217
+vectorvein/chat_clients/__init__.py,sha256=omQuG4PRRPNflSAgtdU--rwsWG6vMpwMEyIGZyFVHVQ,18596
+vectorvein/chat_clients/anthropic_client.py,sha256=PGIKldH4FnGrqozoY_FZ6LqhDHC-jY7NF5J1F1zT2Ok,38257
 vectorvein/chat_clients/baichuan_client.py,sha256=CVMvpgjdrZGv0BWnTOBD-f2ufZ3wq3496wqukumsAr4,526
-vectorvein/chat_clients/base_client.py,sha256=Dar-2b7YR13YcWlH6sLIrKNr9_6IrpdUMjdwVFQyu0Q,13350
+vectorvein/chat_clients/base_client.py,sha256=Rw-BYFxy86ohZQH8KABiXP6xuNQBjWC3JkeN6WsXfLw,13638
 vectorvein/chat_clients/deepseek_client.py,sha256=3qWu01NlJAP2N-Ff62d5-CZXZitlizE1fzb20LNetig,526
-vectorvein/chat_clients/gemini_client.py,sha256=BsOhK4LI04pxak6wtmSju63it2P-zzIAXhCtgC6DfOQ,20453
+vectorvein/chat_clients/gemini_client.py,sha256=qqqjQ9X8sIgJaT8xgvtG_cY-lmNGzA_f9V4tUcGRcBo,20853
 vectorvein/chat_clients/groq_client.py,sha256=Uow4pgdmFi93ZQSoOol2-0PhhqkW-S0XuSldvppz5U4,498
 vectorvein/chat_clients/local_client.py,sha256=55nOsxzqUf79q3Y14MKROA71zxhsT7p7FsDZ89rts2M,422
-vectorvein/chat_clients/minimax_client.py,sha256=TOfYDLJvs9JWSyU7S8V5SV3ozOC8anI2QEDdKy29HMk,19633
+vectorvein/chat_clients/minimax_client.py,sha256=ooJU92UCACC4TVWKJ-uo8vqQ8qF3K14ziAuSFm8Wj3M,20025
 vectorvein/chat_clients/mistral_client.py,sha256=1aKSylzBDaLYcFnaBIL4-sXSzWmXfBeON9Q0rq-ziWw,534
 vectorvein/chat_clients/moonshot_client.py,sha256=gbu-6nGxx8uM_U2WlI4Wus881rFRotzHtMSoYOcruGU,526
 vectorvein/chat_clients/openai_client.py,sha256=Nz6tV45pWcsOupxjnsRsGTicbQNJWIZyxuJoJ5DGMpg,527
-vectorvein/chat_clients/openai_compatible_client.py,sha256=tL_pj8OFhSo3yvHQxshjO695pTesaOrHLGVnkmfQZqw,22953
+vectorvein/chat_clients/openai_compatible_client.py,sha256=nuBcsoPOuv6fKs8wb5uE2tVeqGWwZfRu_DuFaukEQSg,23881
 vectorvein/chat_clients/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 vectorvein/chat_clients/qwen_client.py,sha256=-ryh-m9PgsO0fc4ulcCmPTy1155J8YUy15uPoJQOHA0,513
 vectorvein/chat_clients/stepfun_client.py,sha256=zsD2W5ahmR4DD9cqQTXmJr3txrGuvxbRWhFlRdwNijI,519
@@ -26,11 +26,11 @@ vectorvein/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 vectorvein/server/token_server.py,sha256=36F9PKSNOX8ZtYBXY_l-76GQTpUSmQ2Y8EMy1H7wtdQ,1353
 vectorvein/settings/__init__.py,sha256=g01y74x0k2JEAqNpRGG0PDs0NTULjOAZV6HRhydPX1c,3874
 vectorvein/settings/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-vectorvein/types/defaults.py,sha256=4qF31QJSFexF8E-Og8aGM0wCzegtPe65vxd8VQj7oKA,25579
+vectorvein/types/defaults.py,sha256=LB6G8RoWWDdZkFw0EGTpLxFXlV557BBTzmUXgNDhlUk,26227
 vectorvein/types/enums.py,sha256=7KTJSVtQueImmbr1fSwv3rQVtc0RyMWXJmoE2tDOaso,1667
 vectorvein/types/exception.py,sha256=gnW4GnJ76jND6UGnodk9xmqkcbeS7Cz2rvncA2HpD5E,69
-vectorvein/types/llm_parameters.py,sha256=I-b__6OZhobxneSOTWfoug2xJr6HBljanHVXU6cByUM,5447
+vectorvein/types/llm_parameters.py,sha256=CLhDSp9KI_zzjIXUvjiTuGxfYXpubTNBCVcJ6RgH2iY,5879
 vectorvein/types/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 vectorvein/utilities/media_processing.py,sha256=CTRq-lGlFkFgP_FSRhNwF_qUgmOrXPf2_1Ok9HY42_g,5887
 vectorvein/utilities/retry.py,sha256=6KFS9R2HdhqM3_9jkjD4F36ZSpEx2YNFGOVlpOsUetM,2208
-vectorvein-0.1.77.dist-info/RECORD,,
+vectorvein-0.1.78.dist-info/RECORD,,