openaivec 0.13.4__py3-none-any.whl → 0.13.6__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- openaivec/embeddings.py +10 -8
- openaivec/model.py +9 -11
- openaivec/optimize.py +1 -1
- openaivec/pandas_ext.py +61 -42
- openaivec/prompt.py +58 -8
- openaivec/provider.py +10 -0
- openaivec/proxy.py +82 -65
- openaivec/responses.py +35 -18
- openaivec/spark.py +40 -34
- openaivec/task/customer_support/inquiry_classification.py +9 -9
- openaivec/task/customer_support/urgency_analysis.py +13 -13
- openaivec/task/nlp/keyword_extraction.py +2 -2
- openaivec/task/nlp/named_entity_recognition.py +2 -2
- openaivec/util.py +2 -2
- {openaivec-0.13.4.dist-info → openaivec-0.13.6.dist-info}/METADATA +9 -9
- {openaivec-0.13.4.dist-info → openaivec-0.13.6.dist-info}/RECORD +18 -18
- {openaivec-0.13.4.dist-info → openaivec-0.13.6.dist-info}/WHEEL +0 -0
- {openaivec-0.13.4.dist-info → openaivec-0.13.6.dist-info}/licenses/LICENSE +0 -0
openaivec/embeddings.py
CHANGED
@@ -31,16 +31,17 @@ class BatchEmbeddings:

     client: OpenAI
     model_name: str
-    cache: BatchingMapProxy[str, NDArray[np.float32]] = field(default_factory=lambda: BatchingMapProxy(batch_size=
+    cache: BatchingMapProxy[str, NDArray[np.float32]] = field(default_factory=lambda: BatchingMapProxy(batch_size=None))

     @classmethod
-    def of(cls, client: OpenAI, model_name: str, batch_size: int =
+    def of(cls, client: OpenAI, model_name: str, batch_size: int | None = None) -> "BatchEmbeddings":
         """Factory constructor.

         Args:
             client (OpenAI): OpenAI client.
             model_name (str): For Azure OpenAI, use your deployment name. For OpenAI, use the model name.
-            batch_size (int, optional): Max unique inputs per API call. Defaults to
+            batch_size (int | None, optional): Max unique inputs per API call. Defaults to None
+                (automatic batch size optimization). Set to a positive integer for fixed batch size.

         Returns:
             BatchEmbeddings: Configured instance backed by a batching proxy.
@@ -127,7 +128,7 @@ class AsyncBatchEmbeddings:
     client: AsyncOpenAI
     model_name: str
     cache: AsyncBatchingMapProxy[str, NDArray[np.float32]] = field(
-        default_factory=lambda: AsyncBatchingMapProxy(batch_size=
+        default_factory=lambda: AsyncBatchingMapProxy(batch_size=None, max_concurrency=8)
     )

     @classmethod
@@ -135,7 +136,7 @@ class AsyncBatchEmbeddings:
         cls,
         client: AsyncOpenAI,
         model_name: str,
-        batch_size: int =
+        batch_size: int | None = None,
         max_concurrency: int = 8,
     ) -> "AsyncBatchEmbeddings":
         """Factory constructor.
@@ -143,7 +144,8 @@ class AsyncBatchEmbeddings:
         Args:
             client (AsyncOpenAI): OpenAI async client.
             model_name (str): For Azure OpenAI, use your deployment name. For OpenAI, use the model name.
-            batch_size (int, optional): Max unique inputs per API call. Defaults to
+            batch_size (int | None, optional): Max unique inputs per API call. Defaults to None
+                (automatic batch size optimization). Set to a positive integer for fixed batch size.
             max_concurrency (int, optional): Max concurrent API calls. Defaults to 8.

         Returns:
@@ -155,8 +157,8 @@ class AsyncBatchEmbeddings:
             cache=AsyncBatchingMapProxy(batch_size=batch_size, max_concurrency=max_concurrency),
         )

-    @observe(_LOGGER)
     @backoff_async(exceptions=[RateLimitError, InternalServerError], scale=1, max_retries=12)
+    @observe(_LOGGER)
     async def _embed_chunk(self, inputs: List[str]) -> List[NDArray[np.float32]]:
         """Embed one minibatch of strings asynchronously.

@@ -186,4 +188,4 @@ class AsyncBatchEmbeddings:
         Returns:
             List[NDArray[np.float32]]: Embedding vectors aligned to ``inputs``.
         """
-        return await self.cache.map(inputs, self._embed_chunk)
+        return await self.cache.map(inputs, self._embed_chunk)  # type: ignore[arg-type]
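
The upshot of these hunks: `batch_size` now defaults to `None`, which hands chunk sizing to the batching proxy's automatic optimization, and the decorator order on `_embed_chunk` was swapped so that `backoff_async` is now the outermost wrapper (each retry attempt passes through the `observe` logging layer). A minimal sketch of the new call pattern, using only the `of(...)` signatures shown above; the client construction and model name are illustrative:

```python
from openai import AsyncOpenAI, OpenAI

from openaivec.embeddings import AsyncBatchEmbeddings, BatchEmbeddings

# Omitting batch_size now means "let the proxy pick": the BatchingMapProxy
# receives batch_size=None and sizes chunks automatically.
sync_embedder = BatchEmbeddings.of(client=OpenAI(), model_name="text-embedding-3-small")

# A positive integer opts back into fixed-size batches; max_concurrency
# still bounds parallel API calls on the async variant.
async_embedder = AsyncBatchEmbeddings.of(
    client=AsyncOpenAI(),
    model_name="text-embedding-3-small",
    batch_size=64,
    max_concurrency=8,
)
```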
openaivec/model.py
CHANGED
@@ -1,13 +1,11 @@
 from dataclasses import dataclass
-from typing import Type, TypeVar
+from typing import Generic, Type, TypeVar

-
-
-ResponseFormat = TypeVar("ResponseFormat", bound=BaseModel | str)
+ResponseFormat = TypeVar("ResponseFormat")


 @dataclass(frozen=True)
-class PreparedTask:
+class PreparedTask(Generic[ResponseFormat]):
     """A data class representing a complete task configuration for OpenAI API calls.

     This class encapsulates all the necessary parameters for executing a task,
@@ -84,10 +82,10 @@ class OpenAIAPIKey:
     """Container for OpenAI API key configuration.

     Attributes:
-        value (str): The API key for OpenAI services.
+        value (str | None): The API key for OpenAI services.
     """

-    value: str
+    value: str | None


 @dataclass(frozen=True)
@@ -95,10 +93,10 @@ class AzureOpenAIAPIKey:
     """Container for Azure OpenAI API key configuration.

     Attributes:
-        value (str): The API key for Azure OpenAI services.
+        value (str | None): The API key for Azure OpenAI services.
     """

-    value: str
+    value: str | None


 @dataclass(frozen=True)
@@ -106,10 +104,10 @@ class AzureOpenAIBaseURL:
     """Container for Azure OpenAI base URL configuration.

     Attributes:
-        value (str): The base URL for Azure OpenAI services.
+        value (str | None): The base URL for Azure OpenAI services.
     """

-    value: str
+    value: str | None


 @dataclass(frozen=True)
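
With `PreparedTask` now `Generic[ResponseFormat]` (and the TypeVar unbounded), annotations can carry a task's response type through to consumers. A hypothetical sketch; the constructor fields of `PreparedTask` are not shown in these hunks, so only type annotations are used:

```python
from pydantic import BaseModel

from openaivec.model import PreparedTask


class Sentiment(BaseModel):
    label: str
    score: float


# A type checker now knows this task yields Sentiment instances rather than
# an unparameterized result.
def consume(task: PreparedTask[Sentiment]) -> None: ...


# Dropping the old bound (BaseModel | str) admits any response type, e.g.
# PreparedTask[str] for plain-text tasks.
def consume_plain(task: PreparedTask[str]) -> None: ...
```

The `value: str | None` loosening on the credential containers pairs with the provider.py changes below, where presence is checked at client-construction time.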
openaivec/optimize.py
CHANGED
@@ -21,7 +21,7 @@ class BatchSizeSuggester:
     min_duration: float = 30.0
     max_duration: float = 60.0
     step_ratio: float = 0.1
-    sample_size: int =
+    sample_size: int = 4
     _history: List[PerformanceMetric] = field(default_factory=list)
     _lock: threading.RLock = field(default_factory=threading.RLock, repr=False)
     _batch_size_changed_at: datetime | None = field(default=None, init=False)
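
Only the `sample_size` default (now 4) changes here, but the surrounding fields hint at the mechanism: the suggester watches recent call durations and nudges the batch size by `step_ratio` to keep batches inside the 30–60 s window. A conceptual sketch, not the library's implementation, built only from the fields visible in this hunk:

```python
# Illustrative only: grow the batch when the last `sample_size` calls finish
# too quickly, shrink it when they run too long.
def suggest(current: int, durations: list[float],
            min_duration: float = 30.0, max_duration: float = 60.0,
            step_ratio: float = 0.1, sample_size: int = 4) -> int:
    if len(durations) < sample_size:
        return current                                   # not enough samples yet
    avg = sum(durations[-sample_size:]) / sample_size
    if avg < min_duration:
        return max(1, int(current * (1 + step_ratio)))   # room to grow
    if avg > max_duration:
        return max(1, int(current * (1 - step_ratio)))   # back off
    return current
```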
openaivec/pandas_ext.py
CHANGED
@@ -42,7 +42,7 @@ to easily interact with OpenAI APIs for tasks like generating responses or embed
 import inspect
 import json
 import logging
-from typing import
+from typing import Awaitable, Callable, List, Type, TypeVar

 import numpy as np
 import pandas as pd
@@ -184,6 +184,7 @@ class OpenAIVecSeriesAccessor:
         Args:
             cache (BatchingMapProxy[str, np.ndarray]): Pre-configured cache
                 instance for managing API call batching and deduplication.
+                Set cache.batch_size=None to enable automatic batch size optimization.

         Returns:
             pandas.Series: Series whose values are ``np.ndarray`` objects
@@ -217,7 +218,7 @@ class OpenAIVecSeriesAccessor:
         self,
         instructions: str,
         response_format: Type[ResponseFormat] = str,
-        batch_size: int =
+        batch_size: int | None = None,
         temperature: float | None = 0.0,
         top_p: float = 1.0,
         show_progress: bool = False,
@@ -247,8 +248,9 @@ class OpenAIVecSeriesAccessor:
             instructions (str): System prompt prepended to every user message.
             response_format (Type[ResponseFormat], optional): Pydantic model or built‑in
                 type the assistant should return. Defaults to ``str``.
-            batch_size (int, optional): Number of prompts grouped into a single
-                request. Defaults to ``
+            batch_size (int | None, optional): Number of prompts grouped into a single
+                request. Defaults to ``None`` (automatic batch size optimization
+                based on execution time). Set to a positive integer for fixed batch size.
             temperature (float, optional): Sampling temperature. Defaults to ``0.0``.
             top_p (float, optional): Nucleus sampling parameter. Defaults to ``1.0``.
             show_progress (bool, optional): Show progress bar in Jupyter notebooks. Defaults to ``False``.
@@ -266,7 +268,7 @@ class OpenAIVecSeriesAccessor:

     def task_with_cache(
         self,
-        task: PreparedTask,
+        task: PreparedTask[ResponseFormat],
         cache: BatchingMapProxy[str, ResponseFormat],
     ) -> pd.Series:
         """Execute a prepared task on every Series element using a provided cache.
@@ -280,6 +282,7 @@ class OpenAIVecSeriesAccessor:
                 response format, and other parameters for processing the inputs.
             cache (BatchingMapProxy[str, ResponseFormat]): Pre-configured cache
                 instance for managing API call batching and deduplication.
+                Set cache.batch_size=None to enable automatic batch size optimization.

         Returns:
             pandas.Series: Series whose values are instances of the task's
@@ -311,7 +314,7 @@ class OpenAIVecSeriesAccessor:
         )
         return pd.Series(client.parse(self._obj.tolist()), index=self._obj.index, name=self._obj.name)

-    def task(self, task: PreparedTask, batch_size: int =
+    def task(self, task: PreparedTask, batch_size: int | None = None, show_progress: bool = False) -> pd.Series:
         """Execute a prepared task on every Series element.

         This method applies a pre-configured task to each element in the Series,
@@ -343,8 +346,9 @@ class OpenAIVecSeriesAccessor:
         Args:
             task (PreparedTask): A pre-configured task containing instructions,
                 response format, and other parameters for processing the inputs.
-            batch_size (int, optional): Number of prompts grouped into a single
-                request to optimize API usage. Defaults to
+            batch_size (int | None, optional): Number of prompts grouped into a single
+                request to optimize API usage. Defaults to ``None`` (automatic batch size
+                optimization based on execution time). Set to a positive integer for fixed batch size.
             show_progress (bool, optional): Show progress bar in Jupyter notebooks. Defaults to ``False``.

         Returns:
@@ -356,7 +360,7 @@ class OpenAIVecSeriesAccessor:
             cache=BatchingMapProxy(batch_size=batch_size, show_progress=show_progress),
         )

-    def embeddings(self, batch_size: int =
+    def embeddings(self, batch_size: int | None = None, show_progress: bool = False) -> pd.Series:
         """Compute OpenAI embeddings for every Series element.

         Example:
@@ -378,8 +382,9 @@ class OpenAIVecSeriesAccessor:
         The default embedding model is `text-embedding-3-small`.

         Args:
-            batch_size (int, optional): Number of inputs grouped into a
-                single request. Defaults to ``
+            batch_size (int | None, optional): Number of inputs grouped into a
+                single request. Defaults to ``None`` (automatic batch size optimization
+                based on execution time). Set to a positive integer for fixed batch size.
             show_progress (bool, optional): Show progress bar in Jupyter notebooks. Defaults to ``False``.

         Returns:
@@ -494,6 +499,7 @@ class OpenAIVecDataFrameAccessor:
             instructions (str): System prompt for the assistant.
             cache (BatchingMapProxy[str, ResponseFormat]): Pre-configured cache
                 instance for managing API call batching and deduplication.
+                Set cache.batch_size=None to enable automatic batch size optimization.
             response_format (Type[ResponseFormat], optional): Desired Python type of the
                 responses. Defaults to ``str``.
             temperature (float, optional): Sampling temperature. Defaults to ``0.0``.
@@ -538,7 +544,7 @@ class OpenAIVecDataFrameAccessor:
         self,
         instructions: str,
         response_format: Type[ResponseFormat] = str,
-        batch_size: int =
+        batch_size: int | None = None,
         temperature: float | None = 0.0,
         top_p: float = 1.0,
         show_progress: bool = False,
@@ -573,8 +579,9 @@ class OpenAIVecDataFrameAccessor:
             instructions (str): System prompt for the assistant.
             response_format (Type[ResponseFormat], optional): Desired Python type of the
                 responses. Defaults to ``str``.
-            batch_size (int, optional): Number of requests sent in one batch.
-                Defaults to ``
+            batch_size (int | None, optional): Number of requests sent in one batch.
+                Defaults to ``None`` (automatic batch size optimization
+                based on execution time). Set to a positive integer for fixed batch size.
             temperature (float, optional): Sampling temperature. Defaults to ``0.0``.
             top_p (float, optional): Nucleus sampling parameter. Defaults to ``1.0``.
             show_progress (bool, optional): Show progress bar in Jupyter notebooks. Defaults to ``False``.
@@ -590,7 +597,7 @@ class OpenAIVecDataFrameAccessor:
             top_p=top_p,
         )

-    def task(self, task: PreparedTask, batch_size: int =
+    def task(self, task: PreparedTask, batch_size: int | None = None, show_progress: bool = False) -> pd.Series:
         """Execute a prepared task on each DataFrame row after serialising it to JSON.

         This method applies a pre-configured task to each row in the DataFrame,
@@ -618,8 +625,9 @@ class OpenAIVecDataFrameAccessor:
         Args:
             task (PreparedTask): A pre-configured task containing instructions,
                 response format, and other parameters for processing the inputs.
-            batch_size (int, optional): Number of requests sent in one batch
-                to optimize API usage. Defaults to
+            batch_size (int | None, optional): Number of requests sent in one batch
+                to optimize API usage. Defaults to ``None`` (automatic batch size
+                optimization based on execution time). Set to a positive integer for fixed batch size.
             show_progress (bool, optional): Show progress bar in Jupyter notebooks. Defaults to ``False``.

         Returns:
@@ -634,7 +642,7 @@ class OpenAIVecDataFrameAccessor:
             )
         )

-    def fillna(self, target_column_name: str, max_examples: int = 500, batch_size: int =
+    def fillna(self, target_column_name: str, max_examples: int = 500, batch_size: int | None = None) -> pd.DataFrame:
         """Fill missing values in a DataFrame column using AI-powered inference.

         This method uses machine learning to intelligently fill missing (NaN) values
@@ -648,8 +656,9 @@ class OpenAIVecDataFrameAccessor:
             max_examples (int, optional): The maximum number of example rows to use
                 for context when predicting missing values. Higher values may improve
                 accuracy but increase API costs and processing time. Defaults to 500.
-            batch_size (int, optional): Number of requests sent in one batch
-                to optimize API usage. Defaults to
+            batch_size (int | None, optional): Number of requests sent in one batch
+                to optimize API usage. Defaults to ``None`` (automatic batch size
+                optimization based on execution time). Set to a positive integer for fixed batch size.

         Returns:
             pandas.DataFrame: A new DataFrame with missing values filled in the target
@@ -721,7 +730,7 @@ class OpenAIVecDataFrameAccessor:
         return self._obj.apply(
             lambda row: np.dot(row[col1], row[col2]) / (np.linalg.norm(row[col1]) * np.linalg.norm(row[col2])),
             axis=1,
-        ).rename("similarity")
+        ).rename("similarity")  # type: ignore[arg-type]


 @pd.api.extensions.register_series_accessor("aio")
@@ -750,6 +759,7 @@ class AsyncOpenAIVecSeriesAccessor:
             instructions (str): System prompt prepended to every user message.
             cache (AsyncBatchingMapProxy[str, ResponseFormat]): Pre-configured cache
                 instance for managing API call batching and deduplication.
+                Set cache.batch_size=None to enable automatic batch size optimization.
             response_format (Type[ResponseFormat], optional): Pydantic model or built‑in
                 type the assistant should return. Defaults to ``str``.
             temperature (float, optional): Sampling temperature. Defaults to ``0.0``.
@@ -804,6 +814,7 @@ class AsyncOpenAIVecSeriesAccessor:
         Args:
             cache (AsyncBatchingMapProxy[str, np.ndarray]): Pre-configured cache
                 instance for managing API call batching and deduplication.
+                Set cache.batch_size=None to enable automatic batch size optimization.

         Returns:
             pandas.Series: Series whose values are ``np.ndarray`` objects
@@ -844,7 +855,7 @@ class AsyncOpenAIVecSeriesAccessor:

     async def task_with_cache(
         self,
-        task: PreparedTask,
+        task: PreparedTask[ResponseFormat],
         cache: AsyncBatchingMapProxy[str, ResponseFormat],
     ) -> pd.Series:
         """Execute a prepared task on every Series element using a provided cache (asynchronously).
@@ -859,6 +870,7 @@ class AsyncOpenAIVecSeriesAccessor:
                 response format, and other parameters for processing the inputs.
             cache (AsyncBatchingMapProxy[str, ResponseFormat]): Pre-configured cache
                 instance for managing API call batching and deduplication.
+                Set cache.batch_size=None to enable automatic batch size optimization.

         Returns:
             pandas.Series: Series whose values are instances of the task's
@@ -902,7 +914,7 @@ class AsyncOpenAIVecSeriesAccessor:
         self,
         instructions: str,
         response_format: Type[ResponseFormat] = str,
-        batch_size: int =
+        batch_size: int | None = None,
         temperature: float | None = 0.0,
         top_p: float = 1.0,
         max_concurrency: int = 8,
@@ -934,8 +946,9 @@ class AsyncOpenAIVecSeriesAccessor:
             instructions (str): System prompt prepended to every user message.
             response_format (Type[ResponseFormat], optional): Pydantic model or built‑in
                 type the assistant should return. Defaults to ``str``.
-            batch_size (int, optional): Number of prompts grouped into a single
-                request. Defaults to ``
+            batch_size (int | None, optional): Number of prompts grouped into a single
+                request. Defaults to ``None`` (automatic batch size optimization
+                based on execution time). Set to a positive integer for fixed batch size.
             temperature (float, optional): Sampling temperature. Defaults to ``0.0``.
             top_p (float, optional): Nucleus sampling parameter. Defaults to ``1.0``.
             max_concurrency (int, optional): Maximum number of concurrent
@@ -959,7 +972,7 @@ class AsyncOpenAIVecSeriesAccessor:
         )

     async def embeddings(
-        self, batch_size: int =
+        self, batch_size: int | None = None, max_concurrency: int = 8, show_progress: bool = False
     ) -> pd.Series:
         """Compute OpenAI embeddings for every Series element (asynchronously).

@@ -983,8 +996,9 @@ class AsyncOpenAIVecSeriesAccessor:
         The default embedding model is `text-embedding-3-small`.

         Args:
-            batch_size (int, optional): Number of inputs grouped into a
-                single request. Defaults to ``
+            batch_size (int | None, optional): Number of inputs grouped into a
+                single request. Defaults to ``None`` (automatic batch size optimization
+                based on execution time). Set to a positive integer for fixed batch size.
             max_concurrency (int, optional): Maximum number of concurrent
                 requests. Defaults to ``8``.
             show_progress (bool, optional): Show progress bar in Jupyter notebooks. Defaults to ``False``.
@@ -1003,7 +1017,7 @@ class AsyncOpenAIVecSeriesAccessor:
         )

     async def task(
-        self, task: PreparedTask, batch_size: int =
+        self, task: PreparedTask, batch_size: int | None = None, max_concurrency: int = 8, show_progress: bool = False
     ) -> pd.Series:
         """Execute a prepared task on every Series element (asynchronously).

@@ -1037,8 +1051,9 @@ class AsyncOpenAIVecSeriesAccessor:
         Args:
             task (PreparedTask): A pre-configured task containing instructions,
                 response format, and other parameters for processing the inputs.
-            batch_size (int, optional): Number of prompts grouped into a single
-                request to optimize API usage. Defaults to
+            batch_size (int | None, optional): Number of prompts grouped into a single
+                request to optimize API usage. Defaults to ``None`` (automatic batch size
+                optimization based on execution time). Set to a positive integer for fixed batch size.
             max_concurrency (int, optional): Maximum number of concurrent
                 requests. Defaults to 8.
             show_progress (bool, optional): Show progress bar in Jupyter notebooks. Defaults to ``False``.
@@ -1084,6 +1099,7 @@ class AsyncOpenAIVecDataFrameAccessor:
             instructions (str): System prompt for the assistant.
             cache (AsyncBatchingMapProxy[str, ResponseFormat]): Pre-configured cache
                 instance for managing API call batching and deduplication.
+                Set cache.batch_size=None to enable automatic batch size optimization.
             response_format (Type[ResponseFormat], optional): Desired Python type of the
                 responses. Defaults to ``str``.
             temperature (float, optional): Sampling temperature. Defaults to ``0.0``.
@@ -1134,7 +1150,7 @@ class AsyncOpenAIVecDataFrameAccessor:
         self,
         instructions: str,
         response_format: Type[ResponseFormat] = str,
-        batch_size: int =
+        batch_size: int | None = None,
         temperature: float | None = 0.0,
         top_p: float = 1.0,
         max_concurrency: int = 8,
@@ -1171,8 +1187,9 @@ class AsyncOpenAIVecDataFrameAccessor:
             instructions (str): System prompt for the assistant.
             response_format (Type[ResponseFormat], optional): Desired Python type of the
                 responses. Defaults to ``str``.
-            batch_size (int, optional): Number of requests sent in one batch.
-                Defaults to ``
+            batch_size (int | None, optional): Number of requests sent in one batch.
+                Defaults to ``None`` (automatic batch size optimization
+                based on execution time). Set to a positive integer for fixed batch size.
             temperature (float, optional): Sampling temperature. Defaults to ``0.0``.
             top_p (float, optional): Nucleus sampling parameter. Defaults to ``1.0``.
             max_concurrency (int, optional): Maximum number of concurrent
@@ -1196,7 +1213,7 @@ class AsyncOpenAIVecDataFrameAccessor:
         )

     async def task(
-        self, task: PreparedTask, batch_size: int =
+        self, task: PreparedTask, batch_size: int | None = None, max_concurrency: int = 8, show_progress: bool = False
     ) -> pd.Series:
         """Execute a prepared task on each DataFrame row after serialising it to JSON (asynchronously).

@@ -1235,8 +1252,9 @@ class AsyncOpenAIVecDataFrameAccessor:
         Args:
             task (PreparedTask): A pre-configured task containing instructions,
                 response format, and other parameters for processing the inputs.
-            batch_size (int, optional): Number of requests sent in one batch
-                to optimize API usage. Defaults to
+            batch_size (int | None, optional): Number of requests sent in one batch
+                to optimize API usage. Defaults to ``None`` (automatic batch size
+                optimization based on execution time). Set to a positive integer for fixed batch size.
             max_concurrency (int, optional): Maximum number of concurrent
                 requests. Defaults to 8.
             show_progress (bool, optional): Show progress bar in Jupyter notebooks. Defaults to ``False``.
@@ -1286,7 +1304,7 @@ class AsyncOpenAIVecDataFrameAccessor:
         else:
             return result

-    async def assign(self, **kwargs
+    async def assign(self, **kwargs) -> pd.DataFrame:
         """Asynchronously assign new columns to the DataFrame, evaluating sequentially.

         This method extends pandas' `assign` method by supporting asynchronous
@@ -1321,7 +1339,7 @@ class AsyncOpenAIVecDataFrameAccessor:
         ```

         Args:
-            **kwargs:
+            **kwargs: Column names as keys and either static values or callables
                 (synchronous or asynchronous) as values.

         Returns:
@@ -1346,7 +1364,7 @@ class AsyncOpenAIVecDataFrameAccessor:
         return df_current

     async def fillna(
-        self, target_column_name: str, max_examples: int = 500, batch_size: int =
+        self, target_column_name: str, max_examples: int = 500, batch_size: int | None = None, max_concurrency: int = 8
     ) -> pd.DataFrame:
         """Fill missing values in a DataFrame column using AI-powered inference (asynchronously).

@@ -1361,8 +1379,9 @@ class AsyncOpenAIVecDataFrameAccessor:
             max_examples (int, optional): The maximum number of example rows to use
                 for context when predicting missing values. Higher values may improve
                 accuracy but increase API costs and processing time. Defaults to 500.
-            batch_size (int, optional): Number of requests sent in one batch
-                to optimize API usage. Defaults to
+            batch_size (int | None, optional): Number of requests sent in one batch
+                to optimize API usage. Defaults to ``None`` (automatic batch size
+                optimization based on execution time). Set to a positive integer for fixed batch size.
             max_concurrency (int, optional): Maximum number of concurrent
                 requests. Defaults to 8.

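
Across both accessors the pattern is uniform: omit `batch_size` and the proxy sizes batches from observed execution time; pass an integer for fixed batches. A sketch of the resulting call sites, assuming the synchronous accessor is registered as `.ai` and the response method is named `responses` (only the async `.aio` registration and truncated signatures appear in these hunks):

```python
import pandas as pd

s = pd.Series(["good", "bad", "mixed feelings"])

# batch_size defaults to None: automatic batch size optimization.
labels = s.ai.responses("Classify the sentiment of each text.")
vectors = s.ai.embeddings(show_progress=True)


# The async variant keeps explicit knobs; this signature is shown verbatim
# in the hunks above.
async def embed_fixed() -> pd.Series:
    return await s.aio.embeddings(batch_size=32, max_concurrency=8, show_progress=True)
```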
openaivec/prompt.py
CHANGED
@@ -44,7 +44,7 @@ this will produce an XML string that looks like this:

 import difflib
 import logging
-from typing import
+from typing import List
 from xml.etree import ElementTree

 from openai import OpenAI
@@ -126,6 +126,7 @@ _PROMPT: str = """
     Receive the prompt in JSON format with fields "purpose",
     "cautions", and "examples". Ensure the entire prompt is free
     from logical contradictions, redundancies, and ambiguities.
+    IMPORTANT: The "examples" array must always contain at least one example throughout all iterations.
   </Instruction>
   <Instruction id="2">
     - Modify only one element per iteration among “purpose”, “examples”, or
@@ -155,8 +156,10 @@ _PROMPT: str = """
   </Instruction>
   <Instruction id="6">
     In the "examples" field, enhance the examples to cover a wide range of scenarios.
+    CRITICAL: The examples array must NEVER be empty - always maintain at least one example.
     Add as many non-redundant examples as possible,
     since having more examples leads to better coverage and understanding.
+    You may modify existing examples or add new ones, but never remove all examples.
   </Instruction>
   <Instruction id="7">
     Verify that the improved prompt adheres to the Request and
@@ -166,6 +169,7 @@ _PROMPT: str = """
     Generate the final refined FewShotPrompt as an iteration in
     the Response, ensuring the final output is consistent,
     unambiguous, and free from any redundancies or contradictions.
+    MANDATORY: Verify that the examples array contains at least one example before completing.
   </Instruction>
 </Instructions>
 <Example>
@@ -339,11 +343,29 @@ def _render_prompt(prompt: FewShotPrompt) -> str:


 class FewShotPromptBuilder:
+    """Builder for creating few-shot prompts with validation.
+
+    Usage:
+        builder = (FewShotPromptBuilder()
+            .purpose("Your task description")
+            .example("input1", "output1")  # At least one required
+            .example("input2", "output2")
+            .build())
+
+    Note:
+        Both .purpose() and at least one .example() call are required before
+        calling .build(), .improve(), or .get_object().
+    """
+
     _prompt: FewShotPrompt
     _steps: List[Step]

     def __init__(self):
-        """Initialize an empty FewShotPromptBuilder.
+        """Initialize an empty FewShotPromptBuilder.
+
+        Note:
+            You must call .purpose() and at least one .example() before building.
+        """
         self._prompt = FewShotPrompt(purpose="", cautions=[], examples=[])

     @classmethod
@@ -402,6 +424,8 @@ class FewShotPromptBuilder:
     ) -> "FewShotPromptBuilder":
         """Add a single input/output example.

+        At least one example is required before calling .build(), .improve(), or .get_object().
+
         Args:
             input_value (str | BaseModel): Example input; if a Pydantic model is
                 provided it is serialised to JSON.
@@ -442,7 +466,13 @@ class FewShotPromptBuilder:

         Returns:
             FewShotPromptBuilder: The current builder instance containing the refined prompt and iteration history.
+
+        Raises:
+            ValueError: If the prompt is not valid (missing purpose or examples).
         """
+        # Validate before making API call to provide early feedback
+        self._validate()
+
         _client = client or CONTAINER.resolve(OpenAI)
         _model_name = model_name or CONTAINER.resolve(ResponsesModelName).value

@@ -459,12 +489,25 @@ class FewShotPromptBuilder:
         self._steps = [Step(id=0, analysis="Original Prompt", prompt=self._prompt)]

         # add the histories
-
-
+        if response.output_parsed:
+            for step in response.output_parsed.iterations:
+                self._steps.append(step)

         # set the final prompt
         self._prompt = self._steps[-1].prompt

+        # Validate the improved prompt to ensure examples weren't removed by LLM
+        try:
+            self._validate()
+        except ValueError as e:
+            _logger.warning(f"LLM produced invalid prompt during improve(): {e}")
+            # Restore original prompt if LLM produced invalid result
+            self._prompt = self._steps[0].prompt
+            raise ValueError(
+                f"LLM improvement failed to maintain required fields: {e}. "
+                "This may indicate an issue with the improvement instructions or model behavior."
+            )
+
         return self

     def explain(self) -> "FewShotPromptBuilder":
@@ -500,9 +543,14 @@ class FewShotPromptBuilder:
         """
         # Validate that 'purpose' and 'examples' are not empty.
         if not self._prompt.purpose:
-            raise ValueError(
+            raise ValueError(
+                "Purpose is required. Please call .purpose('your purpose description') before building the prompt."
+            )
         if not self._prompt.examples or len(self._prompt.examples) == 0:
-            raise ValueError(
+            raise ValueError(
+                "At least one example is required. Please add examples using "
+                ".example('input', 'output') before building the prompt."
+            )

     def get_object(self) -> FewShotPrompt:
         """Return the underlying FewShotPrompt object.
@@ -522,11 +570,13 @@ class FewShotPromptBuilder:
         self._validate()
         return self.build_xml()

-    def build_json(self, **kwargs
+    def build_json(self, **kwargs) -> str:
         """Build and return the prompt as a JSON string.

         Args:
-            **kwargs: Keyword arguments forwarded to ``model_dump_json``.
+            **kwargs: Keyword arguments forwarded to Pydantic's ``model_dump_json``.
+                Common options include ``indent``, ``include``, ``exclude``,
+                ``by_alias``, ``exclude_unset``, ``exclude_defaults``, ``exclude_none``.

         Returns:
             str: JSON representation of the prompt.
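
The new fail-fast validation is easiest to see end to end: the messages below are the ones added in `_validate()`, and `improve()` now also validates before calling the API and re-validates afterwards (restoring the original prompt) if the model drops all examples. A short usage sketch:

```python
from openaivec.prompt import FewShotPromptBuilder

builder = FewShotPromptBuilder().purpose("Normalize country names to ISO 3166-1 alpha-2")

try:
    builder.build()  # no example added yet
except ValueError as e:
    print(e)  # "At least one example is required. ..."

prompt_xml = (
    builder
    .example("United States of America", "US")
    .example("Nippon", "JP")
    .build()  # validates, then renders XML via build_xml()
)
```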
openaivec/provider.py
CHANGED
@@ -65,6 +65,11 @@ def provide_openai_client() -> OpenAI:
     azure_api_version = CONTAINER.resolve(AzureOpenAIAPIVersion)

     if all(param.value for param in [azure_api_key, azure_base_url, azure_api_version]):
+        # Type checker support: values are guaranteed non-None by the all() check above
+        assert azure_api_key.value is not None
+        assert azure_base_url.value is not None
+        assert azure_api_version.value is not None
+
         _check_azure_v1_api_url(azure_base_url.value)
         return AzureOpenAI(
             api_key=azure_api_key.value,
@@ -103,6 +108,11 @@ def provide_async_openai_client() -> AsyncOpenAI:
     azure_api_version = CONTAINER.resolve(AzureOpenAIAPIVersion)

     if all(param.value for param in [azure_api_key, azure_base_url, azure_api_version]):
+        # Type checker support: values are guaranteed non-None by the all() check above
+        assert azure_api_key.value is not None
+        assert azure_base_url.value is not None
+        assert azure_api_version.value is not None
+
         _check_azure_v1_api_url(azure_base_url.value)
         return AsyncAzureOpenAI(
             api_key=azure_api_key.value,
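
The added asserts are the standard narrowing idiom: `all(...)` over a list proves the values are truthy at runtime, but type checkers such as mypy and pyright do not narrow `str | None` through it, so each value is asserted individually before use. A minimal standalone illustration of the pattern (not the library's code):

```python
from dataclasses import dataclass


@dataclass(frozen=True)
class Setting:
    value: str | None


def endpoint(api_key: Setting, base_url: Setting) -> str:
    if all(s.value for s in [api_key, base_url]):
        # all() does not narrow Optional for the type checker; assert does.
        assert api_key.value is not None
        assert base_url.value is not None
        return f"{base_url.value}?key={api_key.value}"
    raise RuntimeError("missing configuration")
```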