PyPI - openaivec - Versions diffs - 0.13.0__tar.gz → 0.13.1__tar.gz - Mend

openaivec 0.13.0tar.gz → 0.13.1tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (81) hide show

{openaivec-0.13.0 → openaivec-0.13.1}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: openaivec
-Version: 0.13.0
+Version: 0.13.1
 Summary: Generative mutation for tabular calculation
 Project-URL: Homepage, https://microsoft.github.io/openaivec/
 Project-URL: Repository, https://github.com/microsoft/openaivec

{openaivec-0.13.0 → openaivec-0.13.1}/src/openaivec/embeddings.py RENAMED Viewed

@@ -4,7 +4,7 @@ from typing import List
 import numpy as np
 from numpy.typing import NDArray
-from openai import AsyncOpenAI, OpenAI, RateLimitError
+from openai import AsyncOpenAI, InternalServerError, OpenAI, RateLimitError
 from .log import observe
 from .proxy import AsyncBatchingMapProxy, BatchingMapProxy
@@ -47,7 +47,7 @@ class BatchEmbeddings:
         return cls(client=client, model_name=model_name, cache=BatchingMapProxy(batch_size=batch_size))
     @observe(_LOGGER)
-    @backoff(exception=RateLimitError, scale=15, max_retries=8)
+    @backoff(exceptions=[RateLimitError, InternalServerError], scale=1, max_retries=12)
     def _embed_chunk(self, inputs: List[str]) -> List[NDArray[np.float32]]:
         """Embed one minibatch of strings.
@@ -155,7 +155,7 @@ class AsyncBatchEmbeddings:
         )
     @observe(_LOGGER)
-    @backoff_async(exception=RateLimitError, scale=15, max_retries=8)
+    @backoff_async(exceptions=[RateLimitError, InternalServerError], scale=1, max_retries=12)
     async def _embed_chunk(self, inputs: List[str]) -> List[NDArray[np.float32]]:
         """Embed one minibatch of strings asynchronously.

{openaivec-0.13.0 → openaivec-0.13.1}/src/openaivec/responses.py RENAMED Viewed

@@ -2,7 +2,7 @@ from dataclasses import dataclass, field
 from logging import Logger, getLogger
 from typing import Generic, List, Type, cast
-from openai import AsyncOpenAI, OpenAI, RateLimitError
+from openai import AsyncOpenAI, InternalServerError, OpenAI, RateLimitError
 from openai.types.responses import ParsedResponse
 from pydantic import BaseModel
@@ -206,7 +206,7 @@ class BatchResponses(Generic[ResponseFormat]):
         )
     @observe(_LOGGER)
-    @backoff(exception=RateLimitError, scale=15, max_retries=8)
+    @backoff(exceptions=[RateLimitError, InternalServerError], scale=1, max_retries=12)
     def _request_llm(self, user_messages: List[Message[str]]) -> ParsedResponse[Response[ResponseFormat]]:
         """Make a single call to the OpenAI JSON‑mode endpoint.
@@ -400,7 +400,7 @@ class AsyncBatchResponses(Generic[ResponseFormat]):
         )
     @observe(_LOGGER)
-    @backoff_async(exception=RateLimitError, scale=15, max_retries=8)
+    @backoff_async(exceptions=[RateLimitError, InternalServerError], scale=1, max_retries=12)
     async def _request_llm(self, user_messages: List[Message[str]]) -> ParsedResponse[Response[ResponseFormat]]:
         """Make a single async call to the OpenAI JSON‑mode endpoint.

{openaivec-0.13.0 → openaivec-0.13.1}/src/openaivec/util.py RENAMED Viewed

@@ -3,7 +3,7 @@ import functools
 import re
 import time
 from dataclasses import dataclass
-from typing import Awaitable, Callable, List, TypeVar
+from typing import Awaitable, Callable, List, Type, TypeVar
 import numpy as np
 import tiktoken
@@ -34,24 +34,28 @@ def get_exponential_with_cutoff(scale: float) -> float:
             return v
-def backoff(exception: type[Exception], scale: int | None = None, max_retries: int | None = None) -> Callable[..., V]:
+def backoff(
+    exceptions: List[Type[Exception]],
+    scale: int | None = None,
+    max_retries: int | None = None,
+) -> Callable[..., V]:
     """Decorator implementing exponential back‑off retry logic.
     Args:
-        exception (type[Exception]): Exception type that triggers a retry.
+        exceptions (List[Type[Exception]]): List of exception types that trigger a retry.
         scale (int | None): Initial scale parameter for the exponential jitter.
             This scale is used as the mean for the first delay's exponential
             distribution and doubles with each subsequent retry. If ``None``,
             an initial scale of 1.0 is used.
-        max_retries (Optional[int]): Maximum number of retries. ``None`` means
+        max_retries (int | None): Maximum number of retries. ``None`` means
             retry indefinitely.
     Returns:
         Callable[..., V]: A decorated function that retries on the specified
-            exception with exponential back‑off.
+            exceptions with exponential back‑off.
     Raises:
-        exception: Re‑raised when the maximum number of retries is exceeded.
+        Exception: Re‑raised when the maximum number of retries is exceeded.
     """
     def decorator(func: Callable[..., V]) -> Callable[..., V]:
@@ -65,7 +69,7 @@ def backoff(exception: type[Exception], scale: int | None = None, max_retries: i
             while True:
                 try:
                     return func(*args, **kwargs)
-                except exception:
+                except tuple(exceptions):
                     attempt += 1
                     if max_retries is not None and attempt >= max_retries:
                         raise
@@ -83,12 +87,14 @@ def backoff(exception: type[Exception], scale: int | None = None, max_retries: i
 def backoff_async(
-    exception: type[Exception], scale: int | None = None, max_retries: int | None = None
+    exceptions: List[Type[Exception]],
+    scale: int | None = None,
+    max_retries: int | None = None,
 ) -> Callable[..., Awaitable[V]]:
     """Asynchronous version of the backoff decorator.
     Args:
-        exception (type[Exception]): Exception type that triggers a retry.
+        exceptions (List[Type[Exception]]): List of exception types that trigger a retry.
         scale (int | None): Initial scale parameter for the exponential jitter.
             This scale is used as the mean for the first delay's exponential
             distribution and doubles with each subsequent retry. If ``None``,
@@ -98,10 +104,10 @@ def backoff_async(
     Returns:
         Callable[..., Awaitable[V]]: A decorated asynchronous function that
-            retries on the specified exception with exponential back‑off.
+            retries on the specified exceptions with exponential back‑off.
     Raises:
-        exception: Re‑raised when the maximum number of retries is exceeded.
+        Exception: Re‑raised when the maximum number of retries is exceeded.
     """
     def decorator(func: Callable[..., Awaitable[V]]) -> Callable[..., Awaitable[V]]:
@@ -115,7 +121,7 @@ def backoff_async(
             while True:
                 try:
                     return await func(*args, **kwargs)
-                except exception:
+                except tuple(exceptions):
                     attempt += 1
                     if max_retries is not None and attempt >= max_retries:
                         raise

openaivec-0.13.1/tests/test_util.py ADDED Viewed

@@ -0,0 +1,291 @@
+import asyncio
+import time
+from unittest import TestCase
+import tiktoken
+from openaivec.util import TextChunker, backoff, backoff_async
+class TestTextChunker(TestCase):
+    def setUp(self):
+        self.sep = TextChunker(
+            enc=tiktoken.encoding_for_model("text-embedding-3-large"),
+        )
+    def test_split(self):
+        text = """
+Kubernetes was announced by Google on June 6, 2014.[10] The project was conceived and created by Google employees Joe Beda, Brendan Burns, and Craig McLuckie. Others at Google soon joined to help build the project including Ville Aikas, Dawn Chen, Brian Grant, Tim Hockin, and Daniel Smith.[11][12] Other companies such as Red Hat and CoreOS joined the effort soon after, with notable contributors such as Clayton Coleman and Kelsey Hightower.[10]
+The design and development of Kubernetes was inspired by Google's Borg cluster manager and based on Promise Theory.[13][14] Many of its top contributors had previously worked on Borg;[15][16] they codenamed Kubernetes "Project 7" after the Star Trek ex-Borg character Seven of Nine[17] and gave its logo a seven-spoked ship's wheel (designed by Tim Hockin). Unlike Borg, which was written in C++,[15] Kubernetes is written in the Go language.
+Kubernetes was announced in June, 2014 and version 1.0 was released on July 21, 2015.[18] Google worked with the Linux Foundation to form the Cloud Native Computing Foundation (CNCF)[19] and offered Kubernetes as the seed technology.
+Google was already offering a managed Kubernetes service, GKE, and Red Hat was supporting Kubernetes as part of OpenShift since the inception of the Kubernetes project in 2014.[20] In 2017, the principal competitors rallied around Kubernetes and announced adding native support for it:
+VMware (proponent of Pivotal Cloud Foundry)[21] in August,
+Mesosphere, Inc. (proponent of Marathon and Mesos)[22] in September,
+Docker, Inc. (proponent of Docker)[23] in October,
+Microsoft Azure[24] also in October,
+AWS announced support for Kubernetes via the Elastic Kubernetes Service (EKS)[25] in November.
+Cisco Elastic Kubernetes Service (EKS)[26] in November.
+On March 6, 2018, Kubernetes Project reached ninth place in the list of GitHub projects by the number of commits, and second place in authors and issues, after the Linux kernel.[27]
+Until version 1.18, Kubernetes followed an N-2 support policy, meaning that the three most recent minor versions receive security updates and bug fixes.[28] Starting with version 1.19, Kubernetes follows an N-3 support policy.[29]
+"""
+        chunks = self.sep.split(text, max_tokens=256, sep=[".", "\n\n"])
+        # Assert that the number of chunks is as expected
+        enc = tiktoken.encoding_for_model("text-embedding-3-large")
+        for chunk in chunks:
+            self.assertLessEqual(len(enc.encode(chunk)), 256)
+class TestBackoff(TestCase):
+    def test_backoff_no_exception(self):
+        """Test that function executes normally when no exception is raised."""
+        call_count = 0
+        @backoff(exceptions=[ValueError], scale=0.1, max_retries=3)
+        def success_func():
+            nonlocal call_count
+            call_count += 1
+            return "success"
+        result = success_func()
+        self.assertEqual(result, "success")
+        self.assertEqual(call_count, 1)
+    def test_backoff_retries_on_exception(self):
+        """Test that function retries on specified exception."""
+        call_count = 0
+        @backoff(exceptions=[ValueError], scale=0.01, max_retries=3)
+        def fail_twice():
+            nonlocal call_count
+            call_count += 1
+            if call_count < 3:
+                raise ValueError("Test error")
+            return "success"
+        result = fail_twice()
+        self.assertEqual(result, "success")
+        self.assertEqual(call_count, 3)
+    def test_backoff_multiple_exceptions(self):
+        """Test that function retries on multiple exception types."""
+        call_count = 0
+        @backoff(exceptions=[ValueError, TypeError], scale=0.01, max_retries=5)
+        def fail_with_different_errors():
+            nonlocal call_count
+            call_count += 1
+            if call_count == 1:
+                raise ValueError("First error")
+            elif call_count == 2:
+                raise TypeError("Second error")
+            return "success"
+        result = fail_with_different_errors()
+        self.assertEqual(result, "success")
+        self.assertEqual(call_count, 3)
+    def test_backoff_max_retries_exceeded(self):
+        """Test that function raises exception when max retries exceeded."""
+        call_count = 0
+        @backoff(exceptions=[ValueError], scale=0.01, max_retries=2)
+        def always_fail():
+            nonlocal call_count
+            call_count += 1
+            raise ValueError("Always fails")
+        with self.assertRaises(ValueError) as cm:
+            always_fail()
+        self.assertEqual(str(cm.exception), "Always fails")
+        self.assertEqual(call_count, 2)  # Initial call + 1 retry
+    def test_backoff_unhandled_exception_not_retried(self):
+        """Test that unhandled exceptions are not retried."""
+        call_count = 0
+        @backoff(exceptions=[ValueError], scale=0.01, max_retries=3)
+        def raise_unhandled():
+            nonlocal call_count
+            call_count += 1
+            raise TypeError("Unhandled exception")
+        with self.assertRaises(TypeError) as cm:
+            raise_unhandled()
+        self.assertEqual(str(cm.exception), "Unhandled exception")
+        self.assertEqual(call_count, 1)  # No retries for unhandled exception
+    def test_backoff_exponential_delay(self):
+        """Test that delay increases exponentially."""
+        call_times = []
+        @backoff(exceptions=[ValueError], scale=0.01, max_retries=3)
+        def track_timing():
+            call_times.append(time.time())
+            if len(call_times) < 3:
+                raise ValueError("Retry")
+            return "success"
+        result = track_timing()
+        self.assertEqual(result, "success")
+        self.assertEqual(len(call_times), 3)
+        # Check that delays are present (but keep them small for test speed)
+        for i in range(1, len(call_times)):
+            delay = call_times[i] - call_times[i - 1]
+            self.assertGreater(delay, 0)  # Some delay exists
+class TestBackoffAsync(TestCase):
+    def test_backoff_async_no_exception(self):
+        """Test that async function executes normally when no exception is raised."""
+        call_count = 0
+        @backoff_async(exceptions=[ValueError], scale=0.1, max_retries=3)
+        async def success_func():
+            nonlocal call_count
+            call_count += 1
+            await asyncio.sleep(0.01)
+            return "success"
+        result = asyncio.run(success_func())
+        self.assertEqual(result, "success")
+        self.assertEqual(call_count, 1)
+    def test_backoff_async_retries_on_exception(self):
+        """Test that async function retries on specified exception."""
+        call_count = 0
+        @backoff_async(exceptions=[ValueError], scale=0.01, max_retries=3)
+        async def fail_twice():
+            nonlocal call_count
+            call_count += 1
+            await asyncio.sleep(0.01)
+            if call_count < 3:
+                raise ValueError("Test error")
+            return "success"
+        result = asyncio.run(fail_twice())
+        self.assertEqual(result, "success")
+        self.assertEqual(call_count, 3)
+    def test_backoff_async_multiple_exceptions(self):
+        """Test that async function retries on multiple exception types."""
+        call_count = 0
+        @backoff_async(exceptions=[ValueError, TypeError], scale=0.01, max_retries=5)
+        async def fail_with_different_errors():
+            nonlocal call_count
+            call_count += 1
+            await asyncio.sleep(0.01)
+            if call_count == 1:
+                raise ValueError("First error")
+            elif call_count == 2:
+                raise TypeError("Second error")
+            return "success"
+        result = asyncio.run(fail_with_different_errors())
+        self.assertEqual(result, "success")
+        self.assertEqual(call_count, 3)
+    def test_backoff_async_max_retries_exceeded(self):
+        """Test that async function raises exception when max retries exceeded."""
+        call_count = 0
+        @backoff_async(exceptions=[ValueError], scale=0.01, max_retries=2)
+        async def always_fail():
+            nonlocal call_count
+            call_count += 1
+            await asyncio.sleep(0.01)
+            raise ValueError("Always fails")
+        with self.assertRaises(ValueError) as cm:
+            asyncio.run(always_fail())
+        self.assertEqual(str(cm.exception), "Always fails")
+        self.assertEqual(call_count, 2)  # Initial call + 1 retry
+    def test_backoff_async_unhandled_exception_not_retried(self):
+        """Test that unhandled exceptions are not retried in async."""
+        call_count = 0
+        @backoff_async(exceptions=[ValueError], scale=0.01, max_retries=3)
+        async def raise_unhandled():
+            nonlocal call_count
+            call_count += 1
+            await asyncio.sleep(0.01)
+            raise TypeError("Unhandled exception")
+        with self.assertRaises(TypeError) as cm:
+            asyncio.run(raise_unhandled())
+        self.assertEqual(str(cm.exception), "Unhandled exception")
+        self.assertEqual(call_count, 1)  # No retries for unhandled exception
+    def test_backoff_async_with_openai_exceptions(self):
+        """Test backoff with OpenAI exception types."""
+        # Import OpenAI exceptions for testing
+        try:
+            from openai import RateLimitError, InternalServerError
+            from unittest.mock import Mock
+            call_count = 0
+            # Create a mock response object
+            mock_response = Mock()
+            mock_response.request = Mock()
+            mock_response.status_code = 429  # For RateLimitError
+            @backoff_async(exceptions=[RateLimitError, InternalServerError], scale=0.01, max_retries=3)
+            async def simulate_api_errors():
+                nonlocal call_count
+                call_count += 1
+                await asyncio.sleep(0.01)
+                if call_count == 1:
+                    mock_response.status_code = 429
+                    raise RateLimitError("Rate limit hit", response=mock_response, body=None)
+                elif call_count == 2:
+                    mock_response.status_code = 500
+                    raise InternalServerError("Server error", response=mock_response, body=None)
+                return "success"
+            result = asyncio.run(simulate_api_errors())
+            self.assertEqual(result, "success")
+            self.assertEqual(call_count, 3)
+        except ImportError:
+            # Skip test if OpenAI is not installed
+            self.skipTest("OpenAI not installed")
+    def test_backoff_production_settings(self):
+        """Test backoff with production-like settings for OpenAI API."""
+        call_count = 0
+        call_times = []
+        @backoff(exceptions=[ValueError], scale=1, max_retries=12)
+        def simulate_rate_limit_scenario():
+            nonlocal call_count
+            call_count += 1
+            call_times.append(time.time())
+            # Simulate rate limit that clears after a few retries
+            if call_count < 4:
+                raise ValueError("Rate limit hit")
+            return "success"
+        start_time = time.time()
+        result = simulate_rate_limit_scenario()
+        total_time = time.time() - start_time
+        self.assertEqual(result, "success")
+        self.assertEqual(call_count, 4)
+        self.assertEqual(len(call_times), 4)
+        # With scale=1, total time should be reasonable (under 10 seconds)
+        # First attempt: immediate, then ~1s, ~2s, ~4s delays
+        self.assertLess(total_time, 10)
+        self.assertGreater(total_time, 0.5)  # Should have some delay

openaivec-0.13.0/tests/test_util.py DELETED Viewed

@@ -1,41 +0,0 @@
-from unittest import TestCase
-import tiktoken
-from openaivec.util import TextChunker
-class TestTextChunker(TestCase):
-    def setUp(self):
-        self.sep = TextChunker(
-            enc=tiktoken.encoding_for_model("text-embedding-3-large"),
-        )
-    def test_split(self):
-        text = """
-Kubernetes was announced by Google on June 6, 2014.[10] The project was conceived and created by Google employees Joe Beda, Brendan Burns, and Craig McLuckie. Others at Google soon joined to help build the project including Ville Aikas, Dawn Chen, Brian Grant, Tim Hockin, and Daniel Smith.[11][12] Other companies such as Red Hat and CoreOS joined the effort soon after, with notable contributors such as Clayton Coleman and Kelsey Hightower.[10]
-The design and development of Kubernetes was inspired by Google's Borg cluster manager and based on Promise Theory.[13][14] Many of its top contributors had previously worked on Borg;[15][16] they codenamed Kubernetes "Project 7" after the Star Trek ex-Borg character Seven of Nine[17] and gave its logo a seven-spoked ship's wheel (designed by Tim Hockin). Unlike Borg, which was written in C++,[15] Kubernetes is written in the Go language.
-Kubernetes was announced in June, 2014 and version 1.0 was released on July 21, 2015.[18] Google worked with the Linux Foundation to form the Cloud Native Computing Foundation (CNCF)[19] and offered Kubernetes as the seed technology.
-Google was already offering a managed Kubernetes service, GKE, and Red Hat was supporting Kubernetes as part of OpenShift since the inception of the Kubernetes project in 2014.[20] In 2017, the principal competitors rallied around Kubernetes and announced adding native support for it:
-VMware (proponent of Pivotal Cloud Foundry)[21] in August,
-Mesosphere, Inc. (proponent of Marathon and Mesos)[22] in September,
-Docker, Inc. (proponent of Docker)[23] in October,
-Microsoft Azure[24] also in October,
-AWS announced support for Kubernetes via the Elastic Kubernetes Service (EKS)[25] in November.
-Cisco Elastic Kubernetes Service (EKS)[26] in November.
-On March 6, 2018, Kubernetes Project reached ninth place in the list of GitHub projects by the number of commits, and second place in authors and issues, after the Linux kernel.[27]
-Until version 1.18, Kubernetes followed an N-2 support policy, meaning that the three most recent minor versions receive security updates and bug fixes.[28] Starting with version 1.19, Kubernetes follows an N-3 support policy.[29]
-"""
-        chunks = self.sep.split(text, max_tokens=256, sep=[".", "\n\n"])
-        # Assert that the number of chunks is as expected
-        enc = tiktoken.encoding_for_model("text-embedding-3-large")
-        for chunk in chunks:
-            self.assertLessEqual(len(enc.encode(chunk)), 256)