PyPI - eval-ai-library - Versions diffs - 0.3.2__py3-none-any.whl → 0.3.10__py3-none-any.whl - Mend

eval-ai-library 0.3.2__py3-none-any.whl → 0.3.10__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of eval-ai-library might be problematic. Click here for more details.

Files changed (12) hide show

{eval_ai_library-0.3.2.dist-info → eval_ai_library-0.3.10.dist-info}/METADATA +379 -1
{eval_ai_library-0.3.2.dist-info → eval_ai_library-0.3.10.dist-info}/RECORD +12 -8
eval_ai_library-0.3.10.dist-info/entry_points.txt +2 -0
eval_lib/__init__.py +11 -1
eval_lib/cli.py +166 -0
eval_lib/dashboard_server.py +172 -0
eval_lib/evaluate.py +24 -1
eval_lib/html.py +736 -0
eval_lib/llm_client.py +47 -1
{eval_ai_library-0.3.2.dist-info → eval_ai_library-0.3.10.dist-info}/WHEEL +0 -0
{eval_ai_library-0.3.2.dist-info → eval_ai_library-0.3.10.dist-info}/licenses/LICENSE +0 -0
{eval_ai_library-0.3.2.dist-info → eval_ai_library-0.3.10.dist-info}/top_level.txt +0 -0

eval_lib/llm_client.py CHANGED Viewed

@@ -2,6 +2,7 @@
 import openai
 import functools
 import anthropic
+from abc import ABC, abstractmethod
 from openai import AsyncAzureOpenAI
 from google import genai
 from google.genai.types import GenerateContentConfig
@@ -13,6 +14,45 @@ from types import SimpleNamespace
 from .price import model_pricing
+class CustomLLMClient(ABC):
+    """
+    Base class for custom LLM clients.
+    Inherit from this to create your own model implementations.
+    Example:
+        class MyCustomLLM(CustomLLMClient):
+            async def chat_complete(self, messages, temperature):
+                # Your implementation
+                return response_text, cost
+            def get_model_name(self):
+                return "my-custom-model"
+    """
+    @abstractmethod
+    async def chat_complete(
+        self,
+        messages: list[dict[str, str]],
+        temperature: float
+    ) -> tuple[str, Optional[float]]:
+        """
+        Generate a response for the given messages.
+        Args:
+            messages: List of message dicts [{"role": "user", "content": "..."}]
+            temperature: Sampling temperature
+        Returns:
+            Tuple of (response_text, cost_in_usd)
+        """
+        pass
+    @abstractmethod
+    def get_model_name(self) -> str:
+        """Return the model name for logging/tracking purposes."""
+        pass
 class LLMConfigurationError(Exception):
     """Raised when LLM client configuration is missing or invalid."""
     pass
@@ -24,6 +64,7 @@ class Provider(str, Enum):
     GOOGLE = "google"
     OLLAMA = "ollama"
     ANTHROPIC = "anthropic"
+    CUSTOM = "custom"
 @dataclass(frozen=True, slots=True)
@@ -308,7 +349,7 @@ _HELPERS = {
 async def chat_complete(
-    llm: str | tuple[str, str] | LLMDescriptor,
+    llm: str | tuple[str, str] | LLMDescriptor | CustomLLMClient,
     messages: list[dict[str, str]],
     temperature: float = 0.0,
 ):
@@ -327,6 +368,11 @@ async def chat_complete(
         LLMConfigurationError: If required API keys or configuration are missing
         ValueError: If provider is not supported
     """
+    # Handle custom LLM clients
+    if isinstance(llm, CustomLLMClient):
+        return await llm.chat_complete(messages, temperature)
+    # Standard providers
     llm = LLMDescriptor.parse(llm)
     helper = _HELPERS.get(llm.provider)

{eval_ai_library-0.3.2.dist-info → eval_ai_library-0.3.10.dist-info}/WHEEL RENAMED Viewed

File without changes

{eval_ai_library-0.3.2.dist-info → eval_ai_library-0.3.10.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

{eval_ai_library-0.3.2.dist-info → eval_ai_library-0.3.10.dist-info}/top_level.txt RENAMED Viewed

File without changes

eval-ai-library 0.3.2__py3-none-any.whl → 0.3.10__py3-none-any.whl

Potentially problematic release.

eval-ai-library 0.3.2__py3-none-any.whl → 0.3.10__py3-none-any.whl