indoxrouter 0.1.0__py3-none-any.whl → 0.1.2__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- indoxRouter/__init__.py +83 -0
- indoxRouter/client.py +564 -218
- indoxRouter/client_resourses/__init__.py +20 -0
- indoxRouter/client_resourses/base.py +67 -0
- indoxRouter/client_resourses/chat.py +144 -0
- indoxRouter/client_resourses/completion.py +138 -0
- indoxRouter/client_resourses/embedding.py +83 -0
- indoxRouter/client_resourses/image.py +116 -0
- indoxRouter/client_resourses/models.py +114 -0
- indoxRouter/config.py +151 -0
- indoxRouter/constants/__init__.py +81 -0
- indoxRouter/exceptions/__init__.py +70 -0
- indoxRouter/models/__init__.py +111 -0
- indoxRouter/providers/__init__.py +50 -50
- indoxRouter/providers/ai21labs.json +128 -0
- indoxRouter/providers/base_provider.py +62 -30
- indoxRouter/providers/claude.json +164 -0
- indoxRouter/providers/cohere.json +116 -0
- indoxRouter/providers/databricks.json +110 -0
- indoxRouter/providers/deepseek.json +110 -0
- indoxRouter/providers/google.json +128 -0
- indoxRouter/providers/meta.json +128 -0
- indoxRouter/providers/mistral.json +146 -0
- indoxRouter/providers/nvidia.json +110 -0
- indoxRouter/providers/openai.json +308 -0
- indoxRouter/providers/openai.py +471 -72
- indoxRouter/providers/qwen.json +110 -0
- indoxRouter/utils/__init__.py +240 -0
- indoxrouter-0.1.2.dist-info/LICENSE +21 -0
- indoxrouter-0.1.2.dist-info/METADATA +259 -0
- indoxrouter-0.1.2.dist-info/RECORD +33 -0
- indoxRouter/api_endpoints.py +0 -336
- indoxRouter/client_package.py +0 -138
- indoxRouter/init_db.py +0 -71
- indoxRouter/main.py +0 -711
- indoxRouter/migrations/__init__.py +0 -1
- indoxRouter/migrations/env.py +0 -98
- indoxRouter/migrations/versions/__init__.py +0 -1
- indoxRouter/migrations/versions/initial_schema.py +0 -84
- indoxRouter/providers/ai21.py +0 -268
- indoxRouter/providers/claude.py +0 -177
- indoxRouter/providers/cohere.py +0 -171
- indoxRouter/providers/databricks.py +0 -166
- indoxRouter/providers/deepseek.py +0 -166
- indoxRouter/providers/google.py +0 -216
- indoxRouter/providers/llama.py +0 -164
- indoxRouter/providers/meta.py +0 -227
- indoxRouter/providers/mistral.py +0 -182
- indoxRouter/providers/nvidia.py +0 -164
- indoxrouter-0.1.0.dist-info/METADATA +0 -179
- indoxrouter-0.1.0.dist-info/RECORD +0 -27
- {indoxrouter-0.1.0.dist-info → indoxrouter-0.1.2.dist-info}/WHEEL +0 -0
- {indoxrouter-0.1.0.dist-info → indoxrouter-0.1.2.dist-info}/top_level.txt +0 -0
indoxRouter/providers/openai.py
CHANGED
@@ -1,122 +1,521 @@
New file contents in 0.1.2:

```python
"""
OpenAI provider for indoxRouter.
"""

import os
from typing import Dict, List, Any, Optional, Union

import openai
from openai import OpenAI
from datetime import datetime
from .base_provider import BaseProvider
from ..exceptions import AuthenticationError, RequestError, RateLimitError
from ..utils import calculate_cost, get_model_info
from ..models import ChatMessage


class Provider(BaseProvider):
    """OpenAI provider implementation."""

    def __init__(self, api_key: str, model_name: str):
        """
        Initialize the OpenAI provider.

        Args:
            api_key: The API key for OpenAI.
            model_name: The name of the model to use.
        """
        super().__init__(api_key, model_name)
        self.client = OpenAI(api_key=api_key)
        self.model_info = get_model_info("openai", model_name)

    def chat(self, messages: List[Dict[str, str]], **kwargs) -> Dict[str, Any]:
        """
        Send a chat request to OpenAI.

        Args:
            messages: A list of message dictionaries with 'role' and 'content' keys.
            **kwargs: Additional parameters to pass to the OpenAI API.

        Returns:
            A dictionary containing the response from OpenAI.
            If stream=True and return_generator=True, returns a generator that yields chunks of the response.

        Raises:
            AuthenticationError: If the API key is invalid.
            RequestError: If the request fails.
            RateLimitError: If the rate limit is exceeded.
        """
        try:
            # Check if streaming is requested
            stream = kwargs.pop("stream", False)
            # Check if we should return a generator
            return_generator = kwargs.pop("return_generator", False)

            # If streaming is requested, we need to handle it differently
            if stream:
                # Remove stream from kwargs to avoid passing it twice
                openai_messages = []
                for msg in messages:
                    if isinstance(msg, ChatMessage):
                        openai_messages.append(
                            {"role": msg.role, "content": msg.content}
                        )
                    else:
                        openai_messages.append(msg)

                # Create the streaming response
                stream_response = self.client.chat.completions.create(
                    model=self.model_name,
                    messages=openai_messages,
                    stream=True,
                    **kwargs,
                )

                # If return_generator is True, return a generator that yields chunks
                if return_generator:
                    # Create a streaming generator with usage tracking
                    return StreamingGenerator(
                        stream_response=stream_response,
                        model_name=self.model_name,
                        messages=messages,
                    )

                # Otherwise, collect the full response content from the stream
                content = ""
                for chunk in stream_response:
                    if hasattr(chunk, "choices") and len(chunk.choices) > 0:
                        delta = chunk.choices[0].delta
                        if hasattr(delta, "content") and delta.content is not None:
                            content += delta.content

                # For streaming responses, we don't have usage information directly
                # We'll provide a minimal response with the content
                return {
                    "data": content,
                    "model": self.model_name,
                    "provider": "openai",
                    "success": True,
                    "message": "Successfully completed streaming chat request",
                    "cost": 0.0,  # We don't have cost information for streaming responses
                    "timestamp": datetime.now().isoformat(),
                    "usage": {
                        "tokens_prompt": 0,  # We don't have token information for streaming responses
                        "tokens_completion": 0,
                        "tokens_total": 0,
                    },
                    "finish_reason": "stop",  # Default finish reason
                    "raw_response": None,  # We don't have the raw response for streaming
                }

            # Handle non-streaming responses as before
            openai_messages = []
            for msg in messages:
                if isinstance(msg, ChatMessage):
                    openai_messages.append({"role": msg.role, "content": msg.content})
                else:
                    openai_messages.append(msg)
            response = self.client.chat.completions.create(
                model=self.model_name,
                messages=openai_messages,
                **kwargs,
            )
            # Extract the response content
            content = response.choices[0].message.content

            # Extract usage information from the response
            prompt_tokens = (
                response.usage.prompt_tokens
                if hasattr(response.usage, "prompt_tokens")
                else 0
            )
            completion_tokens = (
                response.usage.completion_tokens
                if hasattr(response.usage, "completion_tokens")
                else 0
            )
            total_tokens = (
                response.usage.total_tokens
                if hasattr(response.usage, "total_tokens")
                else 0
            )

            cost = calculate_cost(
                f"openai/{self.model_name}",
                input_tokens=prompt_tokens,
                output_tokens=completion_tokens,
            )

            # Create a response dictionary with the extracted information
            return {
                "data": content,
                "model": self.model_name,
                "provider": "openai",
                "success": True,
                "message": "Successfully completed chat request",
                "cost": cost,
                "timestamp": datetime.now().isoformat(),
                # Add usage as dict with consistent field names
                "usage": {
                    "tokens_prompt": prompt_tokens,
                    "tokens_completion": completion_tokens,
                    "tokens_total": total_tokens,
                },
                # Optional fields
                "finish_reason": response.choices[0].finish_reason,
                "raw_response": response.model_dump(),
            }

        except openai.AuthenticationError:
            raise AuthenticationError("Invalid OpenAI API key.")
        except openai.RateLimitError:
            raise RateLimitError("OpenAI rate limit exceeded.")
        except Exception as e:
            raise RequestError(f"OpenAI request failed: {str(e)}")

    def complete(self, prompt: str, **kwargs) -> Dict[str, Any]:
        """
        Send a completion request to OpenAI.

        Args:
            prompt: The prompt to complete.
            **kwargs: Additional parameters to pass to the OpenAI API.

        Returns:
            A dictionary containing the response from OpenAI.
            If stream=True and return_generator=True, returns a generator that yields chunks of the response.

        Raises:
            AuthenticationError: If the API key is invalid.
            RequestError: If the request fails.
            RateLimitError: If the rate limit is exceeded.
        """
        # Check if streaming is requested
        stream = kwargs.pop("stream", False)
        return_generator = kwargs.pop("return_generator", False)

        # For OpenAI, we'll use the chat API for completions as well
        messages = [{"role": "user", "content": prompt}]

        # If streaming is requested, handle it through the chat method
        if stream:
            return self.chat(
                messages, stream=True, return_generator=return_generator, **kwargs
            )

        # Otherwise, use the regular chat method
        return self.chat(messages, **kwargs)

    def embed(self, text: Union[str, List[str]], **kwargs) -> Dict[str, Any]:
        """
        Send an embedding request to OpenAI.

        Args:
            text: The text to embed. Can be a single string or a list of strings.
            **kwargs: Additional parameters to pass to the OpenAI API.

        Returns:
            A dictionary containing the embeddings from OpenAI.

        Raises:
            AuthenticationError: If the API key is invalid.
            RequestError: If the request fails.
            RateLimitError: If the rate limit is exceeded.
        """
        try:
            # Ensure text is a list
            if isinstance(text, str):
                text = [text]

            # Use the embedding model
            response = self.client.embeddings.create(
                model=self.model_name, input=text, **kwargs
            )

            # Extract embeddings
            embeddings = [item.embedding for item in response.data]

            # Create a list of embedding objects with the expected structure
            embedding_objects = []
            for i, embedding in enumerate(embeddings):
                embedding_objects.append(
                    {
                        "embedding": embedding,
                        "index": i,
                        "text": text[i] if i < len(text) else "",
                    }
                )

            # Extract usage information from the response
            prompt_tokens = (
                response.usage.prompt_tokens
                if hasattr(response.usage, "prompt_tokens")
                else 0
            )
            total_tokens = (
                response.usage.total_tokens
                if hasattr(response.usage, "total_tokens")
                else 0
            )

            embedding_price_per_1k = get_model_info("openai", self.model_name).get(
                "inputPricePer1KTokens"
            )

            # Calculate the cost
            cost = (prompt_tokens / 1000) * embedding_price_per_1k

            # Create usage information
            usage = {
                "tokens_prompt": prompt_tokens,
                "tokens_completion": 0,
                "tokens_total": total_tokens,
                "cost": cost,
                "latency": 0.0,  # We don't have latency information from the API
                "timestamp": datetime.now().isoformat(),
            }

            return {
                "data": embedding_objects,
                "model": self.model_name,
                "provider": "openai",
                "success": True,
                "message": "Successfully generated embeddings",
                "usage": usage,
                "raw_response": response.model_dump(),
            }
        except openai.AuthenticationError:
            raise AuthenticationError("Invalid OpenAI API key.")
        except openai.RateLimitError:
            raise RateLimitError("OpenAI rate limit exceeded.")
        except Exception as e:
            raise RequestError(f"OpenAI embedding request failed: {str(e)}")

    def generate_image(self, prompt: str, **kwargs) -> Dict[str, Any]:
        """
        Generate an image from a prompt using OpenAI.

        Args:
            prompt: The prompt to generate an image from.
            **kwargs: Additional parameters to pass to the OpenAI API.

        Returns:
            A dictionary containing the image URL or data.

        Raises:
            AuthenticationError: If the API key is invalid.
            RequestError: If the request fails.
            RateLimitError: If the rate limit is exceeded.
        """
        try:
            # Use DALL-E model
            model = kwargs.get("model", "dall-e-3")
            size = kwargs.get("size", "1024x1024")
            quality = kwargs.get("quality", "standard")
            n = kwargs.get("n", 1)

            response = self.client.images.generate(
                model=model, prompt=prompt, size=size, quality=quality, n=n
            )

            # Extract image URLs
            images = [item.url for item in response.data]

            # For image generation, we don't have token usage, so we'll estimate cost
            # based on the model and parameters
            cost = calculate_cost(
                f"openai/{model}",  # e.g., "openai/dall-e-3"
                input_tokens=n,  # Number of images
                output_tokens=0,
            )

            # Create usage information
            usage = {
                "tokens_prompt": 0,  # We don't have token information for images
                "tokens_completion": 0,
                "tokens_total": 0,
                "cost": cost,
                "latency": 0.0,
                "timestamp": datetime.now().isoformat(),
            }

            return {
                "data": images,
                "model": model,
                "provider": "openai",
                "success": True,
                "message": "Successfully generated images",
                "usage": usage,
                "sizes": [size] * n,
                "formats": ["url"] * n,
                "raw_response": response.model_dump(),
            }

        except openai.AuthenticationError:
            raise AuthenticationError("Invalid OpenAI API key.")
        except openai.RateLimitError:
            raise RateLimitError("OpenAI rate limit exceeded.")
        except Exception as e:
            raise RequestError(f"OpenAI image generation request failed: {str(e)}")

    def get_token_count(self, text: str) -> int:
        """
        Get the number of tokens in a text using OpenAI's tokenizer.

        Args:
            text: The text to count tokens for.

        Returns:
            The number of tokens in the text.
        """
        try:
            # Use tiktoken for token counting
            import tiktoken

            encoding = tiktoken.encoding_for_model(self.model_name)
            return len(encoding.encode(text))
        except ImportError:
            # Fallback to a simple approximation if tiktoken is not available
            return len(text.split()) * 1.3  # Rough approximation

    def get_model_info(self) -> Dict[str, Any]:
        """
        Get information about the model.

        Returns:
            A dictionary containing information about the model.
        """
        return self.model_info


class StreamingGenerator:
    """
    A generator class that yields chunks of text from a streaming response
    and provides methods to get usage information at any point.
    """

    def __init__(self, stream_response, model_name, messages):
        """
        Initialize the streaming generator.

        Args:
            stream_response: The streaming response from the provider.
            model_name: The name of the model being used.
            messages: The messages sent to the provider.
        """
        self.stream_response = stream_response
        self.model_name = model_name
        self.messages = messages
        self.full_content = ""
        self.finish_reason = None
        self.is_finished = False

        # Try to initialize tiktoken for token counting
        try:
            import tiktoken

            self.encoding = tiktoken.encoding_for_model(model_name)
            self.has_tiktoken = True
        except (ImportError, Exception):
            self.has_tiktoken = False

        # Estimate prompt tokens
        self.prompt_tokens = self._count_prompt_tokens()

    def _count_prompt_tokens(self):
        """Count tokens in the prompt messages."""
        if self.has_tiktoken:
            # Use tiktoken for accurate token counting
            prompt_text = " ".join(
                [
                    msg.get("content", "") if isinstance(msg, dict) else msg.content
                    for msg in self.messages
                ]
            )
            return len(self.encoding.encode(prompt_text))
        else:
            # Fallback to character-based estimation
            prompt_text = " ".join(
                [
                    msg.get("content", "") if isinstance(msg, dict) else msg.content
                    for msg in self.messages
                ]
            )
            return len(prompt_text) // 4  # Rough estimate: 4 chars per token

    def _count_completion_tokens(self):
        """Count tokens in the completion text."""
        if self.has_tiktoken:
            # Use tiktoken for accurate token counting
            return len(self.encoding.encode(self.full_content))
        else:
            # Fallback to character-based estimation
            return len(self.full_content) // 4  # Rough estimate: 4 chars per token

    def get_usage_info(self):
        """
        Get usage information based on the current state.

        Returns:
            A dictionary with usage information.
        """
        completion_tokens = self._count_completion_tokens()
        total_tokens = self.prompt_tokens + completion_tokens

        # Calculate cost
        cost = calculate_cost(
            f"openai/{self.model_name}",
            input_tokens=self.prompt_tokens,
            output_tokens=completion_tokens,
        )

        return {
            "usage": {
                "tokens_prompt": self.prompt_tokens,
                "tokens_completion": completion_tokens,
                "tokens_total": total_tokens,
            },
            "cost": cost,
            "model": self.model_name,
            "provider": "openai",
            "finish_reason": self.finish_reason,
            "is_finished": self.is_finished,
        }

    def __iter__(self):
        return self

    def __next__(self):
        """Get the next chunk from the stream."""
        if self.is_finished:
            raise StopIteration

        try:
            chunk = next(self.stream_response)

            if hasattr(chunk, "choices") and len(chunk.choices) > 0:
                # Check for finish reason
                if (
                    hasattr(chunk.choices[0], "finish_reason")
                    and chunk.choices[0].finish_reason
                ):
                    self.finish_reason = chunk.choices[0].finish_reason

                # Get content delta
                delta = chunk.choices[0].delta
                if hasattr(delta, "content") and delta.content is not None:
                    content_chunk = delta.content
                    self.full_content += content_chunk
                    return content_chunk

                # If we got a chunk with no content but with finish_reason, we're done
                if self.finish_reason:
                    self.is_finished = True
                    raise StopIteration

                # If we got here, try the next chunk
                return next(self)

        except StopIteration:
            self.is_finished = True
            raise
```
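Below is a minimal, hypothetical usage sketch of the provider interface shown above. The API key and model name are placeholders, and it assumes the chosen model appears in the package's bundled `openai.json` data consumed by `get_model_info` and `calculate_cost`.

```python
# Hypothetical usage sketch of the 0.1.2 Provider class shown above.
# The API key and model name are placeholders, not values from the package.
from indoxRouter.providers.openai import Provider

provider = Provider(api_key="sk-PLACEHOLDER", model_name="gpt-4o-mini")

# Non-streaming chat: returns the standardized response dictionary.
response = provider.chat([{"role": "user", "content": "Hello!"}])
print(response["data"])
print(response["usage"]["tokens_total"], response["cost"])

# Streaming chat with return_generator=True yields a StreamingGenerator:
# iterate over text chunks, then read estimated usage once the stream ends.
stream = provider.chat(
    [{"role": "user", "content": "Tell me a short story."}],
    stream=True,
    return_generator=True,
)
for chunk in stream:
    print(chunk, end="", flush=True)
print()
print(stream.get_usage_info())
```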