PyPI - inferencesh - Versions diffs - 0.2.7__py3-none-any.whl → 0.2.9__py3-none-any.whl - Mend

inferencesh 0.2.7 (py3-none-any.whl) → 0.2.9 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (16) hide show

inferencesh/__init__.py +28 -1
inferencesh/models/__init__.py +25 -0
inferencesh/models/base.py +94 -0
inferencesh/models/file.py +182 -0
inferencesh/models/llm.py +356 -0
inferencesh/utils/__init__.py +6 -0
inferencesh/utils/download.py +51 -0
inferencesh/utils/storage.py +16 -0
{inferencesh-0.2.7.dist-info → inferencesh-0.2.9.dist-info}/METADATA +1 -1
inferencesh-0.2.9.dist-info/RECORD +14 -0
{inferencesh-0.2.7.dist-info → inferencesh-0.2.9.dist-info}/WHEEL +1 -1
inferencesh/sdk.py +0 -415
inferencesh-0.2.7.dist-info/RECORD +0 -8
{inferencesh-0.2.7.dist-info → inferencesh-0.2.9.dist-info}/entry_points.txt +0 -0
{inferencesh-0.2.7.dist-info → inferencesh-0.2.9.dist-info}/licenses/LICENSE +0 -0
{inferencesh-0.2.7.dist-info → inferencesh-0.2.9.dist-info}/top_level.txt +0 -0

inferencesh/__init__.py CHANGED Viewed

@@ -2,4 +2,31 @@
 __version__ = "0.1.2"
-from .sdk import BaseApp, BaseAppInput, BaseAppOutput, File, LLMInput, ContextMessage, ContextMessageWithImage, LLMInputWithImage
+from .models import (
+    BaseApp,
+    BaseAppInput,
+    BaseAppOutput,
+    File,
+    ContextMessageRole,
+    Message,
+    ContextMessage,
+    ContextMessageWithImage,
+    LLMInput,
+    LLMInputWithImage,
+)
+from .utils import StorageDir, download
+__all__ = [
+    "BaseApp",
+    "BaseAppInput",
+    "BaseAppOutput",
+    "File",
+    "ContextMessageRole",
+    "Message",
+    "ContextMessage",
+    "ContextMessageWithImage",
+    "LLMInput",
+    "LLMInputWithImage",
+    "StorageDir",
+    "download",
+]

inferencesh/models/__init__.py ADDED Viewed

@@ -0,0 +1,25 @@
+"""Models package for inference.sh SDK."""
+from .base import BaseApp, BaseAppInput, BaseAppOutput
+from .file import File
+from .llm import (
+    ContextMessageRole,
+    Message,
+    ContextMessage,
+    ContextMessageWithImage,
+    LLMInput,
+    LLMInputWithImage,
+)
+__all__ = [
+    "BaseApp",
+    "BaseAppInput",
+    "BaseAppOutput",
+    "File",
+    "ContextMessageRole",
+    "Message",
+    "ContextMessage",
+    "ContextMessageWithImage",
+    "LLMInput",
+    "LLMInputWithImage",
+]

inferencesh/models/base.py ADDED Viewed

@@ -0,0 +1,94 @@
+from typing import Any, Dict, List
+from pydantic import BaseModel, ConfigDict
+import inspect
+import ast
+import textwrap
+from collections import OrderedDict
+class OrderedSchemaModel(BaseModel):
+    """A base model that ensures the JSON schema properties and required fields are in the order of field definition."""
+    @classmethod
+    def model_json_schema(cls, by_alias: bool = True, **kwargs: Any) -> Dict[str, Any]:
+        """Return the JSON schema with ``properties`` and ``required`` reordered.
+        Names reported by ``_get_field_order`` come first, in that order; every
+        other entry follows in the order produced by the parent implementation.
+        When no field order can be determined the parent schema is returned
+        unchanged.
+        Args:
+            by_alias: Forwarded to the parent ``model_json_schema``.
+            **kwargs: Forwarded to the parent ``model_json_schema``.
+        Returns:
+            The (possibly reordered) schema dictionary.
+        """
+        schema = super().model_json_schema(by_alias=by_alias, **kwargs)
+        field_order = cls._get_field_order()
+        if not field_order:
+            return schema
+        # Guarded lookup: a schema without a 'properties' key must not crash here.
+        properties = schema.get('properties')
+        if properties is not None:
+            ordered_properties = OrderedDict(
+                (name, properties[name]) for name in field_order if name in properties
+            )
+            # Add any remaining properties that weren't in field_order
+            for name, field_schema in properties.items():
+                ordered_properties.setdefault(name, field_schema)
+            schema['properties'] = ordered_properties
+        required = schema.get('required')
+        if required is not None:
+            ordered_required = [name for name in field_order if name in required]
+            # Add any remaining required fields that weren't in field_order
+            ordered_required.extend([name for name in required if name not in ordered_required])
+            schema['required'] = ordered_required
+        return schema
+    @classmethod
+    def _get_field_order(cls) -> List[str]:
+        """Get the order of fields as they were defined in the class.
+        The class source is parsed with ``ast`` and the names of the annotated
+        assignments found directly in the class body are returned.
+        Returns:
+            Field names in definition order, or an empty list when the source
+            is unavailable or the class definition cannot be located in it.
+        """
+        try:
+            source = inspect.getsource(cls)
+        except (OSError, TypeError):
+            # inspect.getsource fails for classes without retrievable source
+            # (interactive sessions, exec'd code, ...). Leave the schema as is.
+            return []
+        # Unindent the entire source code
+        source = textwrap.dedent(source)
+        try:
+            module = ast.parse(source)
+        except IndentationError:
+            # If we still get an IndentationError, wrap the class in a dummy module
+            wrapped = f"class DummyModule:\n{textwrap.indent(source, '    ')}"
+            candidates = ast.parse(wrapped).body[0].body
+        else:
+            candidates = module.body
+        # A default of None avoids a bare StopIteration escaping when no node matches.
+        class_def = next(
+            (node for node in candidates if isinstance(node, ast.ClassDef) and node.name == cls.__name__),
+            None,
+        )
+        if class_def is None:
+            return []
+        # Extract field names in the order they were defined
+        return [
+            node.target.id
+            for node in class_def.body
+            if isinstance(node, ast.AnnAssign) and isinstance(node.target, ast.Name)
+        ]
+# Base class for app input models. It adds no fields or behaviour of its own;
+# it only inherits the ordered JSON-schema generation of OrderedSchemaModel.
+class BaseAppInput(OrderedSchemaModel):
+    pass
+# Base class for app output models. It adds no fields or behaviour of its own;
+# it only inherits the ordered JSON-schema generation of OrderedSchemaModel.
+class BaseAppOutput(OrderedSchemaModel):
+    pass
+class BaseApp(BaseModel):
+    # Base class for apps: subclasses must implement ``run``; ``setup`` and
+    # ``unload`` are no-ops unless overridden.
+    # Extra attributes and arbitrary (non-pydantic) types are permitted.
+    model_config = ConfigDict(extra='allow', arbitrary_types_allowed=True)
+    async def setup(self):
+        """Do nothing by default."""
+        return None
+    async def run(self, app_input: BaseAppInput) -> BaseAppOutput:
+        """Process ``app_input`` and return the app's output.
+        Raises:
+            NotImplementedError: Always, in this base implementation.
+        """
+        raise NotImplementedError("run method must be implemented")
+    async def unload(self):
+        """Do nothing by default."""
+        return None

inferencesh/models/file.py ADDED Viewed

@@ -0,0 +1,182 @@
+from typing import Optional, Union, Any
+from pydantic import BaseModel, Field, PrivateAttr, model_validator
+import mimetypes
+import os
+import urllib.request
+import urllib.parse
+import tempfile
+from tqdm import tqdm
+class File(BaseModel):
+    """A class representing a file in the inference.sh ecosystem."""
+    uri: Optional[str] = Field(default=None)  # Original location (URL or file path)
+    path: Optional[str] = None  # Resolved local file path
+    content_type: Optional[str] = None  # MIME type of the file
+    size: Optional[int] = None  # File size in bytes
+    filename: Optional[str] = None  # Original filename if available
+    _tmp_path: Optional[str] = PrivateAttr(default=None)  # Internal storage for temporary file path
+    def __init__(self, initializer=None, **data):
+        """Create a File from a URI string, another File, or field keywords.
+        Args:
+            initializer: Optional positional shortcut. A ``str`` is used as
+                ``uri``; a ``File`` is copied through ``model_dump()``, which
+                replaces any keyword data passed alongside it.
+            **data: Field values handed to the pydantic constructor.
+        Raises:
+            ValueError: If ``initializer`` is neither a ``str`` nor a ``File``.
+        """
+        if initializer is not None:
+            if isinstance(initializer, str):
+                data['uri'] = initializer
+            elif isinstance(initializer, File):
+                data = initializer.model_dump()
+            else:
+                raise ValueError(f'Invalid input for File: {initializer}')
+        super().__init__(**data)
+    @model_validator(mode='before')
+    @classmethod
+    def convert_str_to_file(cls, values):
+        """Accept a bare string as shorthand for ``{"uri": <string>}``.
+        Raises:
+            ValueError: If the raw input is neither a string nor a dict.
+        """
+        if isinstance(values, str):  # Only accept strings
+            return {"uri": values}
+        elif isinstance(values, dict):
+            return values
+        raise ValueError(f'Invalid input for File: {values}')
+    @model_validator(mode='after')
+    def validate_required_fields(self) -> 'File':
+        """Validate that either uri or path is provided."""
+        if not self.uri and not self.path:
+            raise ValueError("Either 'uri' or 'path' must be provided")
+        return self
+    def model_post_init(self, _: Any) -> None:
+        """Initialize file path and metadata after model creation.
+        This method handles:
+        1. Downloading URLs to local files if uri is a URL
+        2. Converting relative paths to absolute paths
+        3. Populating file metadata
+        Raises:
+            ValueError: If no local path could be resolved.
+            RuntimeError: If ``uri`` is a URL and the download fails.
+        """
+        # Handle uri if provided
+        if self.uri:
+            if self._is_url(self.uri):
+                self._download_url()
+            else:
+                # Convert relative paths to absolute, leave absolute paths unchanged
+                self.path = os.path.abspath(self.uri)
+        # Handle path if provided
+        if self.path:
+            # Convert relative paths to absolute, leave absolute paths unchanged
+            self.path = os.path.abspath(self.path)
+            self._populate_metadata()
+            return
+        raise ValueError("Either 'uri' or 'path' must be provided and be valid")
+    def _is_url(self, path: str) -> bool:
+        """Check if the path is an ``http`` or ``https`` URL."""
+        parsed = urllib.parse.urlparse(path)
+        return parsed.scheme in ('http', 'https')
+    def _download_url(self) -> None:
+        """Download ``self.uri`` to a temporary file and update ``self.path``.
+        Raises:
+            RuntimeError: If the request or the local write fails. Any partially
+                written temporary file is removed before the error is raised.
+        """
+        original_url = self.uri
+        try:
+            # Create a temporary file with a suffix based on the URL path
+            suffix = os.path.splitext(urllib.parse.urlparse(original_url).path)[1]
+            # Only the reserved name is needed; close the handle immediately so
+            # it is not leaked (the file is reopened for writing below).
+            with tempfile.NamedTemporaryFile(delete=False, suffix=suffix) as tmp_file:
+                self._tmp_path = tmp_file.name
+            # Set up request with user agent
+            headers = {
+                'User-Agent': (
+                    'Mozilla/5.0 (Windows NT 10.0; Win64; x64) '
+                    'AppleWebKit/537.36 (KHTML, like Gecko) '
+                    'Chrome/91.0.4472.124 Safari/537.36'
+                )
+            }
+            req = urllib.request.Request(original_url, headers=headers)
+            # Download the file with progress bar
+            print(f"Downloading URL: {original_url} to {self._tmp_path}")
+            try:
+                with urllib.request.urlopen(req) as response:
+                    total_size = int(response.headers.get('content-length', 0))
+                    block_size = 64 * 1024  # 64 KiB per read keeps the loop cheap
+                    # An unknown length is passed as None so the bar has no bogus 0 total.
+                    with tqdm(total=total_size or None, unit='iB', unit_scale=True) as pbar:
+                        with open(self._tmp_path, 'wb') as out_file:
+                            while True:
+                                buffer = response.read(block_size)
+                                if not buffer:
+                                    break
+                                out_file.write(buffer)
+                                pbar.update(len(buffer))
+                self.path = self._tmp_path
+            except (urllib.error.URLError, urllib.error.HTTPError) as e:
+                raise RuntimeError(f"Failed to download URL {original_url}: {str(e)}") from e
+            except IOError as e:
+                raise RuntimeError(f"Failed to write downloaded file to {self._tmp_path}: {str(e)}") from e
+        except Exception as e:
+            # Clean up temp file if something went wrong
+            if self._tmp_path:
+                try:
+                    os.unlink(self._tmp_path)
+                except (OSError, IOError):
+                    pass
+                # Forget the path so __del__ does not try to remove it again.
+                self._tmp_path = None
+            if isinstance(e, RuntimeError):
+                # Already carries a specific message; do not wrap it a second time.
+                raise
+            raise RuntimeError(f"Error downloading URL {original_url}: {str(e)}") from e
+    def __del__(self):
+        """Cleanup temporary file if it exists."""
+        if hasattr(self, '_tmp_path') and self._tmp_path:
+            try:
+                os.unlink(self._tmp_path)
+            except (OSError, IOError):
+                pass
+    def _populate_metadata(self) -> None:
+        """Populate file metadata from the path if it exists.
+        Only fields that are currently empty are filled in.
+        """
+        if os.path.exists(self.path):
+            if not self.content_type:
+                self.content_type = self._guess_content_type()
+            if not self.size:
+                self.size = self._get_file_size()
+            if not self.filename:
+                self.filename = self._get_filename()
+    @classmethod
+    def from_path(cls, path: Union[str, os.PathLike]) -> 'File':
+        """Create a File instance from a file path."""
+        return cls(uri=str(path))
+    def _guess_content_type(self) -> Optional[str]:
+        """Guess the MIME type of the file."""
+        return mimetypes.guess_type(self.path)[0]
+    def _get_file_size(self) -> int:
+        """Get the size of the file in bytes."""
+        return os.path.getsize(self.path)
+    def _get_filename(self) -> str:
+        """Get the base filename from the path."""
+        return os.path.basename(self.path)
+    def exists(self) -> bool:
+        """Check if the file exists."""
+        return os.path.exists(self.path)
+    def refresh_metadata(self) -> None:
+        """Refresh all metadata from the file, overwriting existing values."""
+        if os.path.exists(self.path):
+            self.content_type = self._guess_content_type()
+            self.size = self._get_file_size()  # Always update size
+            self.filename = self._get_filename()
+    @classmethod
+    def model_json_schema(cls, **kwargs):
+        """Return a schema accepting either a plain string or the full object."""
+        schema = super().model_json_schema(**kwargs)
+        schema["$id"] = "/schemas/File"
+        # Create a schema that accepts either a string or the full object
+        return {
+            "oneOf": [
+                {"type": "string"},  # Accept string input
+                schema  # Accept full object input
+            ]
+        }

inferencesh/models/llm.py ADDED Viewed

@@ -0,0 +1,356 @@
+from typing import Optional, List, Any, Callable, Dict, Generator
+from enum import Enum
+from pydantic import Field
+from queue import Queue
+from threading import Thread
+import time
+from contextlib import contextmanager
+from .base import BaseAppInput, BaseAppOutput
+from .file import File
+# Role of a message author. Members are also plain strings (str mixin), so
+# they compare equal to their lowercase values.
+class ContextMessageRole(str, Enum):
+    USER = "user"
+    ASSISTANT = "assistant"
+    SYSTEM = "system"
+# Minimal message: a role plus its text content (held in ``content``, whereas
+# ContextMessage uses ``text``).
+class Message(BaseAppInput):
+    role: ContextMessageRole
+    content: str
+# One message of conversation context: a role, its text, and an optional image.
+class ContextMessage(BaseAppInput):
+    role: ContextMessageRole = Field(
+        description="The role of the message",
+    )
+    text: str = Field(
+        description="The text content of the message"
+    )
+    # NOTE(review): the description says "image url" but the field type is File
+    # (which elsewhere in this package accepts a URL or a local path) — confirm wording.
+    image: Optional[File] = Field(
+        description="The image url of the message",
+        default=None
+    )
+# Input for a chat-style LLM call: system prompt, prior context messages, the
+# current user text with an optional image, and sampling/size parameters.
+class LLMInput(BaseAppInput):
+    system_prompt: str = Field(
+        description="The system prompt to use for the model",
+        default="You are a helpful assistant that can answer questions and help with tasks.",
+        examples=[
+            "You are a helpful assistant that can answer questions and help with tasks.",
+            "You are a certified medical professional who can provide accurate health information.",
+            "You are a certified financial advisor who can give sound investment guidance.",
+            "You are a certified cybersecurity expert who can explain security best practices.",
+            "You are a certified environmental scientist who can discuss climate and sustainability.",
+        ]
+    )
+    # The examples use the ContextMessage shape (role + text) so that each one
+    # is a valid value for this field.
+    context: List[ContextMessage] = Field(
+        description="The context to use for the model",
+        examples=[
+            [
+                {"role": "user", "text": "What is the capital of France?"},
+                {"role": "assistant", "text": "The capital of France is Paris."}
+            ],
+            [
+                {"role": "user", "text": "What is the weather like today?"},
+                {"role": "assistant", "text": "I apologize, but I don't have access to real-time weather information. You would need to check a weather service or app to get current weather conditions for your location."}
+            ],
+            [
+                {"role": "user", "text": "Can you help me write a poem about spring?"},
+                {"role": "assistant", "text": "Here's a short poem about spring:\n\nGreen buds awakening,\nSoft rain gently falling down,\nNew life springs anew.\n\nWarm sun breaks through clouds,\nBirds return with joyful song,\nNature's sweet rebirth."}
+            ],
+            [
+                {"role": "user", "text": "Explain quantum computing in simple terms"},
+                {"role": "assistant", "text": "Quantum computing is like having a super-powerful calculator that can solve many problems at once instead of one at a time. While regular computers use bits (0s and 1s), quantum computers use quantum bits or \"qubits\" that can be both 0 and 1 at the same time - kind of like being in two places at once! This allows them to process huge amounts of information much faster than regular computers for certain types of problems."}
+            ]
+        ],
+        default=[]
+    )
+    text: str = Field(
+        description="The user prompt to use for the model",
+        examples=[
+            "What is the capital of France?",
+            "What is the weather like today?",
+            "Can you help me write a poem about spring?",
+            "Explain quantum computing in simple terms"
+        ],
+    )
+    image: Optional[File] = Field(
+        description="The image to use for the model",
+        default=None
+    )
+    # Optional parameters
+    temperature: float = Field(default=0.7)
+    top_p: float = Field(default=0.95)
+    max_tokens: int = Field(default=4096)
+    context_size: int = Field(default=4096)
+    # Model specific flags
+    enable_thinking: bool = Field(default=False)
+# Usage and timing figures attached to an LLM output. Every field has a
+# zero/empty default.
+class LLMUsage(BaseAppOutput):
+    stop_reason: str = ""
+    time_to_first_token: float = 0.0
+    tokens_per_second: float = 0.0
+    prompt_tokens: int = 0
+    completion_tokens: int = 0
+    total_tokens: int = 0
+# Output of an LLM call: the response text (required), plus optional thinking
+# text and optional usage statistics.
+class LLMOutput(BaseAppOutput):
+    response: str
+    thinking_content: Optional[str] = None
+    usage: Optional[LLMUsage] = None
+@contextmanager
+def timing_context():
+    """Context manager to track timing information for LLM generation.
+    Yields:
+        An object exposing ``start_time`` and ``first_token_time``
+        (``time.time()`` values, the latter ``None`` until marked), a
+        ``mark_first_token()`` method and a read-only ``stats`` property.
+    """
+    class TimingInfo:
+        def __init__(self):
+            self.start_time = time.time()
+            self.first_token_time = None
+        def mark_first_token(self):
+            """Record the first-token time; calls after the first are no-ops."""
+            if self.first_token_time is None:
+                self.first_token_time = time.time()
+        @property
+        def stats(self):
+            """Return ``time_to_first_token`` and ``generation_time`` in seconds, measured up to now."""
+            end_time = time.time()
+            # With no token marked yet, "now" stands in for the first-token time
+            # in this snapshot only. The attribute is deliberately left untouched
+            # so that a later mark_first_token() still records the real time.
+            first_token_time = end_time if self.first_token_time is None else self.first_token_time
+            return {
+                "time_to_first_token": first_token_time - self.start_time,
+                "generation_time": end_time - first_token_time
+            }
+    yield TimingInfo()
+def build_messages(
+    input_data: LLMInput,
+    transform_user_message: Optional[Callable[[str], str]] = None
+) -> List[Dict[str, Any]]:
+    """Assemble the chat-completion message list for LLaMA.cpp.
+    The list starts with the system prompt, continues with every context
+    message in order, and ends with the current user message.
+    Args:
+        input_data: The input data
+        transform_user_message: Optional function applied to the text of
+            user-role context messages and of the final user message
+    Returns:
+        A list of ``{"role": ..., "content": [...]}`` dictionaries.
+    """
+    def _content_parts(text, owner):
+        # Text part first (if any), then at most one image part; the image's
+        # local path is preferred over its uri.
+        parts = []
+        if text:
+            parts.append({"type": "text", "text": text})
+        image = getattr(owner, 'image', None)
+        if image:
+            if image.path:
+                parts.append({"type": "image_url", "image_url": {"url": image.path}})
+            elif image.uri:
+                parts.append({"type": "image_url", "image_url": {"url": image.uri}})
+        return parts
+    system_message = {
+        "role": "system",
+        "content": [{"type": "text", "text": input_data.system_prompt}],
+    }
+    messages = [system_message]
+    # Context messages, in the order given
+    for ctx in input_data.context:
+        ctx_text = ctx.text
+        if transform_user_message and ctx.role == ContextMessageRole.USER:
+            ctx_text = transform_user_message(ctx_text)
+        messages.append({
+            "role": ctx.role,
+            "content": _content_parts(ctx_text, ctx)
+        })
+    # Current user message
+    prompt = input_data.text
+    if transform_user_message:
+        prompt = transform_user_message(prompt)
+    messages.append({"role": "user", "content": _content_parts(prompt, input_data)})
+    return messages
+def _split_thinking(piece, buffer, thinking_content, in_thinking, handle_thinking):
+    """Fold one streamed piece into the response buffer or the thinking text.
+    Returns the updated ``(buffer, thinking_content, in_thinking)`` triple.
+    """
+    if handle_thinking and "</think>" in piece:
+        if in_thinking:
+            # Text before the closing tag is thinking; text after it starts the response.
+            parts = piece.split("</think>")
+            thinking_content += parts[0].replace("<think>", "")
+            buffer = parts[1] if len(parts) > 1 else ""
+            in_thinking = False
+        else:
+            buffer += piece
+    elif in_thinking:
+        thinking_content += piece.replace("<think>", "")
+    else:
+        buffer += piece
+    return buffer, thinking_content, in_thinking
+def stream_generate(
+    model: Any,
+    messages: List[Dict[str, Any]],
+    output_cls: type[LLMOutput],
+    temperature: float = 0.7,
+    top_p: float = 0.95,
+    max_tokens: int = 4096,
+    stop: Optional[List[str]] = None,
+    handle_thinking: bool = False,
+    transform_response: Optional[Callable[[str, str], tuple[str, LLMOutput]]] = None,
+) -> Generator[LLMOutput, None, None]:
+    """Stream generate from LLaMA.cpp model with timing and usage tracking.
+    Generation runs in a daemon thread that pushes text pieces onto a queue;
+    this generator consumes the queue and yields one output per piece, then a
+    final output carrying the usage statistics.
+    Args:
+        model: The LLaMA.cpp model instance
+        messages: List of messages to send to the model
+        output_cls: Output class type to use for responses
+        temperature: Sampling temperature
+        top_p: Top-p sampling threshold
+        max_tokens: Maximum tokens to generate
+        stop: Optional list of stop sequences
+        handle_thinking: Whether to handle thinking tags
+        transform_response: Optional function to transform responses, takes (piece, buffer) and returns (new_buffer, output)
+    Yields:
+        Outputs with the accumulated response so far; the last one has
+        ``usage`` populated.
+    Raises:
+        Exception: Whatever the generation thread raised is re-raised here.
+    """
+    response_queue: Queue[Optional[tuple[str, dict]]] = Queue()
+    thread_exception = None
+    usage_stats = {
+        "prompt_tokens": 0,
+        "completion_tokens": 0,
+        "total_tokens": 0,
+        "stop_reason": ""
+    }
+    with timing_context() as timing:
+        def generation_thread():
+            nonlocal thread_exception, usage_stats
+            try:
+                completion = model.create_chat_completion(
+                    messages=messages,
+                    stream=True,
+                    temperature=temperature,
+                    top_p=top_p,
+                    max_tokens=max_tokens,
+                    stop=stop
+                )
+                for chunk in completion:
+                    # Get usage from root level if present
+                    if "usage" in chunk and chunk["usage"] is not None:
+                        usage_stats.update(chunk["usage"])
+                    # Get content from choices. A missing OR empty "choices"
+                    # list (e.g. a usage-only chunk) is treated as "no content"
+                    # instead of raising IndexError.
+                    choices = chunk.get("choices") or [{}]
+                    delta = choices[0]
+                    content = None
+                    finish_reason = None
+                    if "message" in delta:
+                        content = delta["message"].get("content", "")
+                        finish_reason = delta.get("finish_reason")
+                    elif "delta" in delta:
+                        content = delta["delta"].get("content", "")
+                        finish_reason = delta.get("finish_reason")
+                    if content:
+                        if not timing.first_token_time:
+                            timing.mark_first_token()
+                        response_queue.put((content, {}))
+                    if finish_reason:
+                        usage_stats["stop_reason"] = finish_reason
+            except Exception as e:
+                thread_exception = e
+            finally:
+                # Always enqueue the (None, stats) sentinel so the consumer terminates.
+                timing_stats = timing.stats
+                generation_time = timing_stats["generation_time"]
+                tokens_per_second = (usage_stats["completion_tokens"] / generation_time) if generation_time > 0 else 0
+                response_queue.put((None, {
+                    "time_to_first_token": timing_stats["time_to_first_token"],
+                    "tokens_per_second": tokens_per_second
+                }))
+        thread = Thread(target=generation_thread, daemon=True)
+        thread.start()
+        buffer = ""
+        thinking_content = "" if handle_thinking else None
+        in_thinking = handle_thinking
+        try:
+            while True:
+                try:
+                    result = response_queue.get(timeout=30.0)
+                    if thread_exception:
+                        raise thread_exception
+                    piece, timing_stats = result
+                    if piece is None:
+                        # Final yield with complete usage stats
+                        usage = LLMUsage(
+                            stop_reason=usage_stats["stop_reason"],
+                            time_to_first_token=timing_stats["time_to_first_token"],
+                            tokens_per_second=timing_stats["tokens_per_second"],
+                            prompt_tokens=usage_stats["prompt_tokens"],
+                            completion_tokens=usage_stats["completion_tokens"],
+                            total_tokens=usage_stats["total_tokens"]
+                        )
+                        if transform_response:
+                            buffer, output = transform_response("", buffer)
+                            output.usage = usage
+                            yield output
+                        else:
+                            # The sentinel carries no text, so nothing is folded
+                            # into the buffer here: just re-emit the accumulated
+                            # state together with the usage figures.
+                            yield output_cls(
+                                response=buffer.strip(),
+                                thinking_content=thinking_content.strip() if thinking_content else None,
+                                usage=usage
+                            )
+                        break
+                    if transform_response:
+                        buffer, output = transform_response(piece, buffer)
+                        yield output
+                    else:
+                        # Handle thinking vs response content if enabled
+                        buffer, thinking_content, in_thinking = _split_thinking(
+                            piece, buffer, thinking_content, in_thinking, handle_thinking
+                        )
+                        yield output_cls(
+                            response=buffer.strip(),
+                            thinking_content=thinking_content.strip() if thinking_content else None
+                        )
+                except Exception as e:
+                    if thread_exception and isinstance(e, thread_exception.__class__):
+                        raise thread_exception
+                    # NOTE(review): any other error (queue timeout after 30s,
+                    # a failing transform_response, output validation) ends the
+                    # stream silently, as before — confirm this is intended.
+                    break
+        finally:
+            if thread and thread.is_alive():
+                thread.join(timeout=2.0)

inferencesh/utils/__init__.py ADDED Viewed

@@ -0,0 +1,6 @@
+"""Utilities package for inference.sh SDK."""
+from .storage import StorageDir
+from .download import download
+__all__ = ["StorageDir", "download"]

inferencesh/utils/download.py ADDED Viewed

@@ -0,0 +1,51 @@
+import hashlib
+import os
+import urllib.parse
+import shutil
+from pathlib import Path
+from typing import Union
+from ..models.file import File
+from .storage import StorageDir
+def download(url: str, directory: Union[str, Path, StorageDir]) -> str:
+    """Download a file to the specified directory and return its path.
+    The file is stored as ``<directory>/<first 12 hex chars of sha256(url)>/<filename>``.
+    An existing file at that location is reused unless ``directory`` is the
+    temporary storage directory.
+    Args:
+        url: The URL to download from
+        directory: The directory to save the file to. Can be a string path,
+                  Path object, or StorageDir enum value.
+    Returns:
+        str: The path to the downloaded file
+    Raises:
+        RuntimeError: If the download did not produce a local file.
+    """
+    # Convert directory to Path. The enum's raw value is used explicitly so the
+    # result never depends on how a str-mixin Enum is stringified.
+    dir_path = Path(directory.value if isinstance(directory, StorageDir) else directory)
+    # parents=True: do not fail when intermediate directories are missing.
+    dir_path.mkdir(parents=True, exist_ok=True)
+    # Create hash directory from URL
+    url_hash = hashlib.sha256(url.encode()).hexdigest()[:12]
+    hash_dir = dir_path / url_hash
+    hash_dir.mkdir(exist_ok=True)
+    # Keep original filename
+    filename = os.path.basename(urllib.parse.urlparse(url).path)
+    if not filename:
+        filename = 'download'
+    output_path = hash_dir / filename
+    # If file exists in directory and it's not a temp directory, return it.
+    # Compare normalised paths so str, Path and StorageDir arguments that name
+    # the temp directory are all treated the same way.
+    is_temp_dir = dir_path == Path(StorageDir.TEMP.value)
+    if output_path.exists() and not is_temp_dir:
+        return str(output_path)
+    # Download the file
+    file = File(url)
+    if file.path:
+        # Move (not copy) so the temporary download is not left behind on disk.
+        shutil.move(file.path, str(output_path))
+        # The temporary file no longer exists at its old location; make sure
+        # the File instance does not try to delete it on garbage collection.
+        file._tmp_path = None
+        return str(output_path)
+    raise RuntimeError(f"Failed to download {url}")

inferencesh/utils/storage.py ADDED Viewed

@@ -0,0 +1,16 @@
+from enum import Enum
+from pathlib import Path
+class StorageDir(str, Enum):
+    """Standard storage directories used by the SDK."""
+    DATA = "/app/data"   # Persistent storage/cache directory
+    TEMP = "/app/tmp"    # Temporary storage directory
+    CACHE = "/app/cache" # Cache directory
+    @property
+    def path(self) -> Path:
+        """Return this directory as a ``Path``, creating it (with parents) when missing."""
+        directory = Path(self.value)
+        directory.mkdir(exist_ok=True, parents=True)
+        return directory

{inferencesh-0.2.7.dist-info → inferencesh-0.2.9.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: inferencesh
-Version: 0.2.7
+Version: 0.2.9
 Summary: inference.sh Python SDK
 Author: Inference Shell Inc.
 Author-email: "Inference Shell Inc." <hello@inference.sh>

inferencesh-0.2.9.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,14 @@
+inferencesh/__init__.py,sha256=H26z9pSgivkYfH2OfO5ff6emzmiV_Tc77umCRpdvg0Y,561
+inferencesh/models/__init__.py,sha256=CI9X3WyiXdRHUxKAwFuKSFCxrHwECPRrVJinJBugdP0,484
+inferencesh/models/base.py,sha256=4gZQRi8J7y9U6PrGD9pRIehd1MJVJAqGakPQDs2AKFM,3251
+inferencesh/models/file.py,sha256=5xnpypcRahM1YcEjj64rv9g2gTimxrZb41YT4r440hU,7393
+inferencesh/models/llm.py,sha256=jcBHgBK7uNTc1blfRqVBnYYfvGT952At7DL3NI_OKGc,14784
+inferencesh/utils/__init__.py,sha256=-xiD6uo2XzcrPAWFb_fUbaimmnW4KFKc-8IvBzaxNd4,148
+inferencesh/utils/download.py,sha256=7n5twvoNYDcFnKJyefImaj2YfzRI7vddQw4usZbj38c,1521
+inferencesh/utils/storage.py,sha256=E4J8emd4eFKdmdDgAqzz3TpaaDd3n0l8gYlMHuY8yIU,519
+inferencesh-0.2.9.dist-info/licenses/LICENSE,sha256=OsgqEWIh2el_QMj0y8O1A5Q5Dl-dxqqYbFE6fszuR4s,1086
+inferencesh-0.2.9.dist-info/METADATA,sha256=1vPRr6hhz0tbMYuY4CXd9AiAKs11DAiPjkvK_5yCqwY,2756
+inferencesh-0.2.9.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+inferencesh-0.2.9.dist-info/entry_points.txt,sha256=6IC-fyozAqW3ljsMLGCXxJ0_ui2Jb-2fLHtoH1RTnEE,45
+inferencesh-0.2.9.dist-info/top_level.txt,sha256=TSMHg3T1ThMl1HGAWmzBClwOYH1ump5neof9BfHIwaA,12
+inferencesh-0.2.9.dist-info/RECORD,,

{inferencesh-0.2.7.dist-info → inferencesh-0.2.9.dist-info}/WHEEL RENAMED Viewed

@@ -1,5 +1,5 @@
 Wheel-Version: 1.0
-Generator: setuptools (80.4.0)
+Generator: setuptools (80.9.0)
 Root-Is-Purelib: true
 Tag: py3-none-any

inferencesh/sdk.py DELETED Viewed

@@ -1,415 +0,0 @@
-from typing import Optional, Union
-from pydantic import BaseModel, ConfigDict, PrivateAttr, model_validator, Field, field_validator
-import mimetypes
-import os
-import urllib.request
-import urllib.parse
-import tempfile
-from typing import Any, Dict, List
-import inspect
-import ast
-import textwrap
-from collections import OrderedDict
-from enum import Enum
-import shutil
-from pathlib import Path
-import hashlib
-from tqdm import tqdm
-# inspired by https://github.com/pydantic/pydantic/issues/7580
-class OrderedSchemaModel(BaseModel):
-    """A base model that ensures the JSON schema properties and required fields are in the order of field definition."""
-    @classmethod
-    def model_json_schema(cls, by_alias: bool = True, **kwargs: Any) -> Dict[str, Any]:
-        schema = super().model_json_schema(by_alias=by_alias, **kwargs)
-        field_order = cls._get_field_order()
-        if field_order:
-            # Order properties
-            ordered_properties = OrderedDict()
-            for field_name in field_order:
-                if field_name in schema['properties']:
-                    ordered_properties[field_name] = schema['properties'][field_name]
-            # Add any remaining properties that weren't in field_order
-            for field_name, field_schema in schema['properties'].items():
-                if field_name not in ordered_properties:
-                    ordered_properties[field_name] = field_schema
-            schema['properties'] = ordered_properties
-            # Order required fields
-            if 'required' in schema:
-                ordered_required = [field for field in field_order if field in schema['required']]
-                # Add any remaining required fields that weren't in field_order
-                ordered_required.extend([field for field in schema['required'] if field not in ordered_required])
-                schema['required'] = ordered_required
-        return schema
-    @classmethod
-    def _get_field_order(cls) -> List[str]:
-        """Get the order of fields as they were defined in the class."""
-        source = inspect.getsource(cls)
-        # Unindent the entire source code
-        source = textwrap.dedent(source)
-        try:
-            module = ast.parse(source)
-        except IndentationError:
-            # If we still get an IndentationError, wrap the class in a dummy module
-            source = f"class DummyModule:\n{textwrap.indent(source, '    ')}"
-            module = ast.parse(source)
-            # Adjust to look at the first class def inside DummyModule
-            # noinspection PyUnresolvedReferences
-            class_def = module.body[0].body[0]
-        else:
-            # Find the class definition
-            class_def = next(
-                node for node in module.body if isinstance(node, ast.ClassDef) and node.name == cls.__name__
-            )
-        # Extract field names in the order they were defined
-        field_order = []
-        for node in class_def.body:
-            if isinstance(node, ast.AnnAssign) and isinstance(node.target, ast.Name):
-                field_order.append(node.target.id)
-        return field_order
-class BaseAppInput(OrderedSchemaModel):
-    pass
-class BaseAppOutput(OrderedSchemaModel):
-    pass
-class BaseApp(BaseModel):
-    model_config = ConfigDict(
-        arbitrary_types_allowed=True,
-        extra='allow'
-    )
-    async def setup(self):
-        pass
-    async def run(self, app_input: BaseAppInput) -> BaseAppOutput:
-        raise NotImplementedError("run method must be implemented")
-    async def unload(self):
-        pass
-class File(BaseModel):
-    """A class representing a file in the inference.sh ecosystem."""
-    uri: Optional[str] = Field(default=None)  # Original location (URL or file path)
-    path: Optional[str] = None  # Resolved local file path
-    content_type: Optional[str] = None  # MIME type of the file
-    size: Optional[int] = None  # File size in bytes
-    filename: Optional[str] = None  # Original filename if available
-    _tmp_path: Optional[str] = PrivateAttr(default=None)  # Internal storage for temporary file path
-    def __init__(self, initializer=None, **data):
-        if initializer is not None:
-            if isinstance(initializer, str):
-                data['uri'] = initializer
-            elif isinstance(initializer, File):
-                data = initializer.model_dump()
-            else:
-                raise ValueError(f'Invalid input for File: {initializer}')
-        super().__init__(**data)
-    @model_validator(mode='before')
-    @classmethod
-    def convert_str_to_file(cls, values):
-        if isinstance(values, str):  # Only accept strings
-            return {"uri": values}
-        elif isinstance(values, dict):
-            return values
-        raise ValueError(f'Invalid input for File: {values}')
-    @model_validator(mode='after')
-    def validate_required_fields(self) -> 'File':
-        """Validate that either uri or path is provided."""
-        if not self.uri and not self.path:
-            raise ValueError("Either 'uri' or 'path' must be provided")
-        return self
-    def model_post_init(self, _: Any) -> None:
-        """Initialize file path and metadata after model creation.
-        This method handles:
-        1. Downloading URLs to local files if uri is a URL
-        2. Converting relative paths to absolute paths
-        3. Populating file metadata
-        """
-        # Handle uri if provided
-        if self.uri:
-            if self._is_url(self.uri):
-                self._download_url()
-            else:
-                # Convert relative paths to absolute, leave absolute paths unchanged
-                self.path = os.path.abspath(self.uri)
-        # Handle path if provided
-        if self.path:
-            # Convert relative paths to absolute, leave absolute paths unchanged
-            self.path = os.path.abspath(self.path)
-            self._populate_metadata()
-            return
-        raise ValueError("Either 'uri' or 'path' must be provided and be valid")
-    def _is_url(self, path: str) -> bool:
-        """Check if the path is a URL."""
-        parsed = urllib.parse.urlparse(path)
-        return parsed.scheme in ('http', 'https')
-    def _download_url(self) -> None:
-        """Download the URL to a temporary file and update the path."""
-        original_url = self.uri
-        tmp_file = None
-        try:
-            # Create a temporary file with a suffix based on the URL path
-            suffix = os.path.splitext(urllib.parse.urlparse(original_url).path)[1]
-            tmp_file = tempfile.NamedTemporaryFile(delete=False, suffix=suffix)
-            self._tmp_path = tmp_file.name
-            # Set up request with user agent
-            headers = {
-                'User-Agent': (
-                    'Mozilla/5.0 (Windows NT 10.0; Win64; x64) '
-                    'AppleWebKit/537.36 (KHTML, like Gecko) '
-                    'Chrome/91.0.4472.124 Safari/537.36'
-                )
-            }
-            req = urllib.request.Request(original_url, headers=headers)
-            # Download the file with progress bar
-            print(f"Downloading URL: {original_url} to {self._tmp_path}")
-            try:
-                with urllib.request.urlopen(req) as response:
-                    total_size = int(response.headers.get('content-length', 0))
-                    block_size = 1024  # 1 Kibibyte
-                    with tqdm(total=total_size, unit='iB', unit_scale=True) as pbar:
-                        with open(self._tmp_path, 'wb') as out_file:
-                            while True:
-                                buffer = response.read(block_size)
-                                if not buffer:
-                                    break
-                                out_file.write(buffer)
-                                pbar.update(len(buffer))
-                self.path = self._tmp_path
-            except (urllib.error.URLError, urllib.error.HTTPError) as e:
-                raise RuntimeError(f"Failed to download URL {original_url}: {str(e)}")
-            except IOError as e:
-                raise RuntimeError(f"Failed to write downloaded file to {self._tmp_path}: {str(e)}")
-        except Exception as e:
-            # Clean up temp file if something went wrong
-            if tmp_file is not None and hasattr(self, '_tmp_path'):
-                try:
-                    os.unlink(self._tmp_path)
-                except (OSError, IOError):
-                    pass
-            raise RuntimeError(f"Error downloading URL {original_url}: {str(e)}")
-    def __del__(self):
-        """Cleanup temporary file if it exists."""
-        if hasattr(self, '_tmp_path') and self._tmp_path:
-            try:
-                os.unlink(self._tmp_path)
-            except (OSError, IOError):
-                pass
-    def _populate_metadata(self) -> None:
-        """Populate file metadata from the path if it exists."""
-        if os.path.exists(self.path):
-            if not self.content_type:
-                self.content_type = self._guess_content_type()
-            if not self.size:
-                self.size = self._get_file_size()
-            if not self.filename:
-                self.filename = self._get_filename()
-    @classmethod
-    def from_path(cls, path: Union[str, os.PathLike]) -> 'File':
-        """Create a File instance from a file path."""
-        return cls(uri=str(path))
-    def _guess_content_type(self) -> Optional[str]:
-        """Guess the MIME type of the file."""
-        return mimetypes.guess_type(self.path)[0]
-    def _get_file_size(self) -> int:
-        """Get the size of the file in bytes."""
-        return os.path.getsize(self.path)
-    def _get_filename(self) -> str:
-        """Get the base filename from the path."""
-        return os.path.basename(self.path)
-    def exists(self) -> bool:
-        """Check if the file exists."""
-        return os.path.exists(self.path)
-    def refresh_metadata(self) -> None:
-        """Refresh all metadata from the file."""
-        if os.path.exists(self.path):
-            self.content_type = self._guess_content_type()
-            self.size = self._get_file_size()  # Always update size
-            self.filename = self._get_filename()
-    @classmethod
-    def model_json_schema(cls, **kwargs):
-        schema = super().model_json_schema(**kwargs)
-        schema["$id"] = "/schemas/File"
-        # Create a schema that accepts either a string or the full object
-        return {
-            "oneOf": [
-                {"type": "string"},  # Accept string input
-                schema  # Accept full object input
-            ]
-        }
-class ContextMessageRole(str, Enum):
-    USER = "user"
-    ASSISTANT = "assistant"
-    SYSTEM = "system"
-class Message(BaseModel):
-    role: ContextMessageRole
-    content: str
-class ContextMessage(BaseModel):
-    role: ContextMessageRole = Field(
-        description="The role of the message",
-    )
-    text: str = Field(
-        description="The text content of the message"
-    )
-class ContextMessageWithImage(ContextMessage):
-    image: Optional[File] = Field(
-        description="The image url of the message",
-        default=None
-    )
-class LLMInput(BaseAppInput):
-    system_prompt: str = Field(
-        description="The system prompt to use for the model",
-        default="You are a helpful assistant that can answer questions and help with tasks.",
-        examples=[
-            "You are a helpful assistant that can answer questions and help with tasks.",
-            "You are a certified medical professional who can provide accurate health information.",
-            "You are a certified financial advisor who can give sound investment guidance.",
-            "You are a certified cybersecurity expert who can explain security best practices.",
-            "You are a certified environmental scientist who can discuss climate and sustainability.",
-        ]
-    )
-    context: list[ContextMessage] = Field(
-        description="The context to use for the model",
-        examples=[
-            [
-                {"role": "user", "content": [{"type": "text", "text": "What is the capital of France?"}]},
-                {"role": "assistant", "content": [{"type": "text", "text": "The capital of France is Paris."}]}
-            ],
-            [
-                {"role": "user", "content": [{"type": "text", "text": "What is the weather like today?"}]},
-                {"role": "assistant", "content": [{"type": "text", "text": "I apologize, but I don't have access to real-time weather information. You would need to check a weather service or app to get current weather conditions for your location."}]}
-            ],
-            [
-                {"role": "user", "content": [{"type": "text", "text": "Can you help me write a poem about spring?"}]},
-                {"role": "assistant", "content": [{"type": "text", "text": "Here's a short poem about spring:\n\nGreen buds awakening,\nSoft rain gently falling down,\nNew life springs anew.\n\nWarm sun breaks through clouds,\nBirds return with joyful song,\nNature's sweet rebirth."}]}
-            ],
-            [
-                {"role": "user", "content": [{"type": "text", "text": "Explain quantum computing in simple terms"}]},
-                {"role": "assistant", "content": [{"type": "text", "text": "Quantum computing is like having a super-powerful calculator that can solve many problems at once instead of one at a time. While regular computers use bits (0s and 1s), quantum computers use quantum bits or \"qubits\" that can be both 0 and 1 at the same time - kind of like being in two places at once! This allows them to process huge amounts of information much faster than regular computers for certain types of problems."}]}
-            ]
-        ],
-        default=[]
-    )
-    text: str = Field(
-        description="The user prompt to use for the model",
-        examples=[
-            "What is the capital of France?",
-            "What is the weather like today?",
-            "Can you help me write a poem about spring?",
-            "Explain quantum computing in simple terms"
-        ],
-    )
-class LLMInputWithImage(LLMInput):
-    context: list[ContextMessageWithImage] = Field(
-        description="The context to use for the model",
-        examples=[
-            [
-                {"role": "user", "content": [{"type": "text", "text": "What is the capital of France?"}, {"type": "image", "url": "https://example.com/image.jpg"}]},
-                {"role": "assistant", "content": [{"type": "text", "text": "The capital of France is Paris."}]}
-            ],
-        ],
-        default=[]
-    )
-    image: Optional[File] = Field(
-        description="The image to use for the model",
-        default=None
-    )
-class StorageDir(str, Enum):
-    """Standard storage directories used by the SDK."""
-    DATA = "/app/data"   # Persistent storage/cache directory
-    TEMP = "/app/tmp"    # Temporary storage directory
-    CACHE = "/app/cache" # Cache directory
-    @property
-    def path(self) -> Path:
-        """Get the Path object for this storage directory, ensuring it exists."""
-        path = Path(self.value)
-        path.mkdir(parents=True, exist_ok=True)
-        return path
-def download(url: str, directory: Union[str, Path, StorageDir]) -> str:
-    """Download a file to the specified directory and return its path.
-    Args:
-        url: The URL to download from
-        directory: The directory to save the file to. Can be a string path,
-                  Path object, or StorageDir enum value.
-    Returns:
-        str: The path to the downloaded file
-    """
-    # Convert directory to Path
-    dir_path = Path(directory)
-    dir_path.mkdir(exist_ok=True)
-    # Create hash directory from URL
-    url_hash = hashlib.sha256(url.encode()).hexdigest()[:12]
-    hash_dir = dir_path / url_hash
-    hash_dir.mkdir(exist_ok=True)
-    # Keep original filename
-    filename = os.path.basename(urllib.parse.urlparse(url).path)
-    if not filename:
-        filename = 'download'
-    output_path = hash_dir / filename
-    # If file exists in directory and it's not a temp directory, return it
-    if output_path.exists() and directory != StorageDir.TEMP:
-        return str(output_path)
-    # Download the file
-    file = File(url)
-    if file.path:
-        shutil.copy2(file.path, output_path)
-        # Prevent the File instance from deleting its temporary file
-        file._tmp_path = None
-        return str(output_path)
-    raise RuntimeError(f"Failed to download {url}")

inferencesh-0.2.7.dist-info/RECORD DELETED Viewed

@@ -1,8 +0,0 @@
-inferencesh/__init__.py,sha256=hbKkgHCh0lCdhWyHs3FHHRd8JfLeHkTd1bT4v79Fi8M,192
-inferencesh/sdk.py,sha256=raPhrMovMiZ_di0IwT5bgwATe6avxSs0KBUtzes20R4,16704
-inferencesh-0.2.7.dist-info/licenses/LICENSE,sha256=OsgqEWIh2el_QMj0y8O1A5Q5Dl-dxqqYbFE6fszuR4s,1086
-inferencesh-0.2.7.dist-info/METADATA,sha256=UFRubSIB78URLW_ddkZl18xYrl2xkJUiSNFxUCJwFyY,2756
-inferencesh-0.2.7.dist-info/WHEEL,sha256=DnLRTWE75wApRYVsjgc6wsVswC54sMSJhAEd4xhDpBk,91
-inferencesh-0.2.7.dist-info/entry_points.txt,sha256=6IC-fyozAqW3ljsMLGCXxJ0_ui2Jb-2fLHtoH1RTnEE,45
-inferencesh-0.2.7.dist-info/top_level.txt,sha256=TSMHg3T1ThMl1HGAWmzBClwOYH1ump5neof9BfHIwaA,12
-inferencesh-0.2.7.dist-info/RECORD,,

{inferencesh-0.2.7.dist-info → inferencesh-0.2.9.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{inferencesh-0.2.7.dist-info → inferencesh-0.2.9.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

{inferencesh-0.2.7.dist-info → inferencesh-0.2.9.dist-info}/top_level.txt RENAMED Viewed

File without changes

inferencesh 0.2.7__py3-none-any.whl → 0.2.9__py3-none-any.whl

inferencesh-0.2.7-py3-none-any.whl → inferencesh-0.2.9-py3-none-any.whl