model-library 0.1.0-py3-none-any.whl → 0.1.2-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (42)
  1. model_library/__init__.py +7 -3
  2. model_library/base/__init__.py +7 -0
  3. model_library/{base.py → base/base.py} +47 -423
  4. model_library/base/batch.py +121 -0
  5. model_library/base/delegate_only.py +94 -0
  6. model_library/base/input.py +100 -0
  7. model_library/base/output.py +175 -0
  8. model_library/base/utils.py +42 -0
  9. model_library/config/all_models.json +164 -2
  10. model_library/config/anthropic_models.yaml +4 -0
  11. model_library/config/deepseek_models.yaml +3 -1
  12. model_library/config/openai_models.yaml +48 -0
  13. model_library/exceptions.py +2 -0
  14. model_library/logging.py +30 -0
  15. model_library/providers/__init__.py +0 -0
  16. model_library/providers/ai21labs.py +2 -0
  17. model_library/providers/alibaba.py +16 -78
  18. model_library/providers/amazon.py +3 -0
  19. model_library/providers/anthropic.py +213 -2
  20. model_library/providers/azure.py +2 -0
  21. model_library/providers/cohere.py +14 -80
  22. model_library/providers/deepseek.py +14 -90
  23. model_library/providers/fireworks.py +17 -81
  24. model_library/providers/google/google.py +22 -20
  25. model_library/providers/inception.py +15 -83
  26. model_library/providers/kimi.py +15 -83
  27. model_library/providers/mistral.py +2 -0
  28. model_library/providers/openai.py +2 -0
  29. model_library/providers/perplexity.py +12 -79
  30. model_library/providers/together.py +2 -0
  31. model_library/providers/vals.py +2 -0
  32. model_library/providers/xai.py +2 -0
  33. model_library/providers/zai.py +15 -83
  34. model_library/register_models.py +75 -55
  35. model_library/registry_utils.py +5 -5
  36. model_library/utils.py +3 -28
  37. {model_library-0.1.0.dist-info → model_library-0.1.2.dist-info}/METADATA +36 -7
  38. model_library-0.1.2.dist-info/RECORD +61 -0
  39. model_library-0.1.0.dist-info/RECORD +0 -53
  40. {model_library-0.1.0.dist-info → model_library-0.1.2.dist-info}/WHEEL +0 -0
  41. {model_library-0.1.0.dist-info → model_library-0.1.2.dist-info}/licenses/LICENSE +0 -0
  42. {model_library-0.1.0.dist-info → model_library-0.1.2.dist-info}/top_level.txt +0 -0
model_library/base/delegate_only.py
@@ -0,0 +1,94 @@
+import io
+from typing import Any, Literal, Sequence
+
+from typing_extensions import override
+
+from model_library.base import (
+    LLM,
+    FileInput,
+    FileWithId,
+    InputItem,
+    LLMConfig,
+    QueryResult,
+    ToolDefinition,
+)
+
+
+class DelegateOnlyException(Exception):
+    """
+    Raised when native model functionality is performed on a
+    delegate-only model.
+    """
+
+    DEFAULT_MESSAGE: str = "This model supports only delegate-only functionality. Only the query() method should be used."
+
+    def __init__(self, message: str | None = None):
+        super().__init__(message or DelegateOnlyException.DEFAULT_MESSAGE)
+
+
+class DelegateOnly(LLM):
+    @override
+    def get_client(self) -> None:
+        raise DelegateOnlyException()
+
+    def __init__(
+        self,
+        model_name: str,
+        provider: str,
+        *,
+        config: LLMConfig | None = None,
+    ):
+        config = config or LLMConfig()
+        config.native = False
+        super().__init__(model_name, provider, config=config)
+
+    @override
+    async def _query_impl(
+        self,
+        input: Sequence[InputItem],
+        *,
+        tools: list[ToolDefinition],
+        **kwargs: object,
+    ) -> QueryResult:
+        assert self.delegate
+
+        return await self.delegate_query(input, tools=tools, **kwargs)
+
+    @override
+    async def parse_input(
+        self,
+        input: Sequence[InputItem],
+        **kwargs: Any,
+    ) -> Any:
+        raise DelegateOnlyException()
+
+    @override
+    async def parse_image(
+        self,
+        image: FileInput,
+    ) -> Any:
+        raise DelegateOnlyException()
+
+    @override
+    async def parse_file(
+        self,
+        file: FileInput,
+    ) -> Any:
+        raise DelegateOnlyException()
+
+    @override
+    async def parse_tools(
+        self,
+        tools: list[ToolDefinition],
+    ) -> Any:
+        raise DelegateOnlyException()
+
+    @override
+    async def upload_file(
+        self,
+        name: str,
+        mime: str,
+        bytes: io.BytesIO,
+        type: Literal["image", "file"] = "file",
+    ) -> FileWithId:
+        raise DelegateOnlyException()
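The new `DelegateOnly` base turns every native entry point into a `DelegateOnlyException`, leaving `query()` (routed through `delegate_query`) as the only supported path. A minimal sketch of the guard behavior; the model and provider names are invented, and the diff does not show whether the base `LLM` permits direct instantiation like this:

```python
from model_library.base.delegate_only import DelegateOnly, DelegateOnlyException

# Illustrative only: names are made up for the example.
model = DelegateOnly("example-model", "example-provider")

try:
    model.get_client()  # native functionality -> guarded
except DelegateOnlyException as exc:
    print(exc)  # "This model supports only delegate-only functionality. ..."
```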
model_library/base/input.py
@@ -0,0 +1,100 @@
+from pprint import pformat
+from typing import Annotated, Any, Literal
+
+from pydantic import BaseModel, Field
+from typing_extensions import override
+
+from model_library.utils import truncate_str
+
+"""
+--- FILES ---
+"""
+
+
+class FileBase(BaseModel):
+    type: Literal["image", "file"]
+    name: str
+    mime: str
+
+    @override
+    def __repr__(self):
+        attrs = vars(self).copy()
+        if "base64" in attrs:
+            attrs["base64"] = truncate_str(attrs["base64"])
+        return f"{self.__class__.__name__}(\n{pformat(attrs, indent=2)}\n)"
+
+
+class FileWithBase64(FileBase):
+    append_type: Literal["base64"] = "base64"
+    base64: str
+
+
+class FileWithUrl(FileBase):
+    append_type: Literal["url"] = "url"
+    url: str
+
+
+class FileWithId(FileBase):
+    append_type: Literal["file_id"] = "file_id"
+    file_id: str
+
+
+FileInput = Annotated[
+    FileWithBase64 | FileWithUrl | FileWithId,
+    Field(discriminator="append_type"),
+]
+
+
+"""
+--- TOOLS ---
+"""
+
+
+class ToolBody(BaseModel):
+    name: str
+    description: str
+    properties: dict[str, Any]
+    required: list[str]
+    kwargs: dict[str, Any] = {}
+
+
+class ToolDefinition(BaseModel):
+    name: str  # acts as a key
+    body: ToolBody | Any
+
+
+class ToolCall(BaseModel):
+    id: str
+    call_id: str | None = None
+    name: str
+    args: dict[str, Any] | str
+
+
+"""
+--- INPUT ---
+"""
+
+RawResponse = Any
+
+
+class ToolInput(BaseModel):
+    tools: list[ToolDefinition] = []
+
+
+class ToolResult(BaseModel):
+    tool_call: ToolCall
+    result: Any
+
+
+class TextInput(BaseModel):
+    text: str
+
+
+RawInputItem = dict[
+    str, Any
+]  # to pass in, for example, a mock conversation with {"role": "user", "content": "Hello"}
+
+
+InputItem = (
+    TextInput | FileInput | ToolResult | RawInputItem | RawResponse
+)  # an input item can be a prompt, a file (image or file), a tool call result, raw input, or a previous response
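`FileInput` is a pydantic discriminated union keyed on `append_type`, so a plain dict payload resolves to the right concrete class. A standalone sketch of that resolution using pydantic v2's `TypeAdapter` (the payload values are invented):

```python
from pydantic import TypeAdapter

from model_library.base.input import FileInput, FileWithUrl

adapter = TypeAdapter(FileInput)
parsed = adapter.validate_python(
    {
        "type": "image",
        "name": "chart.png",
        "mime": "image/png",
        "append_type": "url",  # discriminator selects FileWithUrl
        "url": "https://example.com/chart.png",
    }
)
assert isinstance(parsed, FileWithUrl)
```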
model_library/base/output.py
@@ -0,0 +1,175 @@
+"""
+--- OUTPUT ---
+"""
+
+from pprint import pformat
+from typing import Any, Mapping, Sequence, cast
+
+from pydantic import BaseModel, Field, computed_field, field_validator
+from typing_extensions import override
+
+from model_library.base.input import InputItem, ToolCall
+from model_library.base.utils import (
+    sum_optional,
+)
+from model_library.utils import truncate_str
+
+
+class Citation(BaseModel):
+    type: str | None = None
+    title: str | None = None
+    url: str | None = None
+    start_index: int | None = None
+    end_index: int | None = None
+    file_id: str | None = None
+    filename: str | None = None
+    index: int | None = None
+    container_id: str | None = None
+
+
+class QueryResultExtras(BaseModel):
+    citations: list[Citation] = Field(default_factory=list)
+
+
+class QueryResultCost(BaseModel):
+    """
+    Cost information for a query.
+    Includes total cost and a structured breakdown.
+    """
+
+    input: float
+    output: float
+    reasoning: float | None = None
+    cache_read: float | None = None
+    cache_write: float | None = None
+
+    @computed_field
+    @property
+    def total(self) -> float:
+        return sum(
+            filter(
+                None,
+                [
+                    self.input,
+                    self.output,
+                    self.reasoning,
+                    self.cache_read,
+                    self.cache_write,
+                ],
+            )
+        )
+
+    @override
+    def __repr__(self):
+        use_cents = self.total < 1
+
+        def format_cost(value: float | None):
+            if value is None:
+                return None
+            return f"{value * 100:.3f} cents" if use_cents else f"${value:.2f}"
+
+        return (
+            f"{format_cost(self.total)} "
+            + f"(uncached input: {format_cost(self.input)} | output: {format_cost(self.output)} | reasoning: {format_cost(self.reasoning)} | cache_read: {format_cost(self.cache_read)} | cache_write: {format_cost(self.cache_write)})"
+        )
+
+
+class QueryResultMetadata(BaseModel):
+    """
+    Metadata for a query: token usage and timing.
+    """
+
+    cost: QueryResultCost | None = None  # set post query
+    duration_seconds: float | None = None  # set post query
+    in_tokens: int = 0
+    out_tokens: int = 0
+    reasoning_tokens: int | None = None
+    cache_read_tokens: int | None = None
+    cache_write_tokens: int | None = None
+
+    @property
+    def default_duration_seconds(self) -> float:
+        return self.duration_seconds or 0
+
+    def __add__(self, other: "QueryResultMetadata") -> "QueryResultMetadata":
+        return QueryResultMetadata(
+            in_tokens=self.in_tokens + other.in_tokens,
+            out_tokens=self.out_tokens + other.out_tokens,
+            reasoning_tokens=sum_optional(
+                self.reasoning_tokens, other.reasoning_tokens
+            ),
+            cache_read_tokens=sum_optional(
+                self.cache_read_tokens, other.cache_read_tokens
+            ),
+            cache_write_tokens=sum_optional(
+                self.cache_write_tokens, other.cache_write_tokens
+            ),
+            duration_seconds=self.default_duration_seconds
+            + other.default_duration_seconds,
+        )
+
+    @override
+    def __repr__(self):
+        attrs = vars(self).copy()
+        return f"{self.__class__.__name__}(\n{pformat(attrs, indent=2, sort_dicts=False)}\n)"
+
+
+class QueryResult(BaseModel):
+    """
+    Result of a query.
+    Contains the text, reasoning, metadata, tool calls, and history.
+    """
+
+    output_text: str | None = None
+    reasoning: str | None = None
+    metadata: QueryResultMetadata = Field(default_factory=QueryResultMetadata)
+    tool_calls: list[ToolCall] = Field(default_factory=list)
+    history: list[InputItem] = Field(default_factory=list)
+    extras: QueryResultExtras = Field(default_factory=QueryResultExtras)
+    raw: dict[str, Any] = Field(default_factory=dict)
+
+    @property
+    def output_text_str(self) -> str:
+        return self.output_text or ""
+
+    @field_validator("reasoning", mode="before")
+    def default_reasoning(cls, v: str | None):
+        return None if not v else v  # make reasoning None if empty
+
+    @property
+    def search_results(self) -> Any | None:
+        """Expose provider-supplied search metadata without additional processing."""
+        raw_dict = cast(dict[str, Any], getattr(self, "raw", {}))
+        raw_candidate = raw_dict.get("search_results")
+        if raw_candidate is not None:
+            return raw_candidate
+
+        return _get_from_history(self.history, "search_results")
+
+    @override
+    def __repr__(self):
+        attrs = vars(self).copy()
+        ordered_attrs = {
+            "output_text": truncate_str(attrs.pop("output_text", None), 400),
+            "reasoning": truncate_str(attrs.pop("reasoning", None), 400),
+            "metadata": attrs.pop("metadata", None),
+        }
+        if self.tool_calls:
+            ordered_attrs["tool_calls"] = self.tool_calls
+        return f"{self.__class__.__name__}(\n{pformat(ordered_attrs, indent=2, sort_dicts=False)}\n)"
+
+
+def _get_from_history(history: Sequence[InputItem], key: str) -> Any | None:
+    for item in reversed(history):
+        value = getattr(item, key, None)
+        if value is not None:
+            return value
+
+        extra = getattr(item, "model_extra", None)
+        if isinstance(extra, Mapping):
+            value = cast(Mapping[str, Any], extra).get(key)
+            if value is not None:
+                return value
+
+    return None
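`QueryResultMetadata.__add__` merges usage across calls, and because it goes through `sum_optional`, counters a provider never reported stay `None` instead of silently becoming 0. An illustrative aggregation (token counts invented):

```python
from model_library.base.output import QueryResultMetadata

first = QueryResultMetadata(in_tokens=1200, out_tokens=300, duration_seconds=2.5)
second = QueryResultMetadata(in_tokens=800, out_tokens=100, reasoning_tokens=50)

combined = first + second
assert combined.in_tokens == 2000 and combined.out_tokens == 400
assert combined.reasoning_tokens == 50      # None + 50 -> 50
assert combined.cache_read_tokens is None   # both unknown -> still unknown
assert combined.duration_seconds == 2.5     # missing duration treated as 0
```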
model_library/base/utils.py
@@ -0,0 +1,42 @@
+from typing import Sequence, cast
+
+from model_library.base.input import (
+    FileBase,
+    InputItem,
+    RawInputItem,
+    TextInput,
+    ToolResult,
+)
+from model_library.utils import truncate_str
+
+
+def sum_optional(a: int | None, b: int | None) -> int | None:
+    """Sum two optional integers, returning None if both are None.
+
+    Preserves None to indicate "unknown/not provided" when both inputs are None,
+    otherwise treats None as 0 for summation.
+    """
+    if a is None and b is None:
+        return None
+    return (a or 0) + (b or 0)
+
+
+def get_pretty_input_types(input: Sequence["InputItem"]) -> str:
+    # for logging
+    def process_item(item: "InputItem"):
+        match item:
+            case TextInput():
+                return truncate_str(repr(item))
+            case FileBase():  # FileInput
+                return repr(item)
+            case ToolResult():
+                return repr(item)
+            case dict():
+                item = cast(RawInputItem, item)
+                return repr(item)
+            case _:
+                # RawResponse
+                return repr(item)
+
+    processed_items = [f" {process_item(item)}" for item in input]
+    return "\n" + "\n".join(processed_items) if processed_items else ""
model_library/config/all_models.json
@@ -1,4 +1,148 @@
 {
+  "openai/gpt-5.1-codex-mini": {
+    "company": "OpenAI",
+    "label": "GPT 5.1 Codex Mini",
+    "description": "OpenAI's miniature coding model",
+    "release_date": "2025-11-13",
+    "open_source": false,
+    "documentation_url": "https://platform.openai.com/docs/models/gpt-5.1-codex-mini",
+    "properties": {
+      "context_window": 400000,
+      "max_token_output": 128000,
+      "training_cutoff": null,
+      "reasoning_model": true
+    },
+    "class_properties": {
+      "supports_images": true,
+      "supports_files": true,
+      "supports_batch_requests": true,
+      "supports_temperature": false,
+      "supports_tools": true,
+      "deprecated": false,
+      "available_for_everyone": false,
+      "available_as_evaluator": false,
+      "ignored_for_cost": false
+    },
+    "provider_properties": {},
+    "costs_per_million_token": {
+      "input": 0.25,
+      "output": 2.0,
+      "cache": {
+        "read": 0.025,
+        "write_markup": 1.0
+      },
+      "batch": {
+        "input_discount": 0.5,
+        "output_discount": 0.5
+      }
+    },
+    "alternative_keys": [],
+    "default_parameters": {
+      "max_output_tokens": 128000,
+      "temperature": 1.0,
+      "reasoning_effort": "high"
+    },
+    "provider_name": "openai",
+    "provider_endpoint": "gpt-5.1-codex-mini",
+    "full_key": "openai/gpt-5.1-codex-mini",
+    "slug": "openai_gpt-5.1-codex-mini"
+  },
+  "openai/gpt-5.1-codex": {
+    "company": "OpenAI",
+    "label": "GPT 5.1 Codex",
+    "description": "OpenAI's latest coding model",
+    "release_date": "2025-11-13",
+    "open_source": false,
+    "documentation_url": "https://platform.openai.com/docs/models/gpt-5.1-codex",
+    "properties": {
+      "context_window": 400000,
+      "max_token_output": 128000,
+      "training_cutoff": null,
+      "reasoning_model": true
+    },
+    "class_properties": {
+      "supports_images": true,
+      "supports_files": true,
+      "supports_batch_requests": true,
+      "supports_temperature": false,
+      "supports_tools": true,
+      "deprecated": false,
+      "available_for_everyone": false,
+      "available_as_evaluator": false,
+      "ignored_for_cost": false
+    },
+    "provider_properties": {},
+    "costs_per_million_token": {
+      "input": 1.25,
+      "output": 10.0,
+      "cache": {
+        "read": 0.125,
+        "write_markup": 1.0
+      },
+      "batch": {
+        "input_discount": 0.5,
+        "output_discount": 0.5
+      }
+    },
+    "alternative_keys": [],
+    "default_parameters": {
+      "max_output_tokens": 128000,
+      "temperature": 1.0,
+      "reasoning_effort": "high"
+    },
+    "provider_name": "openai",
+    "provider_endpoint": "gpt-5.1-codex",
+    "full_key": "openai/gpt-5.1-codex",
+    "slug": "openai_gpt-5.1-codex"
+  },
+  "openai/gpt-5.1-2025-11-13": {
+    "company": "OpenAI",
+    "label": "GPT 5.1",
+    "description": "GPT-5.1 is OpenAI's flagship model for coding and agentic tasks with configurable reasoning and non-reasoning effort.",
+    "release_date": "2025-11-13",
+    "open_source": false,
+    "documentation_url": "https://platform.openai.com/docs/models/gpt-5.1",
+    "properties": {
+      "context_window": 400000,
+      "max_token_output": 128000,
+      "training_cutoff": "2024-09",
+      "reasoning_model": true
+    },
+    "class_properties": {
+      "supports_images": true,
+      "supports_files": true,
+      "supports_batch_requests": true,
+      "supports_temperature": false,
+      "supports_tools": true,
+      "deprecated": false,
+      "available_for_everyone": false,
+      "available_as_evaluator": true,
+      "ignored_for_cost": false
+    },
+    "provider_properties": {},
+    "costs_per_million_token": {
+      "input": 1.25,
+      "output": 10.0,
+      "cache": {
+        "read": 0.125,
+        "write_markup": 1.0
+      },
+      "batch": {
+        "input_discount": 0.5,
+        "output_discount": 0.5
+      }
+    },
+    "alternative_keys": [],
+    "default_parameters": {
+      "max_output_tokens": 128000,
+      "temperature": 1.0,
+      "reasoning_effort": "high"
+    },
+    "provider_name": "openai",
+    "provider_endpoint": "gpt-5.1-2025-11-13",
+    "full_key": "openai/gpt-5.1-2025-11-13",
+    "slug": "openai_gpt-5.1-2025-11-13"
+  },
   "kimi/kimi-k2-thinking": {
     "company": "Kimi",
     "label": "Kimi K2 Thinking",
@@ -187,6 +331,7 @@
     "class_properties": {
       "supports_images": true,
       "supports_files": true,
+      "supports_batch_requests": true,
       "supports_temperature": true,
       "supports_tools": true,
       "deprecated": false,
@@ -234,6 +379,7 @@
     "class_properties": {
       "supports_images": true,
       "supports_files": true,
+      "supports_batch_requests": true,
       "supports_temperature": true,
       "supports_tools": true,
      "deprecated": false,
@@ -386,7 +532,11 @@
     "provider_properties": {},
     "costs_per_million_token": {
       "input": 0.28,
-      "output": 0.42
+      "output": 0.42,
+      "cache": {
+        "read_discount": 0.1,
+        "write_markup": 1.0
+      }
     },
     "alternative_keys": [],
     "default_parameters": {
@@ -424,7 +574,11 @@
     "provider_properties": {},
     "costs_per_million_token": {
       "input": 0.28,
-      "output": 0.42
+      "output": 0.42,
+      "cache": {
+        "read_discount": 0.1,
+        "write_markup": 1.0
+      }
     },
     "alternative_keys": [],
     "default_parameters": {
@@ -451,6 +605,7 @@
     "class_properties": {
       "supports_images": true,
       "supports_files": true,
+      "supports_batch_requests": true,
       "supports_temperature": true,
       "supports_tools": true,
       "deprecated": false,
@@ -508,6 +663,7 @@
     "class_properties": {
       "supports_images": true,
       "supports_files": true,
+      "supports_batch_requests": true,
       "supports_temperature": true,
       "supports_tools": true,
       "deprecated": false,
@@ -1979,6 +2135,7 @@
     "class_properties": {
       "supports_images": true,
       "supports_files": true,
+      "supports_batch_requests": true,
       "supports_temperature": true,
       "supports_tools": true,
       "deprecated": false,
@@ -2026,6 +2183,7 @@
     "class_properties": {
       "supports_images": true,
       "supports_files": true,
+      "supports_batch_requests": true,
       "supports_temperature": true,
       "supports_tools": true,
       "deprecated": false,
@@ -3350,6 +3508,7 @@
     "class_properties": {
       "supports_images": true,
       "supports_files": true,
+      "supports_batch_requests": true,
       "supports_temperature": false,
       "supports_tools": true,
       "deprecated": false,
@@ -3407,6 +3566,7 @@
     "class_properties": {
       "supports_images": true,
       "supports_files": true,
+      "supports_batch_requests": true,
       "supports_temperature": true,
       "supports_tools": true,
       "deprecated": false,
@@ -3475,6 +3635,7 @@
     "class_properties": {
       "supports_images": true,
       "supports_files": true,
+      "supports_batch_requests": true,
       "supports_temperature": true,
       "supports_tools": true,
       "deprecated": false,
@@ -3522,6 +3683,7 @@
     "class_properties": {
       "supports_images": true,
       "supports_files": true,
+      "supports_batch_requests": true,
       "supports_temperature": true,
       "supports_tools": true,
       "deprecated": false,
model_library/config/anthropic_models.yaml
@@ -23,6 +23,10 @@ base-config:
     temperature: 1

 claude-4-models:
+  base-config:
+    class_properties:
+      supports_batch_requests: true
+
   anthropic/claude-opus-4-1-20250805:
     label: Claude Opus 4.1 (Nonthinking)
     description: Advanced model for specialized complex
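The group-level `base-config` block appears to be merged into each model entry in its group during registration (register_models.py changed in this release, but its logic is not shown here). A plausible reading of that pattern, as a sketch rather than the library's actual merge:

```python
# Illustrative deep-merge of a group's base-config into one model entry.
# The real merge lives in register_models.py, which this excerpt omits.
def merge(base: dict, entry: dict) -> dict:
    out = dict(base)
    for key, value in entry.items():
        if isinstance(value, dict) and isinstance(out.get(key), dict):
            out[key] = merge(out[key], value)  # recurse into nested sections
        else:
            out[key] = value  # entry-level values win
    return out

base_config = {"class_properties": {"supports_batch_requests": True}}
model_entry = {"label": "Claude Opus 4.1 (Nonthinking)",
               "class_properties": {"supports_tools": True}}
print(merge(base_config, model_entry))
# -> class_properties carries both supports_batch_requests and supports_tools
```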
model_library/config/deepseek_models.yaml
@@ -10,7 +10,7 @@ base-config:
     ignored_for_cost: false
   properties:
     reasoning_model: false
-
+
 deepseek-v3p2-exp-models:
   base-config:
     class_properties:
@@ -23,6 +23,8 @@ deepseek-v3p2-exp-models:
     costs_per_million_token:
       input: 0.28
       output: 0.42
+      cache:
+        read_discount: 0.1

 deepseek/deepseek-chat:
   label: DeepSeek V3.2-Exp (Nonthinking)
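Unlike the absolute `read` prices in the OpenAI JSON entries, `read_discount` reads as a multiplier on the input price; since the consuming code is not shown, that interpretation is an assumption from the field name:

```python
# Assumption: read_discount multiplies the normal input price.
deepseek_input = 0.28               # $ per 1M input tokens, from the hunk above
cached_read = deepseek_input * 0.1  # read_discount: 0.1
print(f"${cached_read:.3f} per 1M cached input tokens")  # $0.028
```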