PyPI - model-library - Versions diffs - 0.1.6__py3-none-any.whl → 0.1.8__py3-none-any.whl - Mend

model-library 0.1.6__py3-none-any.whl → 0.1.8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (48)

model_library/base/base.py +237 -62
model_library/base/delegate_only.py +86 -9
model_library/base/input.py +10 -7
model_library/base/output.py +48 -0
model_library/base/utils.py +56 -7
model_library/config/alibaba_models.yaml +44 -57
model_library/config/all_models.json +253 -126
model_library/config/kimi_models.yaml +30 -3
model_library/config/openai_models.yaml +15 -23
model_library/config/zai_models.yaml +24 -3
model_library/exceptions.py +14 -77
model_library/logging.py +6 -2
model_library/providers/ai21labs.py +30 -14
model_library/providers/alibaba.py +17 -8
model_library/providers/amazon.py +119 -64
model_library/providers/anthropic.py +184 -104
model_library/providers/azure.py +22 -10
model_library/providers/cohere.py +7 -7
model_library/providers/deepseek.py +8 -8
model_library/providers/fireworks.py +7 -8
model_library/providers/google/batch.py +17 -13
model_library/providers/google/google.py +130 -73
model_library/providers/inception.py +7 -7
model_library/providers/kimi.py +18 -8
model_library/providers/minimax.py +30 -13
model_library/providers/mistral.py +61 -35
model_library/providers/openai.py +219 -93
model_library/providers/openrouter.py +34 -0
model_library/providers/perplexity.py +7 -7
model_library/providers/together.py +7 -8
model_library/providers/vals.py +16 -9
model_library/providers/xai.py +157 -144
model_library/providers/zai.py +38 -8
model_library/register_models.py +4 -2
model_library/registry_utils.py +39 -15
model_library/retriers/__init__.py +0 -0
model_library/retriers/backoff.py +73 -0
model_library/retriers/base.py +225 -0
model_library/retriers/token.py +427 -0
model_library/retriers/utils.py +11 -0
model_library/settings.py +1 -1
model_library/utils.py +13 -35
{model_library-0.1.6.dist-info → model_library-0.1.8.dist-info}/METADATA +4 -3
model_library-0.1.8.dist-info/RECORD +70 -0
{model_library-0.1.6.dist-info → model_library-0.1.8.dist-info}/WHEEL +1 -1
model_library-0.1.6.dist-info/RECORD +0 -64
{model_library-0.1.6.dist-info → model_library-0.1.8.dist-info}/licenses/LICENSE +0 -0
{model_library-0.1.6.dist-info → model_library-0.1.8.dist-info}/top_level.txt +0 -0

model_library/base/utils.py CHANGED Viewed

@@ -1,18 +1,36 @@
-from typing import Sequence, TypeVar, cast
+import json
+import re
+from datetime import datetime, timedelta
+from typing import Any, Sequence, TypeVar
+from pydantic import BaseModel
 from model_library.base.input import (
     FileBase,
     InputItem,
-    RawInputItem,
+    RawInput,
+    RawResponse,
     TextInput,
     ToolResult,
 )
 from model_library.utils import truncate_str
-from pydantic import BaseModel
 T = TypeVar("T", bound=BaseModel)
+def serialize_for_tokenizing(content: Any) -> str:
+    """
+    Serialize parsed content into a string for tokenization
+    """
+    parts: list[str] = []
+    if content:
+        if isinstance(content, str):
+            parts.append(content)
+        else:
+            parts.append(json.dumps(content, default=str))
+    return "\n".join(parts)
 def add_optional(
     a: int | float | T | None, b: int | float | T | None
 ) -> int | float | T | None:
@@ -54,12 +72,43 @@ def get_pretty_input_types(input: Sequence["InputItem"], verbose: bool = False)
                 return repr(item)
             case ToolResult():
                 return repr(item)
-            case dict():
-                item = cast(RawInputItem, item)
+            case RawInput():
                 return repr(item)
-            case _:
-                # RawResponse
+            case RawResponse():
                 return repr(item)
     processed_items = [f"  {process_item(item)}" for item in input]
     return "\n" + "\n".join(processed_items) if processed_items else ""
+TIME_PATTERN = re.compile(r"^(\d+(?:\.\d+)?)([a-zA-Z]+)$")
+UNIT_TO_SECONDS = {
+    "ms": 0.001,
+    "s": 1,
+    "m": 60,
+    "h": 3600,
+}
+def to_timestamp(input_str: str, server_now: datetime) -> int:
+    """Converts a header string into a server-relative Unix timestamp in ms."""
+    input_str = input_str.strip()
+    # ISO Timestamp (e.g. 2026-01-09T21:58:01Z)
+    if "T" in input_str and "-" in input_str:
+        try:
+            dt = datetime.fromisoformat(input_str.replace("Z", "+00:00"))
+            return int(dt.timestamp() * 1000)
+        except ValueError:
+            pass
+    # Duration (e.g. 10s, 6ms)
+    match = TIME_PATTERN.match(input_str)
+    if match:
+        value, unit = match.groups()
+        offset_seconds = float(value) * UNIT_TO_SECONDS.get(unit.lower(), 0)
+        # Add duration to the SERVER'S provided date
+        dt = server_now + timedelta(seconds=offset_seconds)
+        return int(dt.timestamp() * 1000)
+    raise ValueError(f"Unsupported time format: {input_str}")

model_library/config/alibaba_models.yaml CHANGED Viewed

@@ -1,17 +1,51 @@
-qwen-models:
-  base-config:
-    company: Alibaba
-    open_source: false
+base-config:
+  company: Alibaba
+  open_source: false
+  supports:
+    temperature: true
+  metadata:
+    available_for_everyone: false
+    available_as_evaluator: false
+  default_parameters:
+    temperature: 0.7
+  properties:
+    reasoning_model: false
+qwen-3-vl-models:
+  base-config:
     supports:
-      temperature: true
+      images: true
+  alibaba/qwen3-vl-plus-2025-09-23:
+    label: Qwen 3 VL Plus
+    open_source: true
+    description: Qwen 3 VL Plus (2025-09-23)
+    release_date: 2025-09-23
     metadata:
-      available_for_everyone: false
-      available_as_evaluator: false
-    default_parameters:
-      temperature: 0.7
+      deprecated: true
     properties:
+      context_window: 262_144
+      max_tokens: 32_768
+      training_cutoff: ""
       reasoning_model: false
+    costs_per_million_token:
+      input: 0.2
+      output: 1.6
+qwen-3-max-models:
+  base-config:
+    supports:
+      tools: true
+      images: false
+  alibaba/qwen3-max-2026-01-23:
+    label: Qwen 3 Max Thinking
+    description: Qwen 3 Max with enhanced reasoning capabilities
+    release_date: 2026-01-23
+    properties:
+      context_window: 256_000
+      max_tokens: 32_000
+      reasoning_model: true
   alibaba/qwen3-max-preview:
     label: Qwen 3 Max Preview
@@ -20,15 +54,7 @@ qwen-models:
     properties:
       context_window: 262_144
       max_tokens: 65_536
-      training_cutoff: ""
-    costs_per_million_token:
-      input: 1.2
-      output: 6
-    supports:
-      images: false
-      tools: true
-    metadata:
-      available_for_everyone: false
+      reasoning_model: true
   alibaba/qwen3-max-2025-09-23:
     label: Qwen 3 Max 2025-09-23
@@ -39,14 +65,6 @@ qwen-models:
       max_tokens: 65_536
       training_cutoff: ""
       reasoning_model: true
-    costs_per_million_token:
-      input: 1.2
-      output: 6
-    supports:
-      images: false
-      tools: true
-    metadata:
-      available_for_everyone: false
   alibaba/qwen3-max:
     label: Qwen 3 Max
@@ -57,34 +75,3 @@ qwen-models:
       max_tokens: 65_536
       training_cutoff: ""
       reasoning_model: false
-    costs_per_million_token:
-      input: 1.2
-      output: 6
-      cache:
-        read_discount: 0.8
-        write_markup: 1
-      context:
-        threshold: 32_000
-        input: 2.4
-        output: 12
-    supports:
-      images: false
-      tools: true
-    metadata:
-      available_for_everyone: false
-  alibaba/qwen3-vl-plus-2025-09-23:
-    label: Qwen 3 VL Plus
-    open_source: true
-    description: Qwen 3 VL Plus (2025-09-23)
-    release_date: 2025-09-23
-    properties:
-      context_window: 262_144
-      max_tokens: 32_768
-      training_cutoff: ""
-      reasoning_model: false
-    costs_per_million_token:
-      input: 0.2
-      output: 1.6
-    supports:
-      images: true

model-library 0.1.6__py3-none-any.whl → 0.1.8__py3-none-any.whl

model-library 0.1.6__py3-none-any.whl → 0.1.8__py3-none-any.whl