PyPI - nexaai - Versions diffs - 1.0.21rc4__cp310-cp310-macosx_14_0_universal2.whl → 1.0.21rc5__cp310-cp310-macosx_14_0_universal2.whl - Mend

nexaai 1.0.21rc4__cp310-cp310-macosx_14_0_universal2.whl → 1.0.21rc5__cp310-cp310-macosx_14_0_universal2.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of nexaai might be problematic. Click here for more details.

Files changed (29)

nexaai/_stub.cpython-310-darwin.so +0 -0
nexaai/_version.py +1 -1
nexaai/asr.py +2 -1
nexaai/binds/__init__.py +1 -0
nexaai/binds/embedder_bind.cpython-310-darwin.so +0 -0
nexaai/binds/libnexa_bridge.dylib +0 -0
nexaai/binds/llm_bind.cpython-310-darwin.so +0 -0
nexaai/binds/rerank_bind.cpython-310-darwin.so +0 -0
nexaai/binds/vlm_bind.cpython-310-darwin.so +0 -0
nexaai/common.py +1 -0
nexaai/cv.py +2 -1
nexaai/embedder.py +4 -3
nexaai/embedder_impl/mlx_embedder_impl.py +3 -1
nexaai/embedder_impl/pybind_embedder_impl.py +3 -2
nexaai/image_gen.py +2 -1
nexaai/llm.py +5 -3
nexaai/llm_impl/mlx_llm_impl.py +2 -0
nexaai/llm_impl/pybind_llm_impl.py +2 -0
nexaai/rerank.py +5 -3
nexaai/rerank_impl/mlx_rerank_impl.py +2 -0
nexaai/rerank_impl/pybind_rerank_impl.py +109 -16
nexaai/tts.py +2 -1
nexaai/utils/model_manager.py +84 -8
nexaai/vlm.py +2 -1
nexaai/vlm_impl/pybind_vlm_impl.py +4 -5
{nexaai-1.0.21rc4.dist-info → nexaai-1.0.21rc5.dist-info}/METADATA +1 -2
{nexaai-1.0.21rc4.dist-info → nexaai-1.0.21rc5.dist-info}/RECORD +29 -28
{nexaai-1.0.21rc4.dist-info → nexaai-1.0.21rc5.dist-info}/WHEEL +0 -0
{nexaai-1.0.21rc4.dist-info → nexaai-1.0.21rc5.dist-info}/top_level.txt +0 -0

nexaai/_stub.cpython-310-darwin.so CHANGED Viewed

Binary file

nexaai/_version.py CHANGED Viewed

@@ -1,4 +1,4 @@
 # This file is generated by CMake from _version.py.in
 # Do not modify this file manually - it will be overwritten
-__version__ = "1.0.21-rc4"
+__version__ = "1.0.21-rc5"

nexaai/asr.py CHANGED Viewed

@@ -35,7 +35,8 @@ class ASR(BaseModel):
                    tokenizer_path: Optional[str] = None,
                    language: Optional[str] = None,
                    plugin_id: Union[PluginID, str] = PluginID.LLAMA_CPP,
-                   device_id: Optional[str] = None
+                   device_id: Optional[str] = None,
+                   **kwargs
         ) -> 'ASR':
         """Load ASR model from local path, routing to appropriate implementation."""
         # Check plugin_id value for routing - handle both enum and string

nexaai/binds/__init__.py CHANGED Viewed

@@ -2,3 +2,4 @@ from .common_bind import *
 from .llm_bind import *
 from .embedder_bind import *
 from .vlm_bind import *
+from .rerank_bind import *

nexaai/binds/embedder_bind.cpython-310-darwin.so CHANGED Viewed

Binary file

nexaai/binds/libnexa_bridge.dylib CHANGED Viewed

Binary file

nexaai/binds/llm_bind.cpython-310-darwin.so CHANGED Viewed

Binary file

nexaai/binds/rerank_bind.cpython-310-darwin.so ADDED Viewed

Binary file

nexaai/binds/vlm_bind.cpython-310-darwin.so CHANGED Viewed

Binary file

nexaai/common.py CHANGED Viewed

@@ -8,6 +8,7 @@ class PluginID(str, Enum):
     MLX = "mlx"
     LLAMA_CPP = "llama_cpp"
     NEXAML = "nexaml"
+    NPU = "npu"
 class ChatMessage(TypedDict):

nexaai/cv.py CHANGED Viewed

@@ -73,7 +73,8 @@ class CVModel(BaseModel):
                    _: str,  # TODO: remove this argument, this is a hack to make api design happy
                    config: CVModelConfig,
                    plugin_id: Union[PluginID, str] = PluginID.LLAMA_CPP,
-                   device_id: Optional[str] = None
+                   device_id: Optional[str] = None,
+                   **kwargs
         ) -> 'CVModel':
         """Load CV model from configuration, routing to appropriate implementation."""
         # Check plugin_id value for routing - handle both enum and string

nexaai/embedder.py CHANGED Viewed

@@ -22,12 +22,13 @@ class Embedder(BaseModel):
         pass
     @classmethod
-    def _load_from(cls, model_path: str, tokenizer_file: str = "tokenizer.json", plugin_id: Union[PluginID, str] = PluginID.LLAMA_CPP):
+    def _load_from(cls, model_path: str, model_name: str = None, tokenizer_file: str = "tokenizer.json", plugin_id: Union[PluginID, str] = PluginID.LLAMA_CPP, **kwargs):
         """
         Load an embedder from model files, routing to appropriate implementation.
         Args:
             model_path: Path to the model file
+            model_name: Name of the model
             tokenizer_file: Path to the tokenizer file (default: "tokenizer.json")
             plugin_id: Plugin ID to use for the model (default: PluginID.LLAMA_CPP)
@@ -39,10 +40,10 @@ class Embedder(BaseModel):
         if plugin_value == "mlx":
             from nexaai.embedder_impl.mlx_embedder_impl import MLXEmbedderImpl
-            return MLXEmbedderImpl._load_from(model_path, tokenizer_file, plugin_id)
+            return MLXEmbedderImpl._load_from(model_path, model_name, tokenizer_file, plugin_id)
         else:
             from nexaai.embedder_impl.pybind_embedder_impl import PyBindEmbedderImpl
-            return PyBindEmbedderImpl._load_from(model_path, tokenizer_file, plugin_id)
+            return PyBindEmbedderImpl._load_from(model_path, model_name, tokenizer_file, plugin_id)
     @abstractmethod
     def generate(self, texts: Union[List[str], str] = None, config: EmbeddingConfig = EmbeddingConfig(), input_ids: Union[List[int], List[List[int]]] = None) -> np.ndarray:

nexaai/embedder_impl/mlx_embedder_impl.py CHANGED Viewed

@@ -14,12 +14,13 @@ class MLXEmbedderImpl(Embedder):
         self._mlx_embedder = None
     @classmethod
-    def _load_from(cls, model_path: str, tokenizer_file: str = "tokenizer.json", plugin_id: Union[PluginID, str] = PluginID.MLX):
+    def _load_from(cls, model_path: str, model_name: str = None, tokenizer_file: str = "tokenizer.json", plugin_id: Union[PluginID, str] = PluginID.MLX):
         """
         Load an embedder from model files using MLX backend.
         Args:
             model_path: Path to the model file
+            model_name: Name of the model
             tokenizer_file: Path to the tokenizer file (default: "tokenizer.json")
             plugin_id: Plugin ID to use for the model (default: PluginID.MLX)
@@ -34,6 +35,7 @@ class MLXEmbedderImpl(Embedder):
             # This will automatically detect if it's JinaV2 or generic model and route correctly
             instance._mlx_embedder = create_embedder(
                 model_path=model_path,
+                # model_name=model_name, # FIXME: For MLX Embedder, model_name is not used
                 tokenizer_path=tokenizer_file
             )

nexaai/embedder_impl/pybind_embedder_impl.py CHANGED Viewed

@@ -16,12 +16,13 @@ class PyBindEmbedderImpl(Embedder):
         self._handle = _handle_ptr
     @classmethod
-    def _load_from(cls, model_path: str, tokenizer_file: str = "tokenizer.json", plugin_id: Union[PluginID, str] = PluginID.LLAMA_CPP):
+    def _load_from(cls, model_path: str, model_name: str = None, tokenizer_file: str = "tokenizer.json", plugin_id: Union[PluginID, str] = PluginID.LLAMA_CPP):
         """
         Load an embedder from model files
         Args:
             model_path: Path to the model file
+            model_name: Name of the model
             tokenizer_file: Path to the tokenizer file (default: "tokenizer.json")
             plugin_id: Plugin ID to use for the model (default: PluginID.LLAMA_CPP)
@@ -32,7 +33,7 @@ class PyBindEmbedderImpl(Embedder):
         # Convert enum to string for C++ binding
         plugin_id_str = plugin_id.value if isinstance(plugin_id, PluginID) else plugin_id
         # New parameter order: model_path, plugin_id, tokenizer_path (optional)
-        handle = embedder_bind.ml_embedder_create(model_path, plugin_id_str, tokenizer_file)
+        handle = embedder_bind.ml_embedder_create(model_path, model_name, plugin_id_str, tokenizer_file)
         return cls(handle)
     def eject(self):

nexaai/image_gen.py CHANGED Viewed

@@ -71,7 +71,8 @@ class ImageGen(BaseModel):
                    plugin_id: Union[PluginID, str] = PluginID.LLAMA_CPP,
                    device_id: Optional[str] = None,
                    float16: bool = True,
-                   quantize: bool = False
+                   quantize: bool = False,
+                   **kwargs
         ) -> 'ImageGen':
         """Load image generation model from local path, routing to appropriate implementation."""
         # Check plugin_id value for routing - handle both enum and string

nexaai/llm.py CHANGED Viewed

@@ -15,10 +15,12 @@ class LLM(BaseModel):
     @classmethod
     def _load_from(cls,
                    local_path: str,
+                   model_name: Optional[str] = None,
                    tokenizer_path: Optional[str] = None,
                    m_cfg: ModelConfig = ModelConfig(),
                    plugin_id: Union[PluginID, str] = PluginID.LLAMA_CPP,
-                   device_id: Optional[str] = None
+                   device_id: Optional[str] = None,
+                   **kwargs
         ) -> 'LLM':
         """Load model from local path, routing to appropriate implementation."""
         # Check plugin_id value for routing - handle both enum and string
@@ -26,10 +28,10 @@ class LLM(BaseModel):
         if plugin_value == "mlx":
             from nexaai.llm_impl.mlx_llm_impl import MLXLLMImpl
-            return MLXLLMImpl._load_from(local_path, tokenizer_path, m_cfg, plugin_id, device_id)
+            return MLXLLMImpl._load_from(local_path, model_name, tokenizer_path, m_cfg, plugin_id, device_id)
         else:
             from nexaai.llm_impl.pybind_llm_impl import PyBindLLMImpl
-            return PyBindLLMImpl._load_from(local_path, tokenizer_path, m_cfg, plugin_id, device_id)
+            return PyBindLLMImpl._load_from(local_path, model_name, tokenizer_path, m_cfg, plugin_id, device_id)
     def cancel_generation(self):
         """Signal to cancel any ongoing stream generation."""

nexaai/llm_impl/mlx_llm_impl.py CHANGED Viewed

@@ -16,6 +16,7 @@ class MLXLLMImpl(LLM):
     @classmethod
     def _load_from(cls,
                    local_path: str,
+                   model_name: Optional[str] = None,
                    tokenizer_path: Optional[str] = None,
                    m_cfg: ModelConfig = ModelConfig(),
                    plugin_id: Union[PluginID, str] = PluginID.MLX,
@@ -40,6 +41,7 @@ class MLXLLMImpl(LLM):
             instance = cls(m_cfg)
             instance._mlx_llm = MLXLLMInterface(
                 model_path=local_path,
+                # model_name=model_name, # FIXME: For MLX LLM, model_name is not used
                 tokenizer_path=tokenizer_path or local_path,
                 config=mlx_config,
                 device=device_id

nexaai/llm_impl/pybind_llm_impl.py CHANGED Viewed

@@ -19,6 +19,7 @@ class PyBindLLMImpl(LLM):
     @classmethod
     def _load_from(cls,
                    local_path: str,
+                   model_name: Optional[str] = None,
                    tokenizer_path: Optional[str] = None,
                    m_cfg: ModelConfig = ModelConfig(),
                    plugin_id: Union[PluginID, str] = PluginID.LLAMA_CPP,
@@ -55,6 +56,7 @@ class PyBindLLMImpl(LLM):
         plugin_id_str = plugin_id.value if isinstance(plugin_id, PluginID) else plugin_id
         handle = llm_bind.ml_llm_create(
             model_path=local_path,
+            model_name=model_name,
             tokenizer_path=tokenizer_path,
             model_config=config,
             plugin_id=plugin_id_str,

nexaai/rerank.py CHANGED Viewed

@@ -24,9 +24,11 @@ class Reranker(BaseModel):
     @classmethod
     def _load_from(cls,
                    model_path: str,
+                   model_name: str = None,
                    tokenizer_file: str = "tokenizer.json",
                    plugin_id: Union[PluginID, str] = PluginID.LLAMA_CPP,
-                   device_id: Optional[str] = None
+                   device_id: Optional[str] = None,
+                   **kwargs
         ) -> 'Reranker':
         """Load reranker model from local path, routing to appropriate implementation."""
         # Check plugin_id value for routing - handle both enum and string
@@ -34,10 +36,10 @@ class Reranker(BaseModel):
         if plugin_value == "mlx":
             from nexaai.rerank_impl.mlx_rerank_impl import MLXRerankImpl
-            return MLXRerankImpl._load_from(model_path, tokenizer_file, plugin_id, device_id)
+            return MLXRerankImpl._load_from(model_path, model_name, tokenizer_file, plugin_id, device_id)
         else:
             from nexaai.rerank_impl.pybind_rerank_impl import PyBindRerankImpl
-            return PyBindRerankImpl._load_from(model_path, tokenizer_file, plugin_id, device_id)
+            return PyBindRerankImpl._load_from(model_path, model_name, tokenizer_file, plugin_id, device_id)
     @abstractmethod
     def load_model(self, model_path: str, extra_data: Optional[str] = None) -> bool:

nexaai/rerank_impl/mlx_rerank_impl.py CHANGED Viewed

@@ -17,6 +17,7 @@ class MLXRerankImpl(Reranker):
     @classmethod
     def _load_from(cls,
                    model_path: str,
+                   model_name: str = None,
                    tokenizer_file: str = "tokenizer.json",
                    plugin_id: Union[PluginID, str] = PluginID.MLX,
                    device_id: Optional[str] = None
@@ -29,6 +30,7 @@ class MLXRerankImpl(Reranker):
             instance = cls()
             instance._mlx_reranker = create_reranker(
                 model_path=model_path,
+                # model_name=model_name, # FIXME: For MLX Reranker, model_name is not used
                 tokenizer_path=tokenizer_file,
                 device=device_id
             )

nexaai/rerank_impl/pybind_rerank_impl.py CHANGED Viewed

@@ -1,36 +1,89 @@
 from typing import List, Optional, Sequence, Union
+import numpy as np
 from nexaai.common import PluginID
 from nexaai.rerank import Reranker, RerankConfig
+from nexaai.binds import rerank_bind, common_bind
+from nexaai.runtime import _ensure_runtime
 class PyBindRerankImpl(Reranker):
-    def __init__(self):
-        """Initialize PyBind Rerank implementation."""
+    def __init__(self, _handle_ptr):
+        """
+        Internal initializer
+        Args:
+            _handle_ptr: Capsule handle to the C++ reranker object
+        """
         super().__init__()
-        # TODO: Add PyBind-specific initialization
+        self._handle = _handle_ptr
     @classmethod
     def _load_from(cls,
                    model_path: str,
+                   model_name: str = None,
                    tokenizer_file: str = "tokenizer.json",
                    plugin_id: Union[PluginID, str] = PluginID.LLAMA_CPP,
                    device_id: Optional[str] = None
         ) -> 'PyBindRerankImpl':
-        """Load reranker model from local path using PyBind backend."""
-        # TODO: Implement PyBind reranker loading
-        instance = cls()
-        return instance
+        """
+        Load reranker model from local path using PyBind backend.
+        Args:
+            model_path: Path to the model file
+            model_name: Name of the model (optional)
+            tokenizer_file: Path to the tokenizer file (default: "tokenizer.json")
+            plugin_id: Plugin ID to use for the model (default: PluginID.LLAMA_CPP)
+            device_id: Device ID to use for the model (optional)
+        Returns:
+            PyBindRerankImpl instance
+        """
+        _ensure_runtime()
+        # Convert enum to string for C++ binding
+        plugin_id_str = plugin_id.value if isinstance(plugin_id, PluginID) else plugin_id
+        # Create model config
+        model_config = common_bind.ModelConfig()
+        # Create reranker handle with new API signature
+        handle = rerank_bind.ml_reranker_create(
+            model_path,
+            model_name,
+            tokenizer_file,
+            model_config,
+            plugin_id_str,
+            device_id
+        )
+        return cls(handle)
     def eject(self):
-        """Destroy the model and free resources."""
-        # TODO: Implement PyBind reranker cleanup
-        pass
+        """
+        Clean up resources and destroy the reranker
+        """
+        # Destructor of the handle will unload the model correctly
+        if hasattr(self, '_handle') and self._handle is not None:
+            del self._handle
+            self._handle = None
     def load_model(self, model_path: str, extra_data: Optional[str] = None) -> bool:
-        """Load model from path."""
-        # TODO: Implement PyBind reranker model loading
-        raise NotImplementedError("PyBind reranker model loading not yet implemented")
+        """
+        Load model from path.
+        Note: This method is not typically used directly. Use _load_from instead.
+        Args:
+            model_path: Path to the model file
+            extra_data: Additional data (unused)
+        Returns:
+            True if successful
+        """
+        # This method is part of the BaseModel interface but typically not used
+        # directly for PyBind implementations since _load_from handles creation
+        raise NotImplementedError("Use _load_from class method to load models")
     def rerank(
         self,
@@ -38,6 +91,46 @@ class PyBindRerankImpl(Reranker):
         documents: Sequence[str],
         config: Optional[RerankConfig] = None,
     ) -> List[float]:
-        """Rerank documents given a query."""
-        # TODO: Implement PyBind reranking
-        raise NotImplementedError("PyBind reranking not yet implemented")
+        """
+        Rerank documents given a query.
+        Args:
+            query: Query text as UTF-8 string
+            documents: List of document texts to rerank
+            config: Optional reranking configuration
+        Returns:
+            List of ranking scores (one per document)
+        """
+        if self._handle is None:
+            raise RuntimeError("Reranker handle is None. Model may have been ejected.")
+        # Use default config if not provided
+        if config is None:
+            config = RerankConfig()
+        # Create bind config
+        bind_config = rerank_bind.RerankConfig()
+        bind_config.batch_size = config.batch_size
+        bind_config.normalize = config.normalize
+        bind_config.normalize_method = config.normalize_method
+        # Convert documents to list if needed
+        documents_list = list(documents)
+        # Call the binding which returns a dict with scores and profile_data
+        result = rerank_bind.ml_reranker_rerank(
+            self._handle,
+            query,
+            documents_list,
+            bind_config
+        )
+        # Extract scores from result dict
+        scores_array = result.get("scores", np.array([]))
+        # Convert numpy array to list of floats
+        if isinstance(scores_array, np.ndarray):
+            return scores_array.tolist()
+        else:
+            return []

nexaai/tts.py CHANGED Viewed

@@ -45,7 +45,8 @@ class TTS(BaseModel):
                    model_path: str,
                    vocoder_path: str,
                    plugin_id: Union[PluginID, str] = PluginID.LLAMA_CPP,
-                   device_id: Optional[str] = None
+                   device_id: Optional[str] = None,
+                   **kwargs
         ) -> 'TTS':
         """Load TTS model from local path, routing to appropriate implementation."""
         # Check plugin_id value for routing - handle both enum and string

nexaai/utils/model_manager.py CHANGED Viewed

@@ -1344,7 +1344,7 @@ def _download_model_if_needed(
     token: Union[bool, str, None] = None,
     is_mmproj: bool = False,
     **kwargs
-) -> str:
+) -> tuple[str, Optional[str], Optional[str]]:
     """
     Helper function to download a model from HuggingFace if it doesn't exist locally.
@@ -1355,15 +1355,78 @@ def _download_model_if_needed(
         token: HuggingFace authentication token for private repositories
     Returns:
-        str: Local path to the model (either existing or downloaded)
+        tuple[str, Optional[str], Optional[str]]: Tuple of (local_path, model_name, plugin_id)
+            - local_path: Local path to the model (either existing or downloaded)
+            - model_name: ModelName from nexa.manifest if available, None otherwise
+            - plugin_id: PluginId from nexa.manifest if available, None otherwise
     Raises:
         RuntimeError: If download fails
     """
+    # Helper function to extract model info from manifest
+    def _extract_info_from_manifest(path: str) -> tuple[Optional[str], Optional[str], Optional[dict]]:
+        """Extract ModelName, PluginId, and full manifest from nexa.manifest if it exists."""
+        # If path is a file, check its parent directory for manifest
+        if os.path.isfile(path):
+            manifest_dir = os.path.dirname(path)
+        else:
+            manifest_dir = path
+        manifest_path = os.path.join(manifest_dir, 'nexa.manifest')
+        if not os.path.exists(manifest_path):
+            return None, None, None
+        try:
+            with open(manifest_path, 'r', encoding='utf-8') as f:
+                manifest = json.load(f)
+                return manifest.get('ModelName'), manifest.get('PluginId'), manifest
+        except (json.JSONDecodeError, IOError):
+            return None, None, None
+    # Helper function to get a model file path from manifest
+    # Note: This is for NPU only, because when downloading, it is a directory; when passing local path to inference, it needs to be a file.
+    def _get_model_file_from_manifest(manifest: dict, base_dir: str) -> Optional[str]:
+        """Extract a model file path from manifest's ModelFile section."""
+        if not manifest or 'ModelFile' not in manifest:
+            return None
+        model_files = manifest['ModelFile']
+        # Find the first valid model file (skip N/A entries and metadata files)
+        for key, file_info in model_files.items():
+            if key == 'N/A':
+                continue
+            if isinstance(file_info, dict) and 'Name' in file_info:
+                file_name = file_info['Name']
+                # Skip common non-model files
+                if file_name and not file_name.startswith('.') and file_name.endswith('.nexa'):
+                    file_path = os.path.join(base_dir, file_name)
+                    if os.path.exists(file_path):
+                        return file_path
+        # If no .nexa files found, try ExtraFiles for .nexa files
+        if 'ExtraFiles' in manifest:
+            for file_info in manifest['ExtraFiles']:
+                if isinstance(file_info, dict) and 'Name' in file_info:
+                    file_name = file_info['Name']
+                    if file_name and file_name.endswith('.nexa') and not file_name.startswith('.cache'):
+                        file_path = os.path.join(base_dir, file_name)
+                        if os.path.exists(file_path):
+                            return file_path
+        return None
     # Check if model_path exists locally (file or directory)
     if os.path.exists(model_path):
-        # Local path exists, return as-is
-        return model_path
+        # Local path exists, try to extract model info
+        model_name, plugin_id, manifest = _extract_info_from_manifest(model_path)
+        # If PluginId is "npu" and path is a directory, convert to file path
+        if plugin_id == "npu" and os.path.isdir(model_path):
+            model_file_path = _get_model_file_from_manifest(manifest, model_path)
+            if model_file_path:
+                model_path = model_file_path
+        return model_path, model_name, plugin_id
     # Model path doesn't exist locally, try to download from HuggingFace
     try:
@@ -1383,7 +1446,16 @@ def _download_model_if_needed(
             **kwargs
         )
-        return downloaded_path
+        # Extract model info from the downloaded manifest
+        model_name, plugin_id, manifest = _extract_info_from_manifest(downloaded_path)
+        # If PluginId is "npu" and path is a directory, convert to file path
+        if plugin_id == "npu" and os.path.isdir(downloaded_path):
+            model_file_path = _get_model_file_from_manifest(manifest, downloaded_path)
+            if model_file_path:
+                downloaded_path = model_file_path
+        return downloaded_path, model_name, plugin_id
     except Exception as e:
         # Only handle download-related errors
@@ -1452,7 +1524,7 @@ def auto_download_model(func: Callable) -> Callable:
         # Download name_or_path if needed
         if name_or_path is not None:
             try:
-                downloaded_name_path = _download_model_if_needed(
+                downloaded_name_path, model_name, plugin_id = _download_model_if_needed(
                     name_or_path, 'name_or_path', progress_callback, token, **kwargs
                 )
@@ -1463,6 +1535,10 @@ def auto_download_model(func: Callable) -> Callable:
                         args = tuple(args_list)
                 else:
                     kwargs['name_or_path'] = downloaded_name_path
+                # Add model_name to kwargs if it exists and not already set
+                if model_name is not None and 'model_name' not in kwargs:
+                    kwargs['model_name'] = model_name
             except Exception as e:
                 raise e  # Re-raise the error from _download_model_if_needed
@@ -1470,7 +1546,7 @@ def auto_download_model(func: Callable) -> Callable:
         # Download mmproj_path if needed
         if mmproj_path is not None:
             try:
-                downloaded_mmproj_path = _download_model_if_needed(
+                downloaded_mmproj_path, _, _ = _download_model_if_needed(
                     mmproj_path, 'mmproj_path', progress_callback, token, is_mmproj=True, **kwargs
                 )
@@ -1482,5 +1558,5 @@ def auto_download_model(func: Callable) -> Callable:
         # Call original function with updated paths (outside try-catch to let model creation errors bubble up)
         return func(*args, **kwargs)
     return wrapper

nexaai/vlm.py CHANGED Viewed

@@ -22,7 +22,8 @@ class VLM(BaseModel):
                    model_name: Optional[str] = None,
                    m_cfg: ModelConfig = ModelConfig(),
                    plugin_id: Union[PluginID, str] = PluginID.LLAMA_CPP,
-                   device_id: Optional[str] = None
+                   device_id: Optional[str] = None,
+                   **kwargs
         ) -> 'VLM':
         """Load VLM model from local path, routing to appropriate implementation.

nexaai/vlm_impl/pybind_vlm_impl.py CHANGED Viewed

@@ -73,7 +73,7 @@ class PyBindVLMImpl(VLM):
         handle = vlm_bind.create_vlm(
             model_path=local_path,
             mmproj_path=mmproj_path,
-            # model_name=model_name, # TODO: enable model_name in pybind later
+            model_name=model_name,
             model_config=config,
             plugin_id=plugin_id_str,
             device_id=device_id
@@ -109,11 +109,10 @@ class PyBindVLMImpl(VLM):
                 t = c["type"]
                 if t == "text":
                     blocks.append({"type": "text", "text": c.get("text","") or ""})
-                elif t == "image":
-                    # Pass through the original structure - let vlm-bind.cpp handle field extraction
-                    blocks.append(c)
                 else:
-                    raise ValueError(f"Unsupported content type: {t}. Use 'text' or 'image' to match the golden reference in vlm.cpp")
+                    # Pass through the original structure for image, audio, and any other types
+                    # Let vlm-bind.cpp handle field extraction (text/url/path)
+                    blocks.append(c)
             payload.append({"role": role, "content": blocks})

{nexaai-1.0.21rc4.dist-info → nexaai-1.0.21rc5.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: nexaai
-Version: 1.0.21rc4
+Version: 1.0.21rc5
 Summary: Python bindings for NexaSDK C-lib backend
 Author-email: "Nexa AI, Inc." <dev@nexa.ai>
 Project-URL: Homepage, https://github.com/NexaAI/nexasdk-bridge
@@ -14,7 +14,6 @@ Requires-Python: >=3.7
 Description-Content-Type: text/markdown
 Requires-Dist: huggingface_hub
 Requires-Dist: tqdm
-Requires-Dist: hf_xet
 Requires-Dist: numpy
 Requires-Dist: httpx
 Provides-Extra: mlx

{nexaai-1.0.21rc4.dist-info → nexaai-1.0.21rc5.dist-info}/RECORD RENAMED Viewed

@@ -1,28 +1,29 @@
 nexaai/__init__.py,sha256=gOd7sNsqEESopw_24xgnOSkIRENrk4Fa-RMtmVv62eA,2421
-nexaai/_stub.cpython-310-darwin.so,sha256=S7HBEXSqi5I45poF3LYs2TG074WA8bKc1x8HwuoZyWs,66768
-nexaai/_version.py,sha256=96J46jiKFpZK_xMMQViecm1z3kZktIDNNqQCXx0kYp0,143
-nexaai/asr.py,sha256=NljMXDErwPNMOPaRkJZMEDka9Nk8xyur7L8i924TStY,2054
+nexaai/_stub.cpython-310-darwin.so,sha256=tKGwBF2vBcfDMxLzlwD0mCcn3NhgwqqkETX_6ZQhxEY,66768
+nexaai/_version.py,sha256=xjLVIdWRLT2AZrjSVMMaQ9riEM81_VB5EUm6fx_kLHU,143
+nexaai/asr.py,sha256=BglyvLM_SiLbQwKhihOuiyX2m1I9-Kq_gYcE7vpjBPY,2083
 nexaai/base.py,sha256=N8PRgDFA-XPku2vWnQIofQ7ipz3pPlO6f8YZGnuhquE,982
-nexaai/common.py,sha256=Y0NJNLTi4Nq4x1WL6PQsSvGUto0eGmWhjpsC6jcekfA,3444
-nexaai/cv.py,sha256=RHCDo8gvBH8BkGZx7qVyp-OKxqi7E1GG9XzyaXehCNA,3273
-nexaai/embedder.py,sha256=Cw0tSHkPgd-RI62afCqQAcTHMnQhaI2CvfTMO-1JKOg,2452
-nexaai/image_gen.py,sha256=0C_5Tjj4BYmxLbmMmvwajp-yy2mmEEOKwBFnDQNPzx4,4356
-nexaai/llm.py,sha256=S1o_k2VQoF5w2wO25f142OO1R75TP89Ii69VZv8pIGo,3567
+nexaai/common.py,sha256=MRWZ6a7pnci_OUHxZRm3YqgKLAtZFD7b88STYDfeIF8,3460
+nexaai/cv.py,sha256=gpE3F__6bjh8OQKNJZs-QrBuCxqMj2eH-u6HR90vGZE,3302
+nexaai/embedder.py,sha256=lXOT16PEvd_hT23d77dZH38VHNOAk-3JvoOUdQTEaGI,2552
+nexaai/image_gen.py,sha256=MkGw1HXqqv8cJzbiGERNPKFXfq9vMOlvuq0pgekXw68,4385
+nexaai/llm.py,sha256=-agVJuj0FOaDvDiT-fFSOpoyVt-MpNudBucsod3Vp1M,3673
 nexaai/log.py,sha256=Kwo2CIfWN6iP4M4F5EUIV8KIO5hAsvz6HZAaOwJ27Og,2628
-nexaai/rerank.py,sha256=vWaBucoQ1wz-2iYnZqyFIcEjm-4Xcs1KDbFN5X8zzDQ,1872
+nexaai/rerank.py,sha256=rFKm1Y_ou__0lU82OTy4j_AYIGVBGfID0gzuZ6zXYsM,1968
 nexaai/runtime.py,sha256=JvllhlNPgYGLbgGyX2yNvmGzT0lZ5XbvTvEo8sZG_Ho,2067
 nexaai/runtime_error.py,sha256=sO87LyCA0qzm0hVqBrmG2FDzGQH865EMbTMop2OfZto,779
-nexaai/tts.py,sha256=ZnBpWUxIfHhh7KfEjddtH7hHOTa91zg7ogGLakMIALo,2167
-nexaai/vlm.py,sha256=MreJ_S5-C0KH3haFuJwHqVtL099MrrmBQ23vK1PINCc,4771
+nexaai/tts.py,sha256=jvgDZIyo47NBDny6z74IQT2SDDVo7Mpp-QZwl6YxARU,2196
+nexaai/vlm.py,sha256=LUrd1_SGHOsYpWyUymX93oEIsNJv7XzHIHo4hBZOhQA,4800
 nexaai/asr_impl/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 nexaai/asr_impl/mlx_asr_impl.py,sha256=eosd8-TIWAOwV0HltmoFrLwzXHcU4jyxtncvuZE9pgA,3257
 nexaai/asr_impl/pybind_asr_impl.py,sha256=pE9Hb_hMi5yAc4MF83bLVOb8zDtreCkB3_u7XED9YpA,1516
-nexaai/binds/__init__.py,sha256=eYuay_8DDXeOUWz2_R9HFSabohxs6hvZn391t2L0Po0,104
+nexaai/binds/__init__.py,sha256=tI15Ghxgp_PZAdob7op8_K5Ia8DNiTvXiYpFZyB4oN0,131
 nexaai/binds/common_bind.cpython-310-darwin.so,sha256=zxJuD0nSV--VZKxBfWZUavU7_bHj_JTi0FhkjvG4VJw,235264
-nexaai/binds/embedder_bind.cpython-310-darwin.so,sha256=tPa0c0Dv_GiW66fgmAGWGCHXRGNApznqoQS0eQx9GFM,202064
-nexaai/binds/libnexa_bridge.dylib,sha256=0nzFJHOy_JI55ALwJDo2cmNAFJqcEkwlLF40ESPFaJ4,272648
-nexaai/binds/llm_bind.cpython-310-darwin.so,sha256=TAWfa1Hzq00TjtC1xVsiAeLp6hv2LrL5afDz4omUghc,182784
-nexaai/binds/vlm_bind.cpython-310-darwin.so,sha256=VpTl0U8YmiYTyp5vNlmLRxiwGD8-4am8nBvdWYY1d-I,182704
+nexaai/binds/embedder_bind.cpython-310-darwin.so,sha256=nn3kINQUNyXIzmcU1olLg8RlkZYyIs_RtIlCk6OH1ds,202064
+nexaai/binds/libnexa_bridge.dylib,sha256=O5cI95LKiety_NjJT21lOz5KlXxUZSY5kqgXzPQXx18,272648
+nexaai/binds/llm_bind.cpython-310-darwin.so,sha256=YShsXbe_n2N05joMmTnZXaXh9gM9LGdcmuWUxUc5plI,182784
+nexaai/binds/rerank_bind.cpython-310-darwin.so,sha256=GJmffOLo9A48S_pMG2CtHyhbamtt97QikSSCXk3LqiM,183920
+nexaai/binds/vlm_bind.cpython-310-darwin.so,sha256=JEoQbyOkMXVK4WyBCqKBHbyXHtTiTWT18UkZMFvMh4k,182704
 nexaai/binds/cpu_gpu/libggml-base.dylib,sha256=9urbatWTB4QJ6uariOYlB_ZN1FFci5GaD8OfGZ9oPSQ,650736
 nexaai/binds/cpu_gpu/libggml-cpu.so,sha256=qiYxbTe4Nt7n36zJVvq3zovgSZEmrN2is6gzTern7UI,677728
 nexaai/binds/cpu_gpu/libggml-metal.so,sha256=zfaX7rIBYQazH2lf-vza007BMhPTK1ASd2T0HLLIA4E,673104
@@ -202,14 +203,14 @@ nexaai/cv_impl/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 nexaai/cv_impl/mlx_cv_impl.py,sha256=gKECQOv8iaWwG3bl7xeqVy2NN_9K7tYerIFzfn4eLo4,3228
 nexaai/cv_impl/pybind_cv_impl.py,sha256=uSmwBste4cT7c8DQmXzRLmzwDf773PAbXNYWW1UzVls,1064
 nexaai/embedder_impl/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-nexaai/embedder_impl/mlx_embedder_impl.py,sha256=dTjOC1VJ9ypIgCvkK_jKNSWpswbg132rDcTzWcL5oFA,4482
-nexaai/embedder_impl/pybind_embedder_impl.py,sha256=9gsHuSbF64IZH9ugqv4-GTUuRpy-FJNUb0cww2QR3uA,3575
+nexaai/embedder_impl/mlx_embedder_impl.py,sha256=pFPraUAjm9EVvVbwIp1cjbtXUysF5pqxEcK2CAFvcDw,4639
+nexaai/embedder_impl/pybind_embedder_impl.py,sha256=lFpf0wI2d7kfO2GUyUuUS1U2L_PyZMJVGmAvF8EuQ0g,3653
 nexaai/image_gen_impl/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 nexaai/image_gen_impl/mlx_image_gen_impl.py,sha256=BuDkksvXyb4J02GsdnbGAmYckfUU0Eah6BimoMD3QqY,11219
 nexaai/image_gen_impl/pybind_image_gen_impl.py,sha256=ms34VYoD5AxZFG6cIG0QAJDjCtfphaZ1bHzKzey1xF8,3692
 nexaai/llm_impl/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-nexaai/llm_impl/mlx_llm_impl.py,sha256=4v7jUFzHfE7zw2uViekGQDaTROz8A6oaW31Z3iVe6tg,11157
-nexaai/llm_impl/pybind_llm_impl.py,sha256=aooqkcXZWhCo07wbSafGgBrA3WnijtnUADShjjgFsBQ,8051
+nexaai/llm_impl/mlx_llm_impl.py,sha256=dPtaEribluHZZY_f9M114glcQhtDEckukw4Sfd5zJos,11296
+nexaai/llm_impl/pybind_llm_impl.py,sha256=XXnUuRZMr9rrEL1vM6VTwsgs0KQnKn4C3TyrHE46uw8,8139
 nexaai/mlx_backend/ml.py,sha256=DKXVOAfh8cg7KTKljh7jpcPwfQFNigc6uv_ZXF6lse8,23977
 nexaai/mlx_backend/profiling.py,sha256=Dc-mybFwBdCIKFWL7CbSHjkOJGAoYHG7r_e_XPhzwBU,9361
 nexaai/mlx_backend/asr/__init__.py,sha256=fuT_9_xpYJ28m4yjly5L2jChUrzlSQz-b_S7nujxkSM,451
@@ -553,21 +554,21 @@ nexaai/mlx_backend/vlm/modeling/trainer/lora.py,sha256=tGjvenjEQ8_1Az8Nz3smz5Mgv
 nexaai/mlx_backend/vlm/modeling/trainer/trainer.py,sha256=h16SaHt76JzFruXuidgXDx7_2evx4L0SecvzqLmhyZw,9081
 nexaai/mlx_backend/vlm/modeling/trainer/utils.py,sha256=29oHf_7946YeJKP_-Dt-NPeN4xJq8Fj7Yv4jZKO9RWA,4909
 nexaai/rerank_impl/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-nexaai/rerank_impl/mlx_rerank_impl.py,sha256=h37PKSIRBY8mwzVeLeP4ix9ui3waIsg4gorzelYLJbM,3243
-nexaai/rerank_impl/pybind_rerank_impl.py,sha256=CtwkG7YrW58GPMDERJSnISGTVCXWNju5__R2W837t7c,1513
+nexaai/rerank_impl/mlx_rerank_impl.py,sha256=3nbqCdzyAugc4P_6K9mowEgy4LFdfzhy7GUvn9GMpSE,3377
+nexaai/rerank_impl/pybind_rerank_impl.py,sha256=tmzrpRYCCV3ATxbE9G1Io6SUtgYPO8BFe48nTae6_xw,4490
 nexaai/tts_impl/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 nexaai/tts_impl/mlx_tts_impl.py,sha256=i_uNPdvlXYtL3e01oKjDlP9jgkWCRt1bBHsExaaiJi8,3101
 nexaai/tts_impl/pybind_tts_impl.py,sha256=mpn44r6pfYLIl-NrEy2dXHjGtWtNCmM7HRyxiANxUI4,1444
 nexaai/utils/decode.py,sha256=61n4Zf6c5QLyqGoctEitlI9BX3tPlP2a5aaKNHbw3T4,404
 nexaai/utils/manifest_utils.py,sha256=OOp_BmFWH1ZHMYkS2VGAby5Rpm4f4GLCRBJEBYm-kys,21489
-nexaai/utils/model_manager.py,sha256=CsRflxY329DgDeZxl_PGFKis7MQW7XROkrvZUCPEpvo,62022
+nexaai/utils/model_manager.py,sha256=OnL87zCPn3cBcScCKo-bHnBUpr24-Po293QC6Bwgx1Q,66112
 nexaai/utils/model_types.py,sha256=ONWjjo8CFPdhxki6qo7MXnSZaEzjBcxa_Kkf_y5NXus,1483
 nexaai/utils/progress_tracker.py,sha256=jdUqtmPqyhwC9uSKvQcJEYETwSt-OhP4oitdJ94614o,15394
 nexaai/utils/quantization_utils.py,sha256=FYcNSAKGlBqFDUTx3jSKOr2lnq4nyiyC0ZG8oSxFwiU,7825
 nexaai/vlm_impl/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 nexaai/vlm_impl/mlx_vlm_impl.py,sha256=sgHqnX5OCSGLccCnTuRiktIbqThNn3AAIvYE2_Dy4TI,10833
-nexaai/vlm_impl/pybind_vlm_impl.py,sha256=MDbreWSqugakXU_PqH6mPoCxjKEEbYfQIco_NDck8_s,9905
-nexaai-1.0.21rc4.dist-info/METADATA,sha256=GHbnStWeUZeE2wbSl1Omhzxe6i2-LrQRH03jG3i8Yco,1209
-nexaai-1.0.21rc4.dist-info/WHEEL,sha256=T2p57lol9__xkoU6aJTyN1Pm43ZpRU3q6km7mIbrAMs,114
-nexaai-1.0.21rc4.dist-info/top_level.txt,sha256=LRE2YERlrZk2vfuygnSzsEeqSknnZbz3Z1MHyNmBU4w,7
-nexaai-1.0.21rc4.dist-info/RECORD,,
+nexaai/vlm_impl/pybind_vlm_impl.py,sha256=stJKHdhYhBuWUQkky-nHgCv625qDB_1geI3v5BLNGpM,9765
+nexaai-1.0.21rc5.dist-info/METADATA,sha256=QJ9gbIXVYJHi45-NWVh9g5XxqImymoirQot4jMqi2tw,1187
+nexaai-1.0.21rc5.dist-info/WHEEL,sha256=T2p57lol9__xkoU6aJTyN1Pm43ZpRU3q6km7mIbrAMs,114
+nexaai-1.0.21rc5.dist-info/top_level.txt,sha256=LRE2YERlrZk2vfuygnSzsEeqSknnZbz3Z1MHyNmBU4w,7
+nexaai-1.0.21rc5.dist-info/RECORD,,

{nexaai-1.0.21rc4.dist-info → nexaai-1.0.21rc5.dist-info}/WHEEL RENAMED Viewed

File without changes

{nexaai-1.0.21rc4.dist-info → nexaai-1.0.21rc5.dist-info}/top_level.txt RENAMED Viewed

File without changes