lemonade_sdk-8.1.4-py3-none-any.whl → lemonade_sdk-8.2.2-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of lemonade-sdk might be problematic.

Files changed (53)
  1. lemonade/cache.py +6 -1
  2. lemonade/cli.py +47 -5
  3. lemonade/common/inference_engines.py +13 -4
  4. lemonade/common/status.py +4 -4
  5. lemonade/common/system_info.py +544 -1
  6. lemonade/profilers/agt_power.py +437 -0
  7. lemonade/profilers/hwinfo_power.py +429 -0
  8. lemonade/tools/accuracy.py +143 -48
  9. lemonade/tools/adapter.py +6 -1
  10. lemonade/tools/bench.py +26 -8
  11. lemonade/tools/flm/__init__.py +1 -0
  12. lemonade/tools/flm/utils.py +303 -0
  13. lemonade/tools/huggingface/bench.py +6 -1
  14. lemonade/tools/llamacpp/bench.py +146 -27
  15. lemonade/tools/llamacpp/load.py +30 -2
  16. lemonade/tools/llamacpp/utils.py +393 -33
  17. lemonade/tools/oga/bench.py +5 -26
  18. lemonade/tools/oga/load.py +60 -121
  19. lemonade/tools/oga/migration.py +403 -0
  20. lemonade/tools/report/table.py +76 -8
  21. lemonade/tools/server/flm.py +133 -0
  22. lemonade/tools/server/llamacpp.py +220 -553
  23. lemonade/tools/server/serve.py +684 -168
  24. lemonade/tools/server/static/js/chat.js +666 -342
  25. lemonade/tools/server/static/js/model-settings.js +24 -3
  26. lemonade/tools/server/static/js/models.js +597 -73
  27. lemonade/tools/server/static/js/shared.js +79 -14
  28. lemonade/tools/server/static/logs.html +191 -0
  29. lemonade/tools/server/static/styles.css +491 -66
  30. lemonade/tools/server/static/webapp.html +83 -31
  31. lemonade/tools/server/tray.py +158 -38
  32. lemonade/tools/server/utils/macos_tray.py +226 -0
  33. lemonade/tools/server/utils/{system_tray.py → windows_tray.py} +13 -0
  34. lemonade/tools/server/webapp.py +4 -1
  35. lemonade/tools/server/wrapped_server.py +559 -0
  36. lemonade/version.py +1 -1
  37. lemonade_install/install.py +54 -611
  38. {lemonade_sdk-8.1.4.dist-info → lemonade_sdk-8.2.2.dist-info}/METADATA +29 -72
  39. lemonade_sdk-8.2.2.dist-info/RECORD +83 -0
  40. lemonade_server/cli.py +145 -37
  41. lemonade_server/model_manager.py +521 -37
  42. lemonade_server/pydantic_models.py +28 -1
  43. lemonade_server/server_models.json +246 -92
  44. lemonade_server/settings.py +39 -39
  45. lemonade/tools/quark/__init__.py +0 -0
  46. lemonade/tools/quark/quark_load.py +0 -173
  47. lemonade/tools/quark/quark_quantize.py +0 -439
  48. lemonade_sdk-8.1.4.dist-info/RECORD +0 -77
  49. {lemonade_sdk-8.1.4.dist-info → lemonade_sdk-8.2.2.dist-info}/WHEEL +0 -0
  50. {lemonade_sdk-8.1.4.dist-info → lemonade_sdk-8.2.2.dist-info}/entry_points.txt +0 -0
  51. {lemonade_sdk-8.1.4.dist-info → lemonade_sdk-8.2.2.dist-info}/licenses/LICENSE +0 -0
  52. {lemonade_sdk-8.1.4.dist-info → lemonade_sdk-8.2.2.dist-info}/licenses/NOTICE.md +0 -0
  53. {lemonade_sdk-8.1.4.dist-info → lemonade_sdk-8.2.2.dist-info}/top_level.txt +0 -0
lemonade_server/model_manager.py
@@ -1,16 +1,33 @@
 import json
 import os
+import subprocess
 from typing import Optional
 import shutil
 import huggingface_hub
 from importlib.metadata import distributions
 from lemonade_server.pydantic_models import PullConfig
+from lemonade_server.pydantic_models import PullConfig
 from lemonade.cache import DEFAULT_CACHE_DIR
-from lemonade.tools.llamacpp.utils import parse_checkpoint, download_gguf
+from lemonade.tools.llamacpp.utils import (
+    parse_checkpoint,
+    download_gguf,
+    resolve_local_gguf_model,
+)
 from lemonade.common.network import custom_snapshot_download
+from lemonade.tools.oga.migration import (
+    detect_incompatible_ryzenai_models,
+    delete_incompatible_models,
+)

 USER_MODELS_FILE = os.path.join(DEFAULT_CACHE_DIR, "user_models.json")

+from lemonade.tools.flm.utils import (
+    get_flm_installed_models,
+    is_flm_available,
+    install_flm,
+    download_flm_model,
+)
+

 class ModelManager:
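For orientation: the user-model registry that most of these changes read and write lives at `USER_MODELS_FILE`. A minimal sketch of where that path resolves, assuming `DEFAULT_CACHE_DIR` keeps a conventional home-directory location (the real value is defined in `lemonade/cache.py`, which this diff does not show):

```python
import os

# Assumption: DEFAULT_CACHE_DIR resolves under the user's home directory;
# the diff only shows that user_models.json is joined onto it.
DEFAULT_CACHE_DIR = os.path.join(os.path.expanduser("~"), ".cache", "lemonade")
USER_MODELS_FILE = os.path.join(DEFAULT_CACHE_DIR, "user_models.json")

print(USER_MODELS_FILE)  # e.g. /home/user/.cache/lemonade/user_models.json
```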
 
@@ -52,10 +69,17 @@ class ModelManager:

         # Add the model name as a key in each entry, to make it easier
         # to access later
-
+        # Also convert labels to boolean fields for LoadConfig compatibility
         for key, value in models.items():
             value["model_name"] = key

+            # Convert labels to boolean fields for backwards compatibility with LoadConfig
+            labels = value.get("labels", [])
+            if "reasoning" in labels and "reasoning" not in value:
+                value["reasoning"] = True
+            if "vision" in labels and "vision" not in value:
+                value["vision"] = True
+
         return models

     @property
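The labels-to-flags conversion above lets entries that only declare `labels` still satisfy `LoadConfig`'s boolean fields. A worked example of that loop body (the model entry is illustrative):

```python
# One supported_models entry before conversion (illustrative values).
value = {"checkpoint": "org/Model-GGUF:Q4_K_M", "labels": ["custom", "reasoning"]}

labels = value.get("labels", [])
if "reasoning" in labels and "reasoning" not in value:
    value["reasoning"] = True  # label promoted to a LoadConfig boolean field
if "vision" in labels and "vision" not in value:
    value["vision"] = True     # skipped here: "vision" is not in labels

assert value["reasoning"] is True and "vision" not in value
```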
@@ -77,17 +101,131 @@ class ModelManager:
     def downloaded_models(self) -> dict:
         """
         Returns a dictionary of locally available models.
+        For GGUF models with variants, checks if the specific variant files exist.
         """
+        from huggingface_hub.constants import HF_HUB_CACHE
+
         downloaded_models = {}
         downloaded_checkpoints = self.downloaded_hf_checkpoints
+
+        # Get FLM installed model checkpoints
+        flm_installed_checkpoints = get_flm_installed_models()
+
         for model in self.supported_models:
-            base_checkpoint = parse_checkpoint(
-                self.supported_models[model]["checkpoint"]
-            )[0]
-            if base_checkpoint in downloaded_checkpoints:
-                downloaded_models[model] = self.supported_models[model]
+            model_info = self.supported_models[model]
+
+            # Handle FLM models
+            if model_info.get("recipe") == "flm":
+                if model_info["checkpoint"] in flm_installed_checkpoints:
+                    downloaded_models[model] = model_info
+            else:
+                # Handle other models
+                checkpoint = model_info["checkpoint"]
+                base_checkpoint, variant = parse_checkpoint(checkpoint)
+
+                # Special handling for locally uploaded user models (not internet-downloaded)
+                if (
+                    model.startswith("user.")
+                    and model_info.get("source") == "local_upload"
+                ):
+                    # Locally uploaded model: checkpoint is in cache directory format (models--xxx)
+                    local_model_path = os.path.join(HF_HUB_CACHE, base_checkpoint)
+                    if os.path.exists(local_model_path):
+                        downloaded_models[model] = model_info
+                    continue
+
+                # For all other models (server models and internet-downloaded user models),
+                # use the standard verification logic with variant checks
+                if base_checkpoint in downloaded_checkpoints:
+                    # For GGUF models with variants, verify the specific variant files exist
+                    if variant and model_info.get("recipe") == "llamacpp":
+                        try:
+                            from lemonade.tools.llamacpp.utils import (
+                                identify_gguf_models,
+                            )
+                            from lemonade.common.network import custom_snapshot_download
+
+                            # Get the local snapshot path
+                            snapshot_path = custom_snapshot_download(
+                                base_checkpoint, local_files_only=True
+                            )
+
+                            # Check if the specific variant files exist
+                            core_files, sharded_files = identify_gguf_models(
+                                base_checkpoint, variant, model_info.get("mmproj", "")
+                            )
+                            all_variant_files = (
+                                list(core_files.values()) + sharded_files
+                            )
+
+                            # Verify all required files exist locally
+                            all_files_exist = True
+                            for file_path in all_variant_files:
+                                full_file_path = os.path.join(snapshot_path, file_path)
+                                if not os.path.exists(full_file_path):
+                                    all_files_exist = False
+                                    break
+
+                            if all_files_exist:
+                                downloaded_models[model] = model_info
+
+                        except Exception:
+                            # If we can't verify the variant, don't include it
+                            pass
+                    else:
+                        # For non-GGUF models or GGUF without variants, use the original logic
+                        downloaded_models[model] = model_info
         return downloaded_models

+    def register_local_model(
+        self,
+        model_name: str,
+        checkpoint: str,
+        recipe: str,
+        reasoning: bool = False,
+        vision: bool = False,
+        mmproj: str = "",
+        snapshot_path: str = "",
+    ):
+
+        model_name_clean = model_name[5:]
+
+        # Prepare model info
+        labels = ["custom"]
+        if reasoning:
+            labels.append("reasoning")
+        if vision:
+            labels.append("vision")
+
+        new_user_model = {
+            "checkpoint": checkpoint,
+            "recipe": recipe,
+            "suggested": True,
+            "labels": labels,
+            "source": "local_upload",
+        }
+        if mmproj:
+            new_user_model["mmproj"] = mmproj
+
+        # Load existing user models
+        user_models = {}
+        if os.path.exists(USER_MODELS_FILE):
+            with open(USER_MODELS_FILE, "r", encoding="utf-8") as file:
+                user_models = json.load(file)
+
+        # Check for conflicts
+        if model_name_clean in user_models:
+            raise ValueError(
+                f"{model_name_clean} is already registered."
+                f"Please use a different model name or delete the existing model."
+            )
+
+        # Save to user_models.json
+        user_models[model_name_clean] = new_user_model
+        os.makedirs(os.path.dirname(USER_MODELS_FILE), exist_ok=True)
+        with open(USER_MODELS_FILE, "w", encoding="utf-8") as file:
+            json.dump(user_models, file)
+
     @property
     def downloaded_models_enabled(self) -> dict:
         """
@@ -102,6 +240,7 @@ class ModelManager:
         checkpoint: Optional[str] = None,
         recipe: Optional[str] = None,
         reasoning: bool = False,
+        vision: bool = False,
         mmproj: str = "",
         do_not_upgrade: bool = False,
     ):
@@ -115,6 +254,7 @@ class ModelManager:
         if model not in self.supported_models:
             # Register the model as a user model if the model name
             # is not already registered
+            import logging

             # Ensure the model name includes the `user` namespace
             model_parsed = model.split(".", 1)
@@ -137,11 +277,17 @@ class ModelManager:
             )

             # JSON content that will be used for registration if the download succeeds
+            labels = ["custom"]
+            if reasoning:
+                labels.append("reasoning")
+            if vision:
+                labels.append("vision")
+
             new_user_model = {
                 "checkpoint": checkpoint,
                 "recipe": recipe,
                 "suggested": True,
-                "labels": ["custom"] + (["reasoning"] if reasoning else []),
+                "labels": labels,
             }

             if mmproj:
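After a successful pull, `new_user_model` is persisted into `user_models.json` keyed by the bare model name. An illustrative entry (field values are hypothetical; the keys match the dict built above):

```python
example_user_models = {
    "My-Model": {                                  # stored without the "user." prefix
        "checkpoint": "org/My-Model-GGUF:Q4_K_M",  # hypothetical checkpoint
        "recipe": "llamacpp",
        "suggested": True,
        "labels": ["custom", "reasoning"],
    }
}
```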
@@ -164,8 +310,64 @@ class ModelManager:
                 checkpoint=checkpoint,
                 recipe=recipe,
                 reasoning=reasoning,
+                vision=vision,
             )
         else:
+            # Model is already registered - check if trying to register with different parameters
+            existing_model = self.supported_models[model]
+            existing_checkpoint = existing_model.get("checkpoint")
+            existing_recipe = existing_model.get("recipe")
+            existing_reasoning = "reasoning" in existing_model.get("labels", [])
+            existing_mmproj = existing_model.get("mmproj", "")
+            existing_vision = "vision" in existing_model.get("labels", [])
+
+            # Compare parameters
+            checkpoint_differs = checkpoint and checkpoint != existing_checkpoint
+            recipe_differs = recipe and recipe != existing_recipe
+            reasoning_differs = reasoning and reasoning != existing_reasoning
+            mmproj_differs = mmproj and mmproj != existing_mmproj
+            vision_differs = vision and vision != existing_vision
+
+            if (
+                checkpoint_differs
+                or recipe_differs
+                or reasoning_differs
+                or mmproj_differs
+                or vision_differs
+            ):
+                conflicts = []
+                if checkpoint_differs:
+                    conflicts.append(
+                        f"checkpoint (existing: '{existing_checkpoint}', new: '{checkpoint}')"
+                    )
+                if recipe_differs:
+                    conflicts.append(
+                        f"recipe (existing: '{existing_recipe}', new: '{recipe}')"
+                    )
+                if reasoning_differs:
+                    conflicts.append(
+                        f"reasoning (existing: {existing_reasoning}, new: {reasoning})"
+                    )
+                if mmproj_differs:
+                    conflicts.append(
+                        f"mmproj (existing: '{existing_mmproj}', new: '{mmproj}')"
+                    )
+                if vision_differs:
+                    conflicts.append(
+                        f"vision (existing: {existing_vision}, new: {vision})"
+                    )
+
+                conflict_details = ", ".join(conflicts)
+
+                additional_suggestion = ""
+                if model.startswith("user."):
+                    additional_suggestion = f" or delete the existing model first using `lemonade-server delete {model}`"
+
+                raise ValueError(
+                    f"Model {model} is already registered with a different configuration. "
+                    f"Conflicting parameters: {conflict_details}. "
+                    f"Please use a different model name{additional_suggestion}."
+                )
             new_registration_model_config = None

         # Download the model
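Note that each `*_differs` comparison above is truthiness-guarded, so a falsy new value never raises a conflict: re-registering without `reasoning`, `vision`, or `mmproj` silently matches the existing entry rather than downgrading it. A minimal demonstration:

```python
# Falsy new values short-circuit, so omitting a flag is not a conflict.
existing_reasoning = True
reasoning = False  # caller did not request reasoning this time
reasoning_differs = reasoning and reasoning != existing_reasoning
assert reasoning_differs is False  # no ValueError raised for this field
```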
@@ -177,12 +379,51 @@ class ModelManager:
         gguf_model_config = PullConfig(**self.supported_models[model])
         print(f"Downloading {model} ({checkpoint_to_download})")

-        if "gguf" in checkpoint_to_download.lower():
-            download_gguf(
-                gguf_model_config.checkpoint,
-                gguf_model_config.mmproj,
-                do_not_upgrade=do_not_upgrade,
+        # Handle FLM models
+        current_recipe = (
+            recipe
+            if new_registration_model_config
+            else self.supported_models[model].get("recipe")
+        )
+        if current_recipe == "flm":
+            # Check if FLM is available, and install it if not
+            if not is_flm_available():
+                print(
+                    "FLM is not installed or not at the latest version. Installing FLM..."
+                )
+                install_flm()
+
+            try:
+                download_flm_model(checkpoint_to_download, None, do_not_upgrade)
+                print(f"Successfully downloaded FLM model: {model}")
+            except subprocess.CalledProcessError as e:
+                raise RuntimeError(
+                    f"Failed to download FLM model {model}: {e}"
+                ) from e
+            except FileNotFoundError as e:
+                # This shouldn't happen after install_flm(), but just in case
+                raise RuntimeError(
+                    f"FLM command not found even after installation attempt. "
+                    f"Please manually install FLM using 'lemonade-install --flm'."
+                ) from e
+        elif "gguf" in checkpoint_to_download.lower():
+            # Parse checkpoint to check local cache first
+            base_checkpoint, variant = parse_checkpoint(
+                gguf_model_config.checkpoint
+            )
+            local_result = resolve_local_gguf_model(
+                base_checkpoint, variant, gguf_model_config.mmproj
             )
+
+            # Only download if not found locally
+            if not local_result:
+                download_gguf(
+                    gguf_model_config.checkpoint,
+                    gguf_model_config.mmproj,
+                    do_not_upgrade=do_not_upgrade,
+                )
+            else:
+                print(f"Model already exists locally, skipping download")
         else:
             custom_snapshot_download(
                 checkpoint_to_download, do_not_upgrade=do_not_upgrade
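The two `except` branches above cover the two ways shelling out to the FLM CLI can fail: `subprocess.run(..., check=True)` raises `CalledProcessError` on a nonzero exit code, while launching a missing executable raises `FileNotFoundError`. A standalone demonstration of that split (the `--version` invocation is hypothetical; the diff only shows `flm remove`):

```python
import subprocess

try:
    subprocess.run(["flm", "--version"], check=True)   # hypothetical invocation
except FileNotFoundError:
    print("flm binary not on PATH")                    # -> the install_flm() path
except subprocess.CalledProcessError as e:
    print(f"flm exited with code {e.returncode}")      # -> treated as a download failure
```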
@@ -192,6 +433,11 @@ class ModelManager:
         # We do this registration after the download so that we don't register
         # any incorrectly configured models where the download would fail
         if new_registration_model_config:
+            # For models downloaded from the internet (HuggingFace),
+            # keep the original checkpoint format (e.g., "amd/Llama-3.2-1B-Instruct-...")
+            # Do NOT convert to cache directory format - that's only for locally uploaded models
+            new_user_model["checkpoint"] = checkpoint
+
             if os.path.exists(USER_MODELS_FILE):
                 with open(USER_MODELS_FILE, "r", encoding="utf-8") as file:
                     user_models: dict = json.load(file)
@@ -209,66 +455,304 @@ class ModelManager:
     def filter_models_by_backend(self, models: dict) -> dict:
         """
         Returns a filtered dict of models that are enabled by the
-        current environment.
+        current environment and platform.
         """
+        import platform
+
         installed_packages = {dist.metadata["Name"].lower() for dist in distributions()}

-        hybrid_installed = (
+        ryzenai_installed = (
             "onnxruntime-vitisai" in installed_packages
             and "onnxruntime-genai-directml-ryzenai" in installed_packages
         )
+
+        from lemonade_install.install import (
+            check_ryzen_ai_processor,
+            UnsupportedPlatformError,
+        )
+
+        try:
+            check_ryzen_ai_processor()
+            ryzenai_npu_available = True
+        except UnsupportedPlatformError:
+            ryzenai_npu_available = False
+
+        # On macOS, only llamacpp (GGUF) models are supported, and only on Apple Silicon with macOS 14+
+        is_macos = platform.system() == "Darwin"
+        if is_macos:
+            machine = platform.machine().lower()
+            if machine == "x86_64":
+                # Intel Macs are not supported - return empty model list with error info
+                return {
+                    "_unsupported_platform_error": {
+                        "error": "Intel Mac Not Supported",
+                        "message": (
+                            "Lemonade Server requires Apple Silicon processors on macOS. "
+                            "Intel Macs are not currently supported. "
+                            "Please use a Mac with Apple Silicon or try Lemonade on Windows/Linux."
+                        ),
+                        "platform": f"macOS {machine}",
+                        "supported": "macOS 14+ with Apple Silicon (arm64/aarch64)",
+                    }
+                }
+
+            # Check macOS version requirement
+            mac_version = platform.mac_ver()[0]
+            if mac_version:
+                major_version = int(mac_version.split(".")[0])
+                if major_version < 14:
+                    return {
+                        "_unsupported_platform_error": {
+                            "error": "macOS Version Not Supported",
+                            "message": (
+                                f"Lemonade Server requires macOS 14 or later. "
+                                f"Your system is running macOS {mac_version}. "
+                                f"Please update your macOS version to use Lemonade Server."
+                            ),
+                            "platform": f"macOS {mac_version} {machine}",
+                            "supported": "macOS 14+ with Apple Silicon (arm64/aarch64)",
+                        }
+                    }
+
         filtered = {}
         for model, value in models.items():
-            if value.get("recipe") == "oga-hybrid":
-                if hybrid_installed:
-                    filtered[model] = value
-            else:
-                filtered[model] = value
+            recipe = value.get("recipe")
+
+            # Filter Ryzen AI models based on package availability
+            if recipe == "oga-hybrid" or recipe == "oga-npu":
+                if not ryzenai_installed:
+                    continue
+
+            if recipe == "flm":
+                if not ryzenai_npu_available:
+                    continue
+
+            # On macOS, only show llamacpp models (GGUF format)
+            if is_macos and recipe != "llamacpp":
+                continue
+
+            filtered[model] = value
+
         return filtered
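A worked example of the rewritten filter on a host without the Ryzen AI wheels or NPU (flag values and model entries are illustrative; the recipe names come from the diff):

```python
ryzenai_installed = False
ryzenai_npu_available = False
is_macos = False

models = {
    "Llama-GGUF": {"recipe": "llamacpp"},
    "Llama-Hybrid": {"recipe": "oga-hybrid"},
    "Llama-FLM": {"recipe": "flm"},
}

filtered = {}
for model, value in models.items():
    recipe = value.get("recipe")
    if recipe in ("oga-hybrid", "oga-npu") and not ryzenai_installed:
        continue
    if recipe == "flm" and not ryzenai_npu_available:
        continue
    if is_macos and recipe != "llamacpp":
        continue
    filtered[model] = value

assert list(filtered) == ["Llama-GGUF"]  # only the GGUF model survives
```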
 
     def delete_model(self, model_name: str):
         """
         Deletes the specified model from local storage.
+        For GGUF models with variants, only deletes the specific variant files.
         """
+        from huggingface_hub.constants import HF_HUB_CACHE
+
         if model_name not in self.supported_models:
             raise ValueError(
                 f"Model {model_name} is not supported. Please choose from the following: "
                 f"{list(self.supported_models.keys())}"
             )

-        checkpoint = self.supported_models[model_name]["checkpoint"]
+        model_info = self.supported_models[model_name]
+        checkpoint = model_info["checkpoint"]
         print(f"Deleting {model_name} ({checkpoint})")

-        # Handle GGUF models that have the format "checkpoint:variant"
-        base_checkpoint = parse_checkpoint(checkpoint)[0]
+        # Handle FLM models
+        if model_info.get("recipe") == "flm":
+            try:
+                command = ["flm", "remove", checkpoint]
+                subprocess.run(command, check=True, encoding="utf-8", errors="replace")
+                print(f"Successfully deleted FLM model: {model_name}")
+                return
+            except subprocess.CalledProcessError as e:
+                raise ValueError(f"Failed to delete FLM model {model_name}: {e}") from e
+
+        if checkpoint.startswith("models--"):
+            # This is already in cache directory format (local model)
+            # Extract just the base directory name (models--{name}) from checkpoint
+            # which might contain full file path like models--name\files\model.gguf
+            checkpoint_parts = checkpoint.replace("\\", "/").split("/")
+            base_checkpoint = checkpoint_parts[0]  # Just the models--{name} part
+            model_cache_dir = os.path.join(HF_HUB_CACHE, base_checkpoint)
+
+            if os.path.exists(model_cache_dir):
+                shutil.rmtree(model_cache_dir)
+                print(
+                    f"Successfully deleted local model {model_name} from {model_cache_dir}"
+                )
+            else:
+                print(
+                    f"Model {model_name} directory not found at {model_cache_dir} - may have been manually deleted"
+                )

+            # Clean up user models registry
+            if model_name.startswith("user.") and os.path.exists(USER_MODELS_FILE):
+                with open(USER_MODELS_FILE, "r", encoding="utf-8") as file:
+                    user_models = json.load(file)
+
+                base_model_name = model_name[5:]  # Remove "user." prefix
+                if base_model_name in user_models:
+                    del user_models[base_model_name]
+                    with open(USER_MODELS_FILE, "w", encoding="utf-8") as file:
+                        json.dump(user_models, file)
+                    print(f"Removed {model_name} from user models registry")
+
+            return
+        # Parse checkpoint to get base and variant
+        base_checkpoint, variant = parse_checkpoint(checkpoint)
+
+        # Get the repository cache directory
+        snapshot_path = None
+        model_cache_dir = None
         try:
-            # Get the local path using snapshot_download with local_files_only=True
+            # First, try to get the local path using snapshot_download with local_files_only=True
             snapshot_path = custom_snapshot_download(
                 base_checkpoint, local_files_only=True
             )
-
             # Navigate up to the model directory (parent of snapshots directory)
-            model_path = os.path.dirname(os.path.dirname(snapshot_path))
-
-            # Delete the entire model directory (including all snapshots)
-            if os.path.exists(model_path):
-                shutil.rmtree(model_path)
-                print(f"Successfully deleted model {model_name} from {model_path}")
-            else:
-                raise ValueError(
-                    f"Model {model_name} not found locally at {model_path}"
-                )
+            model_cache_dir = os.path.dirname(os.path.dirname(snapshot_path))

         except Exception as e:
+            # If snapshot_download fails, try to construct the cache path manually
             if (
                 "not found in cache" in str(e).lower()
-                or "no such file" in str(e).lower()
+                or "localentrynotfounderror" in str(e).lower()
+                or "cannot find an appropriate cached snapshot" in str(e).lower()
             ):
-                raise ValueError(f"Model {model_name} is not installed locally")
+                # Construct the Hugging Face cache path manually
+                cache_home = huggingface_hub.constants.HF_HUB_CACHE
+                # Convert repo format (e.g., "unsloth/GLM-4.5-Air-GGUF") to cache format
+                repo_cache_name = base_checkpoint.replace("/", "--")
+                model_cache_dir = os.path.join(cache_home, f"models--{repo_cache_name}")
+                # Try to find the snapshot path within the model cache directory
+                if os.path.exists(model_cache_dir):
+                    snapshots_dir = os.path.join(model_cache_dir, "snapshots")
+                    if os.path.exists(snapshots_dir):
+                        snapshot_dirs = [
+                            d
+                            for d in os.listdir(snapshots_dir)
+                            if os.path.isdir(os.path.join(snapshots_dir, d))
+                        ]
+                        if snapshot_dirs:
+                            # Use the first (likely only) snapshot directory
+                            snapshot_path = os.path.join(
+                                snapshots_dir, snapshot_dirs[0]
+                            )
             else:
                 raise ValueError(f"Failed to delete model {model_name}: {str(e)}")

+        # Handle deletion based on whether this is a GGUF model with variants
+        if variant and snapshot_path and os.path.exists(snapshot_path):
+            # This is a GGUF model with a specific variant - delete only variant files
+            try:
+                from lemonade.tools.llamacpp.utils import identify_gguf_models
+
+                # Get the specific files for this variant
+                core_files, sharded_files = identify_gguf_models(
+                    base_checkpoint,
+                    variant,
+                    self.supported_models[model_name].get("mmproj", ""),
+                )
+                all_variant_files = list(core_files.values()) + sharded_files
+
+                # Delete the specific variant files
+                deleted_files = []
+                for file_path in all_variant_files:
+                    full_file_path = os.path.join(snapshot_path, file_path)
+                    if os.path.exists(full_file_path):
+                        if os.path.isfile(full_file_path):
+                            os.remove(full_file_path)
+                            deleted_files.append(file_path)
+                        elif os.path.isdir(full_file_path):
+                            shutil.rmtree(full_file_path)
+                            deleted_files.append(file_path)
+
+                if deleted_files:
+                    print(f"Successfully deleted variant files: {deleted_files}")
+                else:
+                    print(f"No variant files found for {variant} in {snapshot_path}")
+
+                # Check if the snapshot directory is now empty (only containing .gitattributes, README, etc.)
+                remaining_files = [
+                    f
+                    for f in os.listdir(snapshot_path)
+                    if f.endswith(".gguf")
+                    or os.path.isdir(os.path.join(snapshot_path, f))
+                ]
+
+                # If no GGUF files remain, we can delete the entire repository
+                if not remaining_files:
+                    print(f"No other variants remain, deleting entire repository cache")
+                    shutil.rmtree(model_cache_dir)
+                    print(
+                        f"Successfully deleted entire model cache at {model_cache_dir}"
+                    )
+                else:
+                    print(
+                        f"Other variants still exist in repository, keeping cache directory"
+                    )
+
+            except Exception as variant_error:
+                print(
+                    f"Warning: Could not perform selective variant deletion: {variant_error}"
+                )
+                print("This may indicate the files were already manually deleted")
+
+        elif model_cache_dir and os.path.exists(model_cache_dir):
+            # Non-GGUF model or GGUF without variant - delete entire repository as before
+            shutil.rmtree(model_cache_dir)
+            print(f"Successfully deleted model {model_name} from {model_cache_dir}")
+
+        elif model_cache_dir:
+            # Model directory doesn't exist - it was likely already manually deleted
+            print(
+                f"Model {model_name} directory not found at {model_cache_dir} - may have been manually deleted"
+            )
+
+        else:
+            raise ValueError(f"Unable to determine cache path for model {model_name}")
+
+        # Clean up user models registry if applicable
+        if model_name.startswith("user.") and os.path.exists(USER_MODELS_FILE):
+            with open(USER_MODELS_FILE, "r", encoding="utf-8") as file:
+                user_models = json.load(file)
+
+            # Remove the "user." prefix to get the actual model name in the file
+            base_model_name = model_name[5:]  # Remove "user." prefix
+
+            if base_model_name in user_models:
+                del user_models[base_model_name]
+                with open(USER_MODELS_FILE, "w", encoding="utf-8") as file:
+                    json.dump(user_models, file)
+                print(f"Removed {model_name} from user models registry")
+
+ def get_incompatible_ryzenai_models(self):
725
+ """
726
+ Get information about incompatible RyzenAI models in the cache.
727
+
728
+ Returns:
729
+ dict with 'models' list and 'total_size' info
730
+ """
731
+ # Get HF_HOME from environment
732
+ hf_home = os.environ.get("HF_HOME", None)
733
+
734
+ incompatible_models, total_size = detect_incompatible_ryzenai_models(
735
+ DEFAULT_CACHE_DIR, hf_home
736
+ )
737
+
738
+ return {
739
+ "models": incompatible_models,
740
+ "total_size": total_size,
741
+ "count": len(incompatible_models),
742
+ }
743
+
744
+ def cleanup_incompatible_models(self, model_paths: list):
745
+ """
746
+ Delete incompatible RyzenAI models from the cache.
747
+
748
+ Args:
749
+ model_paths: List of model paths to delete
750
+
751
+ Returns:
752
+ dict with deletion results
753
+ """
754
+ return delete_incompatible_models(model_paths)
755
+
272
756
 
273
757
  # This file was originally licensed under Apache 2.0. It has been modified.
274
758
  # Modifications Copyright (c) 2025 AMD