cortex-llm 1.0.7__tar.gz → 1.0.8__tar.gz
This diff shows the published contents of two package versions from a supported public registry. It is provided for informational purposes only and reflects the packages exactly as they appear in that registry.
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/PKG-INFO +1 -1
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/__init__.py +1 -1
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/metal/mlx_converter.py +105 -4
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex_llm.egg-info/PKG-INFO +1 -1
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/pyproject.toml +1 -1
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/setup.py +1 -1
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/LICENSE +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/README.md +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/__main__.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/config.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/conversation_manager.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/fine_tuning/__init__.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/fine_tuning/dataset.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/fine_tuning/mlx_lora_trainer.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/fine_tuning/trainer.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/fine_tuning/wizard.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/gpu_validator.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/inference_engine.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/metal/__init__.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/metal/gpu_validator.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/metal/memory_pool.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/metal/mlx_accelerator.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/metal/mlx_compat.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/metal/mps_optimizer.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/metal/optimizer.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/metal/performance_profiler.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/model_downloader.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/model_manager.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/quantization/__init__.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/quantization/dynamic_quantizer.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/template_registry/__init__.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/template_registry/auto_detector.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/template_registry/config_manager.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/template_registry/interactive.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/template_registry/registry.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/template_registry/template_profiles/__init__.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/template_registry/template_profiles/base.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/template_registry/template_profiles/complex/__init__.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/template_registry/template_profiles/complex/reasoning.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/template_registry/template_profiles/standard/__init__.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/template_registry/template_profiles/standard/alpaca.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/template_registry/template_profiles/standard/chatml.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/template_registry/template_profiles/standard/gemma.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/template_registry/template_profiles/standard/llama.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/template_registry/template_profiles/standard/simple.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/ui/__init__.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/ui/cli.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/ui/markdown_render.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex/ui/terminal_app.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex_llm.egg-info/SOURCES.txt +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex_llm.egg-info/dependency_links.txt +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex_llm.egg-info/entry_points.txt +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex_llm.egg-info/not-zip-safe +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex_llm.egg-info/requires.txt +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/cortex_llm.egg-info/top_level.txt +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/setup.cfg +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/tests/test_apple_silicon.py +0 -0
- {cortex_llm-1.0.7 → cortex_llm-1.0.8}/tests/test_metal_optimization.py +0 -0
cortex/__init__.py

@@ -5,7 +5,7 @@ A high-performance terminal interface for running Hugging Face LLMs locally
 with exclusive GPU acceleration via Metal Performance Shaders (MPS) and MLX.
 """
 
-__version__ = "1.0.7"
+__version__ = "1.0.8"
 __author__ = "Cortex Development Team"
 __license__ = "MIT"
 

cortex/metal/mlx_converter.py

@@ -66,9 +66,22 @@ class MLXConverter:
         self.cache_dir.mkdir(parents=True, exist_ok=True)
         self.conversion_cache = self.cache_dir / "conversion_cache.json"
         self._load_conversion_cache()
+        self._warned_mlx_lm_compat = False
 
         logger.info(f"MLX Converter initialized with cache dir: {self.cache_dir}")
         logger.info(f"MLX LM available: {mlx_utils is not None and load is not None}")
+
+    def _warn_mlx_lm_compat(self, missing: str) -> None:
+        """Warn once when mlx-lm is missing newer helper APIs."""
+        if self._warned_mlx_lm_compat:
+            return
+        self._warned_mlx_lm_compat = True
+        message = (
+            f"[WARN] mlx-lm is missing '{missing}'. Using compatibility fallback. "
+            "For best support, upgrade mlx-lm to a newer version."
+        )
+        logger.warning(message)
+        print(message)
 
     def _load_conversion_cache(self) -> None:
         """Load conversion cache metadata."""
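The _warn_mlx_lm_compat helper added above is a warn-once gate: the first compatibility fallback logs and prints, and every later fallback stays silent. A minimal standalone sketch of the same pattern (the class and names are illustrative, not part of the package):

    import logging

    logging.basicConfig(level=logging.WARNING)
    logger = logging.getLogger("compat")


    class CompatShim:
        """Warn a single time per process when a fallback path is taken."""

        def __init__(self) -> None:
            self._warned = False

        def warn_once(self, missing: str) -> None:
            if self._warned:
                return  # already warned; later fallbacks stay quiet
            self._warned = True
            logger.warning("'%s' unavailable; using compatibility fallback.", missing)


    shim = CompatShim()
    shim.warn_once("get_model_path")  # emits one warning
    shim.warn_once("fetch_from_hub")  # suppressed by the flag

Note the flag is per converter instance rather than per missing helper, matching the single _warned_mlx_lm_compat boolean above.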
@@ -206,6 +219,83 @@ class MLXConverter:
 
         return download_dir
 
+    def _mlx_get_model_path(self, source_path: Path) -> Tuple[Path, Optional[str]]:
+        """Resolve model path with MLX LM compatibility fallbacks."""
+        if mlx_utils is not None and hasattr(mlx_utils, "get_model_path"):
+            return mlx_utils.get_model_path(str(source_path))
+        self._warn_mlx_lm_compat("get_model_path")
+
+        # Fallback: local path or direct HF download.
+        model_path = Path(source_path)
+        if model_path.exists():
+            hf_repo = None
+            try:
+                from huggingface_hub import ModelCard
+
+                card_path = model_path / "README.md"
+                if card_path.is_file():
+                    card = ModelCard.load(card_path)
+                    hf_repo = getattr(card.data, "base_model", None)
+            except Exception:
+                hf_repo = None
+            return model_path, hf_repo
+
+        try:
+            model_path = Path(
+                snapshot_download(
+                    str(source_path),
+                    allow_patterns=[
+                        "*.json",
+                        "model*.safetensors",
+                        "*.py",
+                        "tokenizer.model",
+                        "*.tiktoken",
+                        "tiktoken.model",
+                        "*.txt",
+                        "*.jsonl",
+                        "*.jinja",
+                    ],
+                )
+            )
+        except Exception as e:
+            raise RuntimeError(f"Failed to download model from Hugging Face: {e}") from e
+
+        return model_path, str(source_path)
+
+    def _mlx_fetch_from_hub(
+        self,
+        model_path: Path,
+        trust_remote_code: bool = False
+    ) -> Tuple[Any, Dict[str, Any], Any]:
+        """Fetch model/config/tokenizer with MLX LM compatibility fallbacks."""
+        if mlx_utils is not None and hasattr(mlx_utils, "fetch_from_hub"):
+            return mlx_utils.fetch_from_hub(
+                model_path,
+                lazy=True,
+                trust_remote_code=trust_remote_code
+            )
+        self._warn_mlx_lm_compat("fetch_from_hub")
+
+        if mlx_utils is not None and hasattr(mlx_utils, "load_model") and hasattr(mlx_utils, "load_tokenizer"):
+            model, model_config = mlx_utils.load_model(model_path, lazy=True)
+            try:
+                tokenizer = mlx_utils.load_tokenizer(
+                    model_path,
+                    eos_token_ids=model_config.get("eos_token_id", None),
+                    tokenizer_config_extra={"trust_remote_code": trust_remote_code},
+                )
+            except TypeError:
+                tokenizer = mlx_utils.load_tokenizer(
+                    model_path,
+                    eos_token_ids=model_config.get("eos_token_id", None),
+                )
+            return model, model_config, tokenizer
+
+        raise RuntimeError(
+            "mlx_lm.utils is missing required helpers (fetch_from_hub/load_model). "
+            "Upgrade mlx-lm to a newer version."
+        )
+
     def _requires_sentencepiece(self, model_path: Path) -> bool:
         """Return True if the model likely needs SentencePiece."""
         # If a fast tokenizer is present, SentencePiece should not be required.
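_mlx_fetch_from_hub also probes keyword support at call time: it first invokes load_tokenizer with the newer tokenizer_config_extra keyword and retries without it when a TypeError signals an older mlx-lm signature. A self-contained sketch of that probe-and-retry idiom (both helper functions below are stand-ins, not mlx-lm APIs):

    from typing import Any, Callable, Optional


    def new_helper(path: str, *, extra: Optional[dict] = None) -> Any:
        """Stand-in for a helper that gained an 'extra' keyword in newer releases."""
        return path, extra


    def old_helper(path: str) -> Any:
        """Stand-in for the older signature without the keyword."""
        return path, None


    def call_with_keyword_fallback(fn: Callable[..., Any], path: str, extra: dict) -> Any:
        try:
            # Try the richer signature first; TypeError indicates the
            # installed release does not accept the keyword.
            return fn(path, extra=extra)
        except TypeError:
            return fn(path)


    print(call_with_keyword_fallback(new_helper, "model_dir", {"trust_remote_code": False}))
    print(call_with_keyword_fallback(old_helper, "model_dir", {"trust_remote_code": False}))

One caveat of this idiom: a TypeError raised inside the helper itself is indistinguishable from a signature mismatch, so checking inspect.signature is a stricter alternative when that matters.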
@@ -379,10 +469,17 @@
         # Build quantization configuration
         quantize_config = self._build_quantization_config(config)
 
-
-
-
-
+        try:
+            model_path, hf_repo = self._mlx_get_model_path(Path(source_path))
+        except Exception as e:
+            return False, f"Model path resolution failed: {e}", None
+
+        try:
+            model, model_config, tokenizer = self._mlx_fetch_from_hub(
+                model_path, trust_remote_code=False
+            )
+        except Exception as e:
+            return False, f"Model fetch failed: {e}", None
 
         dtype = model_config.get("torch_dtype", None)
         if dtype in ["float16", "bfloat16", "float32"]:
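Instead of letting resolution or fetch errors propagate, the new code folds them into what appears to be the method's (ok, detail, payload) result convention. A hypothetical sketch of producing and consuming that triple (the function and messages are stand-ins, not from the package):

    from typing import Optional, Tuple


    def convert_model(source: str) -> Tuple[bool, str, Optional[str]]:
        try:
            artifact = source.upper()  # placeholder for the real conversion work
        except Exception as e:
            return False, f"Model fetch failed: {e}", None
        return True, "converted", artifact


    ok, detail, artifact = convert_model("tiny-model")
    if not ok:
        print(f"conversion failed: {detail}")
    else:
        print(artifact)

Returning the failure reason in-band keeps the caller's control flow simple and makes the error string available to the UI without a traceback.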
@@ -398,6 +495,8 @@ class MLXConverter:
         model.update(tree_map_with_path(set_dtype, model.parameters()))
 
         if config.quantization != QuantizationRecipe.NONE:
+            if mlx_utils is None or not hasattr(mlx_utils, "quantize_model"):
+                return False, "MLX LM quantize_model not available; upgrade mlx-lm.", None
             quant_predicate = None
             if quantize_config and "quant_predicate" in quantize_config:
                 quant_predicate = quantize_config["quant_predicate"]
@@ -411,6 +510,8 @@ class MLXConverter:
         )
 
         normalized_hf_repo = self._normalize_hf_repo(hf_repo)
+        if mlx_utils is None or not hasattr(mlx_utils, "save"):
+            return False, "MLX LM save() not available; upgrade mlx-lm.", None
         mlx_utils.save(output_path, model_path, model, tokenizer, model_config, hf_repo=normalized_hf_repo)
         logger.info("MLX conversion completed")
 
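The quantize_model and save guards both feature-detect an optional helper with hasattr before calling it, so an outdated mlx-lm fails with an actionable upgrade hint instead of an AttributeError. A generic sketch of that guard, assuming only that the module may be None or missing the attribute (the helper name below is illustrative):

    from types import ModuleType
    from typing import Any, Callable, Optional


    def require_api(module: Optional[ModuleType], name: str) -> Callable[..., Any]:
        """Return module.<name>, or raise with an actionable upgrade hint."""
        fn = getattr(module, name, None) if module is not None else None
        if fn is None:
            raise RuntimeError(f"mlx-lm is missing '{name}'; upgrade mlx-lm.")
        return fn

    # Usage sketch: resolve once, then call.
    # save = require_api(mlx_utils, "save")
    # save(output_path, model_path, model, tokenizer, model_config)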