PyPI - coreai-catalog - Versions diffs - 2.0.2__py3-none-any.whl - Mend

coreai-catalog 2.0.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (26) hide show

coreai_catalog/__init__.py +12 -0
coreai_catalog/__main__.py +6 -0
coreai_catalog/api.py +254 -0
coreai_catalog/catalog.py +546 -0
coreai_catalog/cli.py +1176 -0
coreai_catalog/data/artifacts.yaml +1110 -0
coreai_catalog/data/benchmarks.yaml +933 -0
coreai_catalog/data/catalog.yaml +3885 -0
coreai_catalog/data/schema/artifact.schema.json +107 -0
coreai_catalog/data/schema/benchmark.schema.json +77 -0
coreai_catalog/data/schema/model.schema.json +240 -0
coreai_catalog/data/schema/term.schema.json +68 -0
coreai_catalog/data/schema/upstream.schema.json +59 -0
coreai_catalog/data/sources.yaml +213 -0
coreai_catalog/data/terms.yaml +391 -0
coreai_catalog/data/upstreams.yaml +673 -0
coreai_catalog/exports.py +194 -0
coreai_catalog/installer.py +280 -0
coreai_catalog/task_pages.py +193 -0
coreai_catalog-2.0.2.dist-info/METADATA +658 -0
coreai_catalog-2.0.2.dist-info/RECORD +26 -0
coreai_catalog-2.0.2.dist-info/WHEEL +5 -0
coreai_catalog-2.0.2.dist-info/entry_points.txt +3 -0
coreai_catalog-2.0.2.dist-info/top_level.txt +2 -0
mcp_server/__init__.py +1 -0
mcp_server/server.py +554 -0

coreai_catalog/__init__.py ADDED Viewed

@@ -0,0 +1,12 @@
+"""Core AI Catalog — discover, verify, and install Apple Core AI models.
+This package module re-exports ``Catalog`` from ``coreai_catalog.api`` as
+its only public name.
+Public API:
+    from coreai_catalog import Catalog
+    catalog = Catalog.load()
+    catalog.recommend(task="ocr", device="iphone")
+    catalog.compare("qwen3-vl-2b", "unlimited-ocr")
+"""
+# Re-export the high-level facade so callers can import it from the package root.
+from .api import Catalog
+# Limit ``from coreai_catalog import *`` to the facade class.
+__all__ = ["Catalog"]

coreai_catalog/__main__.py ADDED Viewed

@@ -0,0 +1,6 @@
+#!/usr/bin/env python3
+"""Entry point for python -m coreai_catalog"""
+from coreai_catalog.cli import main
+# Run the CLI only when executed as a script / via ``-m``, not on import.
+# NOTE(review): main()'s return value is discarded here; if it returns an
+# exit status, confirm whether it should be passed to sys.exit().
+if __name__ == "__main__":
+    main()

coreai_catalog/api.py ADDED Viewed

@@ -0,0 +1,254 @@
+"""
+Core AI Catalog — public Python API.
+A clean, stable interface for programmatic access to the catalog.
+Works with pip-installed package (no repo clone needed).
+Example:
+    from coreai_catalog import Catalog
+    catalog = Catalog.load()
+    catalog.recommend(task="ocr", device="iphone")
+    catalog.compare("qwen3-vl-2b", "unlimited-ocr")
+    catalog.license_report("qwen3-vl-2b")
+"""
+from __future__ import annotations
+from pathlib import Path
+from typing import Any
+from .catalog import Catalog as _Catalog, resolve_task as _resolve_task
+class Catalog:
+    """High-level catalog API for programmatic access.
+    A thin facade: every method delegates to the internal
+    ``coreai_catalog.catalog.Catalog`` instance stored in ``self._cat``.
+    Usage:
+        from coreai_catalog import Catalog
+        # Auto-discovers YAML data (bundled in pip package, or from repo root)
+        catalog = Catalog.load()
+        # Search and filter
+        results = catalog.search(capability="vision-language", device="iphone")
+        # Get recommendations
+        recs = catalog.recommend(task="ocr", device="iphone", license_filter="likely")
+        # Compare models
+        diff = catalog.compare("qwen3-vl-2b", "unlimited-ocr")
+        # License triage
+        report = catalog.license_report("qwen3-vl-2b")
+        # Browse tasks
+        tasks = catalog.tasks()
+    """
+    def __init__(self, root: Path | None = None) -> None:
+        """Wrap an internal catalog.
+        Args:
+            root: Forwarded unchanged to the internal catalog constructor.
+                  NOTE(review): presumably ``None`` triggers data
+                  auto-discovery there; confirm in ``catalog.py``.
+        """
+        self._cat = _Catalog(root)
+    @classmethod
+    def load(cls) -> "Catalog":
+        """Create a Catalog instance, auto-discovering the YAML data.
+        Search order: CWD → walk up from package → bundled package data.
+        """
+        return cls()
+    @property
+    def version(self) -> str:
+        """Catalog version string (e.g. '2.0.2').
+        Returns:
+            The ``metadata.version`` value of ``catalog.yaml`` as a string,
+            or 'unknown' when the file, the metadata mapping, or the
+            version key is missing or null.
+        """
+        # NOTE(review): presumably needed so ``root`` is resolved before use.
+        self._cat._load()
+        # Read from the raw YAML metadata
+        import yaml
+        cat_path = self._cat.root / "catalog.yaml"
+        if not cat_path.exists():
+            return "unknown"
+        # Decode explicitly as UTF-8 so the result does not depend on the
+        # platform's default text encoding.
+        data = yaml.safe_load(cat_path.read_text(encoding="utf-8")) or {}
+        # ``metadata: null`` parses to None; treat it like a missing mapping.
+        metadata = data.get("metadata") or {}
+        raw_version = metadata.get("version")
+        # YAML may parse a bare version such as ``2.0`` as a float; honour
+        # the declared ``str`` return type.
+        return "unknown" if raw_version is None else str(raw_version)
+    @property
+    def model_count(self) -> int:
+        """Total number of models in the catalog."""
+        return len(self._cat.models)
+    def search(
+        self,
+        capability: str | None = None,
+        device: str | None = None,
+        license_filter: str | None = None,
+        family: str | None = None,
+        source_group: str | None = None,
+        modality: str | None = None,
+        limit: int = 50,
+    ) -> list[dict]:
+        """Search models by criteria.
+        Args:
+            capability: Filter by capability (e.g. 'chat', 'vision-language').
+            device: Filter by device support (e.g. 'iphone', 'mac').
+            license_filter: Filter by commercial use ('likely' or 'check_license').
+            family: Filter by model family (e.g. 'Qwen', 'Gemma').
+            source_group: Filter by source ('official', 'zoo', 'external').
+            modality: Filter by input modality ('text', 'image', 'audio').
+            limit: Maximum results. Negative values are treated as 0;
+                   ``None`` returns every match.
+        Returns:
+            List of model dicts with capabilities, devices, license, score.
+        """
+        results = self._cat.search(
+            capability=capability,
+            device=device,
+            license_type=license_filter,
+            family=family,
+            source_group=source_group,
+            modality=modality,
+        )
+        # A negative slice bound would drop items from the END of the list
+        # rather than cap the count, so clamp it to zero.
+        stop = None if limit is None else max(limit, 0)
+        return results[:stop]
+    def recommend(
+        self,
+        task: str,
+        device: str | None = None,
+        license_filter: str | None = None,
+        limit: int = 5,
+    ) -> list[dict]:
+        """Recommend models for a task.
+        Args:
+            task: Task description (e.g. 'robot vision', 'private OCR').
+                  See ``catalog.tasks()`` for valid keywords.
+            device: Target device filter ('iphone', 'mac').
+            license_filter: Commercial use filter ('likely' or 'check_license').
+            limit: Maximum results.
+        Returns:
+            Sorted list of recommendations with score, matched capabilities,
+            and metadata.
+        """
+        # Translate the free-form task text into capability names first; the
+        # original text is still forwarded alongside them.
+        capabilities = _resolve_task(task)
+        return self._cat.recommend_models(
+            capabilities=capabilities,
+            device=device,
+            limit=limit,
+            task=task,
+            license_type=license_filter,
+        )
+    def get_model(self, model_id: str) -> dict | None:
+        """Get full details for a specific model.
+        Args:
+            model_id: Model ID (e.g. 'qwen3-vl-2b').
+        Returns:
+            Model dict with all fields, or None if not found.
+        """
+        return self._cat.get_model(model_id)
+    def compare(self, *model_ids: str) -> dict[str, Any]:
+        """Compare two or more models side-by-side.
+        Args:
+            *model_ids: Two or more model IDs to compare.
+        Returns:
+            Dict with a 'models' list holding one summary entry per
+            requested ID, in the order given.
+        Raises:
+            ValueError: Fewer than two IDs were supplied.
+            KeyError: One of the IDs is not in the catalog.
+        """
+        if len(model_ids) < 2:
+            raise ValueError("compare() requires at least 2 model IDs")
+        # Resolve every ID before building any entry so an unknown ID fails
+        # the whole call up front.
+        models = []
+        for mid in model_ids:
+            m = self._cat.get_model(mid)
+            if m is None:
+                raise KeyError(f"Model '{mid}' not found")
+            models.append(m)
+        result: dict[str, Any] = {"models": []}
+        for m in models:
+            # ``size: null`` in the YAML parses to None; fall back to {}.
+            size = m.get("size") or {}
+            entry = {
+                "id": m["id"],
+                # Tolerate a missing name the same way license_report() does.
+                "name": m.get("name", m["id"]),
+                "family": m.get("family"),
+                "capabilities": m.get("capabilities", []),
+                "parameters": size.get("parameters"),
+                "precision": size.get("precision"),
+                "devices": m.get("device_support", {}),
+                "license": m.get("license", {}),
+                "source_group": m.get("source_group"),
+                "score": self._cat.readiness_score(m),
+                "benchmarks": self._cat.get_benchmarks(m["id"]),
+            }
+            result["models"].append(entry)
+        return result
+    def license_report(self, model_id: str) -> dict[str, Any]:
+        """Generate a license triage report for a model.
+        Args:
+            model_id: Model ID.
+        Returns:
+            Dict with model_id, name, license_name, commercial_use,
+            officiality, and artifact_source (the artifact's Hugging Face
+            URL, or '' when there is none).
+        Raises:
+            KeyError: The model ID is not in the catalog.
+        """
+        m = self._cat.get_model(model_id)
+        if m is None:
+            raise KeyError(f"Model '{model_id}' not found")
+        # Each ``or {}`` covers both a missing key and an explicit YAML null.
+        lic = m.get("license") or {}
+        art = self._cat.get_artifact(model_id) or {}
+        hf = art.get("huggingface") or {}
+        return {
+            "model_id": model_id,
+            "name": m.get("name", model_id),
+            "license_name": lic.get("name", "unknown"),
+            "commercial_use": lic.get("commercial_use", "unknown"),
+            "officiality": art.get("officiality", {}),
+            "artifact_source": hf.get("url", ""),
+        }
+    def tasks(self) -> dict[str, list[str]]:
+        """List all supported task keywords grouped by capability.
+        Returns:
+            Dict mapping capability name to its sorted list of task
+            synonyms; the capability keys are sorted as well.
+        """
+        from .catalog import TASK_MAP
+        from collections import defaultdict
+        # TASK_MAP maps synonym -> capabilities; invert it here.
+        cap_to_tasks: dict[str, list[str]] = defaultdict(list)
+        for task_syn, caps in TASK_MAP.items():
+            for cap in caps:
+                cap_to_tasks[cap].append(task_syn)
+        return {cap: sorted(syns) for cap, syns in sorted(cap_to_tasks.items())}
+    def capabilities(self) -> list[dict[str, Any]]:
+        """List all capabilities with model counts.
+        Returns:
+            List of dicts, most common capability first, each with:
+            'capability' (name), 'model_count' (models declaring it), and
+            'benchmark_count' (how many of those models have at least one
+            benchmark record).
+        """
+        from collections import Counter
+        cap_counts: Counter = Counter()
+        bench_counts: Counter = Counter()
+        for m in self._cat.models:
+            has_bench = bool(self._cat.get_benchmarks(m["id"]))
+            # ``capabilities: null`` parses to None; iterate nothing then.
+            for c in m.get("capabilities") or []:
+                cap_counts[c] += 1
+                if has_bench:
+                    bench_counts[c] += 1
+        return [
+            {
+                "capability": cap,
+                "model_count": count,
+                "benchmark_count": bench_counts.get(cap, 0),
+            }
+            for cap, count in cap_counts.most_common()
+        ]