PyPI - split-stack - Versions diffs - 0.2.0__py3-none-any.whl - Mend

split-stack 0.2.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (32) hide show

split_stack/__init__.py +106 -0
split_stack/__main__.py +4 -0
split_stack/advice.py +12 -0
split_stack/benchmark.py +97 -0
split_stack/cli.py +690 -0
split_stack/community_picks.py +247 -0
split_stack/compare.py +194 -0
split_stack/complexity.py +77 -0
split_stack/discovery.py +288 -0
split_stack/hints.py +102 -0
split_stack/local_models.py +63 -0
split_stack/model_guide.py +273 -0
split_stack/model_registry.py +314 -0
split_stack/models.py +77 -0
split_stack/ollama_errors.py +30 -0
split_stack/ollama_generate.py +135 -0
split_stack/poc_models.py +131 -0
split_stack/presets.py +75 -0
split_stack/quantization.py +137 -0
split_stack/requirements.py +287 -0
split_stack/routing.py +96 -0
split_stack/session.py +259 -0
split_stack/setup_wizard.py +259 -0
split_stack/startup_tips.py +169 -0
split_stack/tiering.py +66 -0
split_stack/validation.py +85 -0
split_stack-0.2.0.dist-info/METADATA +364 -0
split_stack-0.2.0.dist-info/RECORD +32 -0
split_stack-0.2.0.dist-info/WHEEL +5 -0
split_stack-0.2.0.dist-info/entry_points.txt +2 -0
split_stack-0.2.0.dist-info/licenses/LICENSE +21 -0
split_stack-0.2.0.dist-info/top_level.txt +1 -0

split_stack/discovery.py ADDED Viewed

@@ -0,0 +1,288 @@
+from __future__ import annotations
+import os
+from dataclasses import dataclass
+from pathlib import Path
+# Models directory pinned through configure_models_dir(); None means no pin is active.
+# Read by default_models_dir() and manifest_search_paths().
+_CONFIGURED_MODELS_DIR: Path | None = None
+def configure_models_dir(path: str | Path | None) -> None:
+    """Pin (or clear) the Ollama models directory used by discovery.
+
+    Args:
+        path: Directory to pin. A falsy value, a path that cannot be
+            resolved (``OSError``), or a path that is not an existing
+            directory clears the pin instead.
+    """
+    global _CONFIGURED_MODELS_DIR
+    pinned: Path | None = None
+    if path:
+        try:
+            target = Path(path).expanduser().resolve()
+        except OSError:
+            target = None
+        # Only an existing directory is worth remembering.
+        if target is not None and target.is_dir():
+            pinned = target
+    _CONFIGURED_MODELS_DIR = pinned
+def default_models_dir() -> Path | None:
+    """Return the first candidate folder that holds an Ollama manifest library.
+
+    Candidates are tried in this order: the directory pinned with
+    ``configure_models_dir``, ``SPLIT_STACK_OLLAMA_MODELS``, ``OLLAMA_MODELS``,
+    ``%USERPROFILE%/dev/Tools/.ollama/models``, ``~/dev/Tools/.ollama/models``
+    and ``~/.ollama/models``.
+
+    Returns:
+        The resolved directory whose ``manifests/registry.ollama.ai/library``
+        sub-folder exists, or ``None`` when no candidate qualifies.
+    """
+    search_order: list[Path] = []
+    if _CONFIGURED_MODELS_DIR is not None:
+        search_order.append(_CONFIGURED_MODELS_DIR)
+    env_values = (
+        os.environ.get(name, "").strip()
+        for name in ("SPLIT_STACK_OLLAMA_MODELS", "OLLAMA_MODELS")
+    )
+    search_order.extend(Path(value) for value in env_values if value)
+    user_profile = os.environ.get("USERPROFILE", "").strip()
+    if user_profile:
+        search_order.append(Path(user_profile) / "dev" / "Tools" / ".ollama" / "models")
+    home_dir = Path.home()
+    search_order.append(home_dir / "dev" / "Tools" / ".ollama" / "models")
+    search_order.append(home_dir / ".ollama" / "models")
+    visited: set[Path] = set()
+    for entry in search_order:
+        try:
+            root = entry.expanduser().resolve()
+        except OSError:
+            # Unresolvable candidate: move on to the next one.
+            continue
+        if root not in visited:
+            visited.add(root)
+            if (root / "manifests" / "registry.ollama.ai" / "library").is_dir():
+                return root
+    return None
+@dataclass(frozen=True)
+class ModelInventory:
+    """Immutable snapshot built by ``list_model_inventory``."""
+    # Model names reported by the Ollama API (empty when the API call failed).
+    api_models: tuple[str, ...]
+    # "family:tag" names found by scanning manifest folders on disk.
+    disk_models: tuple[str, ...]
+    # String form of every models directory that was scanned.
+    manifest_roots: tuple[str, ...]
+    # Models picked from the merged API + disk pool as a suggested stack.
+    suggested_stack: tuple[str, ...]
+    # Human-readable remarks (API failure, API/disk mismatch, no folders); None when there are none.
+    note: str | None = None
+def manifest_search_paths(extra_root: str | Path | None = None) -> list[Path]:
+    """List the existing Ollama model directories worth scanning.
+
+    Candidates, in order: ``OLLAMA_MODELS``, ``SPLIT_STACK_OLLAMA_MODELS``, the
+    directory pinned with ``configure_models_dir``,
+    ``%USERPROFILE%/dev/Tools/.ollama/models``, ``extra_root``,
+    ``~/.ollama/models`` and ``~/dev/Tools/.ollama/models``.
+
+    Args:
+        extra_root: Optional additional models directory to include.
+
+    Returns:
+        Resolved, de-duplicated directories in candidate order; entries that
+        cannot be resolved or are not directories are left out.
+    """
+    candidates: list[Path] = []
+    for variable in ("OLLAMA_MODELS", "SPLIT_STACK_OLLAMA_MODELS"):
+        value = os.environ.get(variable, "").strip()
+        if value:
+            candidates.append(Path(value))
+    if _CONFIGURED_MODELS_DIR is not None:
+        candidates.append(_CONFIGURED_MODELS_DIR)
+    user_profile = os.environ.get("USERPROFILE", "").strip()
+    if user_profile:
+        candidates.append(Path(user_profile) / "dev" / "Tools" / ".ollama" / "models")
+    if extra_root:
+        candidates.append(Path(extra_root))
+    home_dir = Path.home()
+    candidates.append(home_dir / ".ollama" / "models")
+    candidates.append(home_dir / "dev" / "Tools" / ".ollama" / "models")
+    # A dict keeps insertion order, so it doubles as an ordered set here.
+    unique: dict[Path, None] = {}
+    for candidate in candidates:
+        try:
+            resolved = candidate.expanduser().resolve()
+        except OSError:
+            continue
+        if resolved not in unique and resolved.is_dir():
+            unique[resolved] = None
+    return list(unique)
+def discover_models_from_disk(
+    *,
+    manifests_root: Path | str | None = None,
+) -> list[str]:
+    """Collect ``family:tag`` names from on-disk Ollama manifests.
+
+    Args:
+        manifests_root: Optional extra models directory to scan in addition
+            to the ones returned by ``manifest_search_paths``.
+
+    Returns:
+        Sorted, de-duplicated tags, one per manifest file found under
+        ``<root>/manifests/registry.ollama.ai/library/<family>/<tag>``.
+    """
+    extra = Path(manifests_root) if manifests_root else None
+    tags: set[str] = set()
+    for models_dir in manifest_search_paths(extra_root=extra):
+        library_dir = models_dir / "manifests" / "registry.ollama.ai" / "library"
+        if not library_dir.is_dir():
+            continue
+        families = (entry for entry in library_dir.iterdir() if entry.is_dir())
+        for family in families:
+            tags.update(
+                f"{family.name}:{manifest.name}"
+                for manifest in family.iterdir()
+                if manifest.is_file()
+            )
+    return sorted(tags)
+def discover_models(base_url: str = "http://127.0.0.1:11434") -> list[str]:
+    """Return the model names a running Ollama server reports via ``/api/tags``.
+
+    Args:
+        base_url: Base URL of the Ollama server; a trailing slash is ignored.
+
+    Returns:
+        Non-empty ``name`` values from the response's ``models`` list, in
+        server order. An empty list when the payload carries no models.
+
+    Raises:
+        RuntimeError: If the optional ``requests`` dependency is missing.
+        requests.RequestException: On connection failure, timeout (5 s) or a
+            non-2xx status.
+    """
+    try:
+        import requests
+    except ImportError as exc:
+        raise RuntimeError(
+            "discover_models requires optional dependency: pip install split-stack[ollama]"
+        ) from exc
+    url = f"{base_url.rstrip('/')}/api/tags"
+    response = requests.get(url, timeout=5)
+    response.raise_for_status()
+    payload = response.json()
+    # "models" may be absent or JSON null; ``.get("models", [])`` would hand
+    # back None in the null case and the iteration below would raise TypeError.
+    entries = payload.get("models") if isinstance(payload, dict) else None
+    names = [
+        entry.get("name", "")
+        for entry in (entries or [])
+        if isinstance(entry, dict)
+    ]
+    return [name for name in names if name]
+def _suggest_stack_from_pool(model_names: list[str], *, count: int = 3) -> list[str]:
+    """Pick up to ``count`` models from the pool as a suggested stack.
+
+    Pools no larger than ``count`` are returned unchanged (as a new list).
+    Larger pools are ranked by ``model_weight``; for the default ``count`` of
+    3 the lowest-ranked, middle and highest-ranked entries are returned,
+    otherwise the first ``count`` entries of the ranking.
+    """
+    if not model_names:
+        return []
+    if len(model_names) <= count:
+        return list(model_names)
+    # Imported lazily: only needed once the pool actually has to be ranked.
+    from split_stack.model_registry import load_registry, model_weight
+    registry = load_registry()
+    def weight_of(name: str):
+        return model_weight(name, registry)
+    by_weight = sorted(model_names, key=weight_of)
+    if count != 3:
+        return by_weight[:count]
+    # The pool is larger than three here, so all three picks exist.
+    middle = len(by_weight) // 2
+    return [by_weight[0], by_weight[middle], by_weight[-1]]
+def list_model_inventory(
+    *,
+    base_url: str = "http://127.0.0.1:11434",
+    manifests_root: Path | str | None = None,
+) -> ModelInventory:
+    """Combine the Ollama API listing with an on-disk manifest scan.
+
+    Args:
+        base_url: Base URL of the Ollama server to query.
+        manifests_root: Optional extra models directory to scan.
+
+    Returns:
+        A ``ModelInventory``. Any failure of the API call is captured in
+        ``note`` rather than raised, so disk results are still reported.
+    """
+    extra = Path(manifests_root) if manifests_root else None
+    scan_roots = manifest_search_paths(extra_root=extra)
+    try:
+        from_api = discover_models(base_url=base_url)
+        failure: str | None = None
+    except Exception as exc:
+        # Best effort: an unreachable server must not hide the disk scan.
+        from_api = []
+        failure = str(exc)
+    from_disk = discover_models_from_disk(manifests_root=manifests_root)
+    combined = sorted({*from_api, *from_disk})
+    stack = _suggest_stack_from_pool(combined, count=3)
+    remarks: list[str] = []
+    if failure:
+        remarks.append(f"Ollama API unreachable: {failure}")
+    elif len(from_api) < len(from_disk):
+        remarks.append(
+            f"Ollama API lists {len(from_api)} model(s) but disk has {len(from_disk)}. "
+            "Point Ollama at your model folder (OLLAMA_MODELS) or use disk models in the demo."
+        )
+    if not scan_roots:
+        remarks.append("No Ollama model directories found on disk.")
+    return ModelInventory(
+        api_models=tuple(from_api),
+        disk_models=tuple(from_disk),
+        manifest_roots=tuple(str(root) for root in scan_roots),
+        suggested_stack=tuple(stack),
+        note=" ".join(remarks) if remarks else None,
+    )
+def model_locations_by_tag(
+    *,
+    manifests_root: Path | str | None = None,
+) -> dict[str, tuple[str, ...]]:
+    """Index every ``family:tag`` by the model directories that contain it.
+
+    Args:
+        manifests_root: Optional extra models directory to scan.
+
+    Returns:
+        A dict ordered by tag; each value lists the containing roots (as
+        strings) in scan order.
+    """
+    extra = Path(manifests_root) if manifests_root else None
+    found: dict[str, list[str]] = {}
+    for models_dir in manifest_search_paths(extra_root=extra):
+        library_dir = models_dir / "manifests" / "registry.ollama.ai" / "library"
+        if not library_dir.is_dir():
+            continue
+        for family in library_dir.iterdir():
+            if not family.is_dir():
+                continue
+            manifests = [entry for entry in family.iterdir() if entry.is_file()]
+            for manifest in manifests:
+                key = f"{family.name}:{manifest.name}"
+                if key not in found:
+                    found[key] = []
+                found[key].append(str(models_dir))
+    return {key: tuple(found[key]) for key in sorted(found)}
+def audit_model_folders(
+    *,
+    manifests_root: Path | str | None = None,
+) -> dict[str, object]:
+    """Report which tags exist in more than one Ollama model directory.
+
+    Args:
+        manifests_root: Optional extra models directory to include in the scan.
+
+    Returns:
+        A dict with the keys ``primary_root`` (str or None), ``scan_roots``,
+        ``tag_count``, ``locations`` (tag -> list of roots), ``duplicates``
+        (only tags found in more than one root) and ``duplicate_tags``
+        (sorted tag names).
+    """
+    locations = model_locations_by_tag(manifests_root=manifests_root)
+    duplicates = {tag: list(paths) for tag, paths in locations.items() if len(paths) > 1}
+    primary = default_models_dir()
+    if primary is None:
+        fallback = Path.home() / ".ollama" / "models"
+        primary = fallback if fallback.is_dir() else None
+    # Use the same root set that produced ``locations``; leaving out
+    # ``manifests_root`` here could report locations under a root that is
+    # missing from ``scan_roots``.
+    # NOTE(review): entries are Path objects while ``primary_root`` is a str;
+    # confirm what callers expect before changing the element type.
+    scan_roots = manifest_search_paths(
+        extra_root=Path(manifests_root) if manifests_root else None
+    )
+    return {
+        "primary_root": str(primary) if primary else None,
+        "scan_roots": list(scan_roots),
+        "tag_count": len(locations),
+        "locations": {tag: list(paths) for tag, paths in locations.items()},
+        "duplicates": duplicates,
+        "duplicate_tags": sorted(duplicates),
+    }
+def _manifest_files_by_tag(library: Path) -> dict[str, Path]:
+    """Map ``family:tag`` to its manifest file for one library directory."""
+    manifests: dict[str, Path] = {}
+    for family_dir in library.iterdir():
+        if not family_dir.is_dir():
+            continue
+        for tag_path in family_dir.iterdir():
+            if tag_path.is_file():
+                manifests[f"{family_dir.name}:{tag_path.name}"] = tag_path
+    return manifests
+def remove_duplicate_manifests(
+    *,
+    keep_root: str | Path,
+    drop_roots: list[str | Path] | None = None,
+) -> list[str]:
+    """Delete manifest files from secondary folders when keep_root already has the tag.
+
+    Tags are compared by name only (``family:tag``); manifest contents are
+    not inspected.
+
+    Args:
+        keep_root: Models directory whose manifests are kept.
+        drop_roots: Models directories to prune. ``None`` means every
+            directory from ``manifest_search_paths()``; an explicit empty
+            list prunes nothing.
+
+    Returns:
+        One ``"<tag> @ <root>"`` entry per deleted manifest file; empty when
+        ``keep_root`` has no manifest library.
+
+    Raises:
+        OSError: If a manifest file cannot be deleted.
+    """
+    keep = Path(keep_root).expanduser().resolve()
+    keep_library = keep / "manifests" / "registry.ollama.ai" / "library"
+    if not keep_library.is_dir():
+        return []
+    # Only fall back to the global search paths when the caller gave no list
+    # at all; ``drop_roots or ...`` would turn ``[]`` into "prune everywhere".
+    candidates = manifest_search_paths() if drop_roots is None else drop_roots
+    keep_tags = set(_manifest_files_by_tag(keep_library))
+    keep_library_real = keep_library.resolve()
+    removed: list[str] = []
+    visited: set[Path] = {keep}
+    for candidate in candidates:
+        drop = Path(candidate).expanduser().resolve()
+        if drop in visited or not drop.is_dir():
+            continue
+        visited.add(drop)
+        library = drop / "manifests" / "registry.ollama.ai" / "library"
+        if not library.is_dir():
+            continue
+        # A library that resolves to the kept one (e.g. via a symlinked
+        # sub-folder) is the same data: deleting there would delete the
+        # manifests that are supposed to be kept.
+        if library.resolve() == keep_library_real:
+            continue
+        for tag, tag_path in _manifest_files_by_tag(library).items():
+            if tag in keep_tags:
+                tag_path.unlink()
+                removed.append(f"{tag} @ {drop}")
+    return removed

split_stack/hints.py ADDED Viewed

@@ -0,0 +1,102 @@
+"""Agent step hints for agent-loop routing."""
+from __future__ import annotations
+from split_stack.models import ComplexityTier, StepKind
+# Five step types used in compare POC and agent-runner demos.
+# Each entry carries: "id" (canonical hint name), "tier" (a ComplexityTier
+# value), "label" (short display name) and "summary" (one-line description).
+HINT_CATALOG: tuple[dict[str, str], ...] = (
+    {
+        "id": "lookup",
+        "tier": ComplexityTier.SIMPLE.value,
+        "label": "Lookup",
+        "summary": "Facts, definitions, one-liners",
+    },
+    {
+        "id": "explain",
+        "tier": ComplexityTier.MEDIUM.value,
+        "label": "Explain",
+        "summary": "Summarise, compare, outline, plan",
+    },
+    {
+        "id": "design",
+        "tier": ComplexityTier.COMPLEX.value,
+        "label": "Design",
+        "summary": "Architecture, strategy, tradeoffs",
+    },
+    {
+        "id": "code",
+        "tier": ComplexityTier.COMPLEX.value,
+        "label": "Code",
+        "summary": "Implement, refactor, debug (uses code slot when set)",
+    },
+    {
+        "id": "reason",
+        "tier": ComplexityTier.REASONING.value,
+        "label": "Reason",
+        "summary": "Proofs, step-by-step, formal logic",
+    },
+)
+# Short-lived aliases from an earlier 4-hint experiment.
+# Maps a legacy hint name to the canonical catalog id it is rewritten to.
+LEGACY_HINT_ALIASES: dict[str, str] = {
+    "work": "explain",
+    "build": "design",
+}
+# Ids of all HINT_CATALOG entries, for O(1) membership tests.
+_CANONICAL_IDS = frozenset(item["id"] for item in HINT_CATALOG)
+def canonical_hint_id(hint: str | StepKind | None) -> str | None:
+    """Normalise a hint to its canonical id string.
+
+    Args:
+        hint: A ``StepKind``, a hint string (case and surrounding whitespace
+            are ignored), or ``None``.
+
+    Returns:
+        ``None`` for ``None``; a catalog id when the hint is one; the mapped
+        id for a legacy alias; otherwise the cleaned-up input unchanged (no
+        validation happens here).
+    """
+    if hint is None:
+        return None
+    key = hint.value if isinstance(hint, StepKind) else hint.strip().lower()
+    if key in _CANONICAL_IDS:
+        return key
+    # Legacy aliases are rewritten; anything else passes through as-is.
+    return LEGACY_HINT_ALIASES.get(key, key)
+def normalize_step_kind(hint: str | StepKind | None) -> StepKind | None:
+    """Convert a hint into a ``StepKind``.
+
+    Args:
+        hint: A ``StepKind`` (returned unchanged), a hint string (case and
+            surrounding whitespace are ignored; legacy aliases are accepted),
+            or ``None``.
+
+    Returns:
+        The matching ``StepKind``, or ``None`` when ``hint`` is ``None``.
+
+    Raises:
+        ValueError: If the hint does not name a ``StepKind`` value; the
+            message lists the catalog ids.
+    """
+    if hint is None:
+        return None
+    if isinstance(hint, StepKind):
+        return hint
+    # canonical_hint_id strips and lower-cases the string itself and never
+    # returns None for a string, so no separate None check is needed.
+    canonical = canonical_hint_id(hint)
+    try:
+        return StepKind(canonical)
+    except ValueError as exc:
+        valid = ", ".join(item["id"] for item in HINT_CATALOG)
+        raise ValueError(f"Unknown step hint '{hint}'. Valid hints: {valid}") from exc
+def prefer_code_model(hint: str | StepKind | None) -> bool:
+    """Tell whether the hint is the ``"code"`` step.
+
+    Strings are compared after stripping whitespace and lower-casing;
+    ``None`` yields ``False``.
+    """
+    if isinstance(hint, StepKind):
+        return hint.value == "code"
+    return hint is not None and hint.strip().lower() == "code"
+def tier_from_step_kind(kind: StepKind) -> ComplexityTier:
+    """Return the complexity tier a step kind is routed to.
+
+    Raises:
+        KeyError: If ``kind`` has no tier assigned below.
+    """
+    # Grouped by tier for readability, then flattened into a per-kind table.
+    kinds_by_tier = {
+        ComplexityTier.SIMPLE: (StepKind.LOOKUP,),
+        ComplexityTier.MEDIUM: (StepKind.EXPLAIN, StepKind.WORK),
+        ComplexityTier.COMPLEX: (StepKind.DESIGN, StepKind.BUILD, StepKind.CODE),
+        ComplexityTier.REASONING: (StepKind.REASON,),
+    }
+    tier_of = {
+        step: tier
+        for tier, steps in kinds_by_tier.items()
+        for step in steps
+    }
+    return tier_of[kind]
+def list_hints() -> tuple[dict[str, str], ...]:
+    """Return the hint catalog (the shared ``HINT_CATALOG`` tuple itself, not a copy)."""
+    return HINT_CATALOG

split_stack/local_models.py ADDED Viewed

@@ -0,0 +1,63 @@
+from __future__ import annotations
+from split_stack.discovery import discover_models, discover_models_from_disk, list_model_inventory
+from split_stack.model_registry import ResolvedModel, load_registry, resolve_discovered_models
+from split_stack.tiering import assign_tiers
+def list_local_models(
+    *,
+    base_url: str = "http://127.0.0.1:11434",
+    config_path: str | None = None,
+    profile: str | None = None,
+    only_vram_ok: bool = False,
+    include_disk: bool = False,
+    quant_mode: str | None = None,
+) -> tuple[list[ResolvedModel], str | None]:
+    """Discover local models and resolve them against the registry.
+
+    Args:
+        base_url: Base URL of the Ollama server.
+        config_path: Passed to ``load_registry``.
+        profile: Passed to ``load_registry``.
+        only_vram_ok: Request VRAM filtering; only effective when the
+            registry's ``apply_vram_filter`` is also set.
+        include_disk: Also include models found by the on-disk manifest scan.
+            In this mode an unreachable Ollama API is reported in the warning
+            instead of raising, so disk models remain usable.
+        quant_mode: Passed to ``resolve_discovered_models``.
+
+    Returns:
+        ``(resolved_models, warning)``; ``warning`` is ``None`` when there is
+        nothing to report.
+
+    Raises:
+        Exception: Whatever ``discover_models`` raises when ``include_disk``
+            is false and the API cannot be queried.
+    """
+    registry = load_registry(config_path, profile=profile)
+    note: str | None = None
+    if include_disk:
+        # The inventory already queries the API and tolerates its failure.
+        # Calling discover_models() first would raise before the disk
+        # fallback ran, and would hit the API twice.
+        inventory = list_model_inventory(base_url=base_url)
+        discovered = sorted(set(inventory.api_models) | set(inventory.disk_models))
+        note = inventory.note
+    else:
+        discovered = discover_models(base_url=base_url)
+    effective_filter = only_vram_ok and registry.apply_vram_filter
+    resolved = resolve_discovered_models(
+        discovered,
+        registry=registry,
+        only_vram_ok=effective_filter,
+        quant_mode=quant_mode,
+    )
+    messages: list[str] = []
+    if effective_filter and len(resolved) < 2:
+        messages.append(
+            "Fewer than two models fit assumed_vram_gb="
+            f"{registry.assumed_vram_gb}. Add smaller models, pick a larger workstation profile, "
+            "or set deployment_profile to datacenter with a custom catalog."
+        )
+    if note:
+        messages.append(note)
+    warning = " ".join(messages) if messages else None
+    return resolved, warning
+def assign_tiers_from_local(
+    *,
+    base_url: str = "http://127.0.0.1:11434",
+    config_path: str | None = None,
+    profile: str | None = None,
+    only_vram_ok: bool = True,
+    quant_mode: str | None = None,
+):
+    """Discover local models and assign them to tiers.
+
+    All arguments are forwarded to ``list_local_models`` (disk scanning is
+    not requested).
+
+    Returns:
+        ``(tiers, models, warning)``: the result of ``assign_tiers`` on the
+        model names, the resolved models, and the discovery warning.
+
+    Raises:
+        RuntimeError: If discovery and filtering leave no models.
+    """
+    models, warning = list_local_models(
+        base_url=base_url,
+        config_path=config_path,
+        profile=profile,
+        only_vram_ok=only_vram_ok,
+        quant_mode=quant_mode,
+    )
+    if models:
+        names = [model.name for model in models]
+        return assign_tiers(names), models, warning
+    raise RuntimeError("No models available after discovery and VRAM filter")