repr-cli 0.1.0__py3-none-any.whl → 0.2.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
repr/llm.py ADDED
@@ -0,0 +1,506 @@
+ """
+ LLM detection, configuration, and testing.
+
+ Supports:
+ - Local LLMs: Ollama, LM Studio, custom OpenAI-compatible endpoints
+ - Cloud: repr.dev managed inference
+ - BYOK: Bring your own key (OpenAI, Anthropic, etc.)
+ """
+
+ from dataclasses import dataclass
+ from typing import Any
+
+ import httpx
+
+
+ @dataclass
+ class LocalLLMInfo:
+     """Information about a detected local LLM."""
+     provider: str  # "ollama", "lmstudio", "custom"
+     name: str
+     url: str
+     models: list[str]
+     default_model: str | None
+
+
+ @dataclass
+ class LLMTestResult:
+     """Result of LLM connection test."""
+     success: bool
+     provider: str
+     endpoint: str
+     model: str | None
+     response_time_ms: float | None
+     error: str | None
+
+
+ # Known local LLM endpoints
+ LOCAL_ENDPOINTS = [
+     {
+         "provider": "ollama",
+         "name": "Ollama",
+         "url": "http://localhost:11434",
+         "api_path": "/v1",
+         "models_endpoint": "/api/tags",
+     },
+     {
+         "provider": "lmstudio",
+         "name": "LM Studio",
+         "url": "http://localhost:1234",
+         "api_path": "/v1",
+         "models_endpoint": "/v1/models",
+     },
+ ]
+
+
+ def detect_local_llm() -> LocalLLMInfo | None:
+     """
+     Detect available local LLM endpoints.
+
+     Returns:
+         LocalLLMInfo if found, None otherwise
+     """
+     for endpoint in LOCAL_ENDPOINTS:
+         try:
+             # Try to connect and get models
+             models_url = f"{endpoint['url']}{endpoint['models_endpoint']}"
+             resp = httpx.get(models_url, timeout=3)
+
+             if resp.status_code == 200:
+                 data = resp.json()
+
+                 # Parse models based on provider
+                 if endpoint["provider"] == "ollama":
+                     models = [m.get("name", m.get("model", "")) for m in data.get("models", [])]
+                 else:
+                     models = [m.get("id", "") for m in data.get("data", [])]
+
+                 models = [m for m in models if m]  # Filter empty
+
+                 return LocalLLMInfo(
+                     provider=endpoint["provider"],
+                     name=endpoint["name"],
+                     url=endpoint["url"],
+                     models=models,
+                     default_model=models[0] if models else None,
+                 )
+
+         except Exception:
+             continue
+
+     return None
+
+
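For orientation, a minimal usage sketch of the detection helper above and of detect_all_local_llms() defined next (illustrative only, not shipped in repr-cli; it assumes the package is installed and importable as repr.llm, and that an Ollama or LM Studio server may be running):

# Illustrative sketch only -- not part of the repr-cli package.
from repr.llm import detect_local_llm, detect_all_local_llms

info = detect_local_llm()
if info is None:
    print("No local LLM found (is Ollama or LM Studio running?)")
else:
    print(f"Found {info.name} at {info.url} with {len(info.models)} models")
    print(f"Default model: {info.default_model}")

# Or enumerate every reachable provider instead of stopping at the first hit
for llm in detect_all_local_llms():
    print(llm.provider, llm.url, llm.models[:3])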
+ def detect_all_local_llms() -> list[LocalLLMInfo]:
+     """
+     Detect all available local LLM endpoints.
+
+     Returns:
+         List of LocalLLMInfo for all found providers
+     """
+     found = []
+
+     for endpoint in LOCAL_ENDPOINTS:
+         try:
+             models_url = f"{endpoint['url']}{endpoint['models_endpoint']}"
+             resp = httpx.get(models_url, timeout=3)
+
+             if resp.status_code == 200:
+                 data = resp.json()
+
+                 if endpoint["provider"] == "ollama":
+                     models = [m.get("name", m.get("model", "")) for m in data.get("models", [])]
+                 else:
+                     models = [m.get("id", "") for m in data.get("data", [])]
+
+                 models = [m for m in models if m]
+
+                 found.append(LocalLLMInfo(
+                     provider=endpoint["provider"],
+                     name=endpoint["name"],
+                     url=endpoint["url"],
+                     models=models,
+                     default_model=models[0] if models else None,
+                 ))
+
+         except Exception:
+             continue
+
+     return found
+
+
+ def test_local_llm(
+     url: str | None = None,
+     model: str | None = None,
+     api_key: str | None = None,
+ ) -> LLMTestResult:
+     """
+     Test local LLM connection and generation.
+
+     Args:
+         url: LLM API base URL (auto-detect if None)
+         model: Model to test (use default if None)
+         api_key: API key if required
+
+     Returns:
+         LLMTestResult with test outcome
+     """
+     import time
+
+     # Auto-detect if no URL provided
+     if not url:
+         detected = detect_local_llm()
+         if not detected:
+             return LLMTestResult(
+                 success=False,
+                 provider="unknown",
+                 endpoint="",
+                 model=None,
+                 response_time_ms=None,
+                 error="No local LLM detected. Is Ollama or LM Studio running?",
+             )
+         url = detected.url
+         if not model:
+             model = detected.default_model
+         provider = detected.provider
+     else:
+         provider = "custom"
+
+     # Determine model
+     if not model:
+         model = "llama3.2"  # Common default
+
+     # Test generation
+     try:
+         start = time.time()
+
+         headers = {"Content-Type": "application/json"}
+         if api_key:
+             headers["Authorization"] = f"Bearer {api_key}"
+
+         # Use chat completions endpoint
+         chat_url = f"{url}/v1/chat/completions"
+
+         resp = httpx.post(
+             chat_url,
+             headers=headers,
+             json={
+                 "model": model,
+                 "messages": [{"role": "user", "content": "Say 'hello' and nothing else."}],
+                 "max_tokens": 10,
+             },
+             timeout=30,
+         )
+
+         elapsed_ms = (time.time() - start) * 1000
+
+         if resp.status_code == 200:
+             return LLMTestResult(
+                 success=True,
+                 provider=provider,
+                 endpoint=url,
+                 model=model,
+                 response_time_ms=elapsed_ms,
+                 error=None,
+             )
+         else:
+             return LLMTestResult(
+                 success=False,
+                 provider=provider,
+                 endpoint=url,
+                 model=model,
+                 response_time_ms=elapsed_ms,
+                 error=f"HTTP {resp.status_code}: {resp.text[:100]}",
+             )
+
+     except httpx.ConnectError:
+         return LLMTestResult(
+             success=False,
+             provider=provider,
+             endpoint=url,
+             model=model,
+             response_time_ms=None,
+             error=f"Connection failed: {url}",
+         )
+     except httpx.TimeoutException:
+         return LLMTestResult(
+             success=False,
+             provider=provider,
+             endpoint=url,
+             model=model,
+             response_time_ms=None,
+             error="Request timed out (30s)",
+         )
+     except Exception as e:
+         return LLMTestResult(
+             success=False,
+             provider=provider,
+             endpoint=url,
+             model=model,
+             response_time_ms=None,
+             error=str(e),
+         )
+
+
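A usage sketch for the connection test above (illustrative only, not shipped in repr-cli); it assumes an Ollama server on its default port and the llama3.2 model mentioned in the code:

# Illustrative sketch only -- not part of the repr-cli package.
from repr.llm import test_local_llm

result = test_local_llm(url="http://localhost:11434", model="llama3.2")
if result.success:
    print(f"OK: {result.provider} @ {result.endpoint} ({result.response_time_ms:.0f} ms)")
else:
    print(f"Failed: {result.error}")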
+ def test_byok_provider(provider: str, api_key: str, model: str | None = None) -> LLMTestResult:
+     """
+     Test BYOK provider connection.
+
+     Args:
+         provider: Provider name (openai, anthropic, etc.)
+         api_key: API key
+         model: Model to test
+
+     Returns:
+         LLMTestResult with test outcome
+     """
+     import time
+     from .config import BYOK_PROVIDERS
+
+     if provider not in BYOK_PROVIDERS:
+         return LLMTestResult(
+             success=False,
+             provider=provider,
+             endpoint="",
+             model=model,
+             response_time_ms=None,
+             error=f"Unknown provider: {provider}",
+         )
+
+     provider_info = BYOK_PROVIDERS[provider]
+     base_url = provider_info["base_url"]
+     if not model:
+         model = provider_info["default_model"]
+
+     try:
+         start = time.time()
+
+         if provider == "anthropic":
+             # Anthropic uses different API format
+             resp = httpx.post(
+                 f"{base_url}/messages",
+                 headers={
+                     "x-api-key": api_key,
+                     "anthropic-version": "2023-06-01",
+                     "Content-Type": "application/json",
+                 },
+                 json={
+                     "model": model,
+                     "max_tokens": 10,
+                     "messages": [{"role": "user", "content": "Say 'hello' and nothing else."}],
+                 },
+                 timeout=30,
+             )
+         else:
+             # OpenAI-compatible API
+             resp = httpx.post(
+                 f"{base_url}/chat/completions",
+                 headers={
+                     "Authorization": f"Bearer {api_key}",
+                     "Content-Type": "application/json",
+                 },
+                 json={
+                     "model": model,
+                     "messages": [{"role": "user", "content": "Say 'hello' and nothing else."}],
+                     "max_tokens": 10,
+                 },
+                 timeout=30,
+             )
+
+         elapsed_ms = (time.time() - start) * 1000
+
+         if resp.status_code == 200:
+             return LLMTestResult(
+                 success=True,
+                 provider=provider,
+                 endpoint=base_url,
+                 model=model,
+                 response_time_ms=elapsed_ms,
+                 error=None,
+             )
+         elif resp.status_code == 401:
+             return LLMTestResult(
+                 success=False,
+                 provider=provider,
+                 endpoint=base_url,
+                 model=model,
+                 response_time_ms=elapsed_ms,
+                 error="Invalid API key",
+             )
+         else:
+             return LLMTestResult(
+                 success=False,
+                 provider=provider,
+                 endpoint=base_url,
+                 model=model,
+                 response_time_ms=elapsed_ms,
+                 error=f"HTTP {resp.status_code}: {resp.text[:100]}",
+             )
+
+     except Exception as e:
+         return LLMTestResult(
+             success=False,
+             provider=provider,
+             endpoint=base_url,
+             model=model,
+             response_time_ms=None,
+             error=str(e),
+         )
+
+
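A brief sketch of a BYOK key check using the function above (illustrative only; the OPENAI_API_KEY environment variable is an assumption, not something the package defines):

# Illustrative sketch only -- not part of the repr-cli package.
import os
from repr.llm import test_byok_provider

result = test_byok_provider("openai", api_key=os.environ.get("OPENAI_API_KEY", ""))
print("valid key" if result.success else f"check failed: {result.error}")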
+ def list_ollama_models(url: str = "http://localhost:11434") -> list[str]:
+     """
+     List available Ollama models.
+
+     Args:
+         url: Ollama API URL
+
+     Returns:
+         List of model names
+     """
+     try:
+         resp = httpx.get(f"{url}/api/tags", timeout=5)
+         if resp.status_code == 200:
+             data = resp.json()
+             return [m.get("name", "") for m in data.get("models", []) if m.get("name")]
+     except Exception:
+         pass
+     return []
+
+
+ def list_openai_compatible_models(url: str, api_key: str | None = None) -> list[str]:
+     """
+     List models from OpenAI-compatible endpoint.
+
+     Args:
+         url: API base URL
+         api_key: Optional API key
+
+     Returns:
+         List of model IDs
+     """
+     try:
+         headers = {}
+         if api_key:
+             headers["Authorization"] = f"Bearer {api_key}"
+
+         resp = httpx.get(f"{url}/v1/models", headers=headers, timeout=5)
+         if resp.status_code == 200:
+             data = resp.json()
+             return [m.get("id", "") for m in data.get("data", []) if m.get("id")]
+     except Exception:
+         pass
+     return []
+
+
+ def get_llm_status() -> dict[str, Any]:
+     """
+     Get comprehensive LLM status.
+
+     Returns:
+         Dict with local, cloud, and BYOK status
+     """
+     from .config import (
+         get_llm_config,
+         get_default_llm_mode,
+         list_byok_providers,
+         is_authenticated,
+         is_cloud_allowed,
+     )
+
+     llm_config = get_llm_config()
+     default_mode = get_default_llm_mode()
+
+     # Check local LLM
+     local_info = detect_local_llm()
+     local_available = local_info is not None
+
+     # Check cloud
+     cloud_available = is_authenticated() and is_cloud_allowed()
+
+     # Check BYOK
+     byok_providers = list_byok_providers()
+
+     return {
+         "default_mode": default_mode,
+         "local": {
+             "available": local_available,
+             "provider": local_info.provider if local_info else None,
+             "name": local_info.name if local_info else None,
+             "url": local_info.url if local_info else llm_config.get("local_api_url"),
+             "model": llm_config.get("local_model") or (local_info.default_model if local_info else None),
+             "models_count": len(local_info.models) if local_info else 0,
+         },
+         "cloud": {
+             "available": cloud_available,
+             "model": llm_config.get("cloud_model", "gpt-4o-mini"),
+             "blocked_reason": None if cloud_available else (
+                 "Not authenticated" if not is_authenticated() else "Local-only mode enabled"
+             ),
+         },
+         "byok": {
+             "providers": byok_providers,
+             "count": len(byok_providers),
+         },
+         "settings": {
+             "cloud_send_diffs": llm_config.get("cloud_send_diffs", False),
+             "cloud_redact_paths": llm_config.get("cloud_redact_paths", True),
+             "cloud_redact_emails": llm_config.get("cloud_redact_emails", False),
+         },
+     }
+
+
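A small sketch showing the shape of the dictionary returned by get_llm_status(), as hypothetical reporting code might consume it (illustrative only, not part of the package):

# Illustrative sketch only -- not part of the repr-cli package.
from repr.llm import get_llm_status

status = get_llm_status()
print("default mode:", status["default_mode"])
print("local:", "available" if status["local"]["available"] else "unavailable",
      status["local"]["url"], status["local"]["model"])
print("cloud:", "available" if status["cloud"]["available"]
      else status["cloud"]["blocked_reason"])
print("byok providers:", status["byok"]["count"])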
+ def get_effective_llm_mode() -> tuple[str, dict[str, Any]]:
+     """
+     Get the effective LLM mode that will be used.
+
+     Returns:
+         Tuple of (mode, config_dict)
+         Mode is one of: "local", "cloud", "byok:<provider>"
+     """
+     from .config import (
+         get_default_llm_mode,
+         get_llm_config,
+         get_byok_config,
+         is_authenticated,
+         is_cloud_allowed,
+         get_forced_mode,
+     )
+
+     # Check for forced mode
+     forced = get_forced_mode()
+     if forced:
+         if forced == "local":
+             llm_config = get_llm_config()
+             return "local", {
+                 "url": llm_config.get("local_api_url"),
+                 "model": llm_config.get("local_model"),
+             }
+
+     default_mode = get_default_llm_mode()
+     llm_config = get_llm_config()
+
+     # Handle BYOK mode
+     if default_mode.startswith("byok:"):
+         provider = default_mode.split(":", 1)[1]
+         byok_config = get_byok_config(provider)
+         if byok_config:
+             return default_mode, byok_config
+         # Fall back to local if BYOK not configured
+         default_mode = "local"
+
+     # Handle cloud mode
+     if default_mode == "cloud":
+         if is_authenticated() and is_cloud_allowed():
+             return "cloud", {
+                 "model": llm_config.get("cloud_model", "gpt-4o-mini"),
+             }
+         # Fall back to local if cloud not available
+         default_mode = "local"
+
+     # Local mode
+     return "local", {
+         "url": llm_config.get("local_api_url"),
+         "model": llm_config.get("local_model"),
+     }
+
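For orientation, a minimal sketch of how a caller might act on the (mode, config) tuple returned by get_effective_llm_mode() (illustrative only, not shipped in repr-cli; the print statements stand in for whatever the CLI actually does with each mode):

# Illustrative sketch only -- not part of the repr-cli package.
from repr.llm import get_effective_llm_mode

mode, cfg = get_effective_llm_mode()
if mode == "local":
    print("using local endpoint", cfg.get("url"), "model", cfg.get("model"))
elif mode == "cloud":
    print("using repr.dev cloud inference, model", cfg.get("model"))
else:  # "byok:<provider>"
    print("using BYOK provider", mode.split(":", 1)[1])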
repr/openai_analysis.py CHANGED
@@ -22,39 +22,97 @@ DEFAULT_EXTRACTION_MODEL = "openai/gpt-5-nano-2025-08-07"
  DEFAULT_SYNTHESIS_MODEL = "openai/gpt-5.2-2025-12-11"
  EXTRACTION_TEMPERATURE = 0.3
  SYNTHESIS_TEMPERATURE = 0.7
- COMMITS_PER_BATCH = 25
+ COMMITS_PER_BATCH = 25  # Default fallback, use config value when possible


- def get_openai_client(api_key: str = None, base_url: str = None) -> AsyncOpenAI:
+ def estimate_tokens(commits: list[dict[str, Any]]) -> int:
+     """
+     Estimate token count for a list of commits.
+
+     Uses a rough heuristic: ~4 characters per token (GPT tokenization rule of thumb).
+     Includes commit messages, file paths, and diffs.
+
+     Args:
+         commits: List of commits with diffs
+
+     Returns:
+         Estimated token count
+     """
+     total_chars = 0
+
+     for commit in commits:
+         # Count commit message
+         total_chars += len(commit.get('message', ''))
+
+         # Count file information
+         for file_info in commit.get('files', []):
+             total_chars += len(file_info.get('path', ''))
+             if 'diff' in file_info and file_info['diff']:
+                 total_chars += len(file_info['diff'])
+
+     # Rule of thumb: ~4 characters per token
+     estimated_tokens = total_chars // 4
+
+     # Add overhead for prompts and formatting (~2000 tokens)
+     return estimated_tokens + 2000
+
+
+ def get_batch_size() -> int:
+     """
+     Get batch size from config, with fallback to COMMITS_PER_BATCH constant.
+
+     Returns:
+         Batch size (max commits per batch)
+     """
+     try:
+         from .config import load_config
+         config = load_config()
+         return config.get("generation", {}).get("max_commits_per_batch", COMMITS_PER_BATCH)
+     except Exception:
+         return COMMITS_PER_BATCH
+
+
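To make the new batching knobs concrete: get_batch_size() reads generation.max_commits_per_batch from the CLI config and falls back to COMMITS_PER_BATCH (25), while estimate_tokens() applies a rough 4-characters-per-token rule plus about 2,000 tokens of prompt overhead. A small sketch that reproduces that arithmetic on fabricated commit data (illustrative only, not part of the package; the commit contents are made up):

# Illustrative sketch only -- not part of the repr-cli package.
# Mirrors the arithmetic in estimate_tokens() on one fabricated batch.
fake_commits = [
    {
        "message": "Add LLM detection for Ollama and LM Studio",
        "files": [{"path": "repr/llm.py", "diff": "+" * 6000}],  # ~6 KB diff placeholder
    }
] * 25  # one batch at the default COMMITS_PER_BATCH

total_chars = sum(
    len(c["message"]) + sum(len(f["path"]) + len(f.get("diff") or "") for f in c["files"])
    for c in fake_commits
)
print(total_chars // 4 + 2000)  # ~4 chars per token, plus ~2000 tokens of prompt overhead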
+ def get_openai_client(api_key: str = None, base_url: str = None, verbose: bool = False) -> AsyncOpenAI:
      """
      Get OpenAI-compatible client that proxies through our backend.

      Args:
          api_key: API key (optional, for local LLM mode)
          base_url: Base URL for API (optional, for local LLM mode)
+         verbose: Whether to print debug info

      Returns:
          AsyncOpenAI client
      """
+     import sys
+
      # If explicit parameters provided, use them (for local mode)
      if api_key:
          kwargs = {"api_key": api_key}
          if base_url:
              kwargs["base_url"] = base_url
+         if verbose:
+             print(f"[DEBUG] Using explicit API key with base_url: {base_url or 'OpenAI default'}", file=sys.stderr)
          return AsyncOpenAI(**kwargs)

      # Use our backend as the proxy - it will forward to LiteLLM
      # The rf_* token is used to authenticate with our backend
      _, litellm_key = get_litellm_config()
      if not litellm_key:
-         raise ValueError("Not logged in. Please run 'rf login' first.")
+         raise ValueError("Not logged in. Please run 'repr login' first.")

      # Point to our backend's LLM proxy endpoint
      backend_url = get_api_base().replace("/api/cli", "")
+     proxy_url = f"{backend_url}/api/llm/v1"
+
+     if verbose:
+         print(f"[DEBUG] Backend URL: {backend_url}", file=sys.stderr)
+         print(f"[DEBUG] Proxy URL: {proxy_url}", file=sys.stderr)
+         print(f"[DEBUG] Token: {litellm_key[:15]}...", file=sys.stderr)

      return AsyncOpenAI(
          api_key=litellm_key,
-         base_url=f"{backend_url}/api/llm/v1"
+         base_url=proxy_url
      )


@@ -146,17 +204,26 @@ List the specific technical work done in this batch. For each item:

  Focus on substance, not process."""

-     response = await client.chat.completions.create(
-         model=model,
-         messages=[
-             {"role": "system", "content": system_prompt},
-             {"role": "user", "content": user_prompt},
-         ],
-         temperature=EXTRACTION_TEMPERATURE,
-         max_tokens=16000,  # Increased for reasoning models that use tokens for thinking
-     )
-
-     return response.choices[0].message.content or ""
+     try:
+         response = await client.chat.completions.create(
+             model=model,
+             messages=[
+                 {"role": "system", "content": system_prompt},
+                 {"role": "user", "content": user_prompt},
+             ],
+             temperature=EXTRACTION_TEMPERATURE,
+             max_tokens=16000,  # Increased for reasoning models that use tokens for thinking
+         )
+
+         return response.choices[0].message.content or ""
+     except Exception as e:
+         error_msg = str(e).lower()
+         # Handle content moderation blocks gracefully
+         if "blocked" in error_msg or "content" in error_msg or "moderation" in error_msg:
+             # Skip this batch but continue with others
+             return f"[Batch {batch_num} skipped - content filter triggered]"
+         # Re-raise other errors
+         raise


  async def synthesize_profile(
@@ -290,6 +357,7 @@ async def analyze_repo_openai(
      synthesis_model: str = None,
      verbose: bool = False,
      progress_callback: callable = None,
+     since: str = None,
  ) -> str:
      """
      Analyze a single repository using OpenAI-compatible API.
@@ -303,11 +371,12 @@ async def analyze_repo_openai(
          verbose: Whether to print verbose output
          progress_callback: Optional callback for progress updates
              Signature: callback(step: str, detail: str, repo: str, progress: float)
+         since: Only analyze commits after this point (SHA or date like '2026-01-01')

      Returns:
          Repository analysis/narrative in markdown
      """
-     client = get_openai_client(api_key=api_key, base_url=base_url)
+     client = get_openai_client(api_key=api_key, base_url=base_url, verbose=verbose)

      if progress_callback:
          progress_callback(
@@ -322,6 +391,7 @@ async def analyze_repo_openai(
          repo_path=repo.path,
          count=200,  # Last 200 commits
          days=730,  # Last 2 years
+         since=since,
      )

      if not commits:
@@ -335,10 +405,11 @@ async def analyze_repo_openai(
              progress=10.0,
          )

-     # Split into batches
+     # Split into batches (use config value)
+     batch_size = get_batch_size()
      batches = [
-         commits[i:i + COMMITS_PER_BATCH]
-         for i in range(0, len(commits), COMMITS_PER_BATCH)
+         commits[i:i + batch_size]
+         for i in range(0, len(commits), batch_size)
      ]

      total_batches = len(batches)
@@ -346,7 +417,7 @@ async def analyze_repo_openai(
      if progress_callback:
          progress_callback(
              step="Analyzing",
-             detail=f"Processing {total_batches} batches ({COMMITS_PER_BATCH} commits each)",
+             detail=f"Processing {total_batches} batches ({batch_size} commits each)",
              repo=repo.name,
              progress=15.0,
          )
@@ -501,7 +572,7 @@ async def analyze_repos_openai(
              progress=92.0,
          )

-     client = get_openai_client(api_key=api_key, base_url=base_url)
+     client = get_openai_client(api_key=api_key, base_url=base_url, verbose=verbose)

      # Aggregate metadata from all repos (injected directly, not LLM-generated)
      total_commits = sum(r.commit_count for r in repos)