PyPI - contextcore - Versions diffs - 0.1.0__py3-none-any.whl - Mend

contextcore 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (63)

activity/__init__.py +1 -0
activity/recent_sync.py +56 -0
audio_search_implementation_v2/__init__.py +1 -0
audio_search_implementation_v2/audio_index.py +67 -0
audio_search_implementation_v2/scanner.py +47 -0
audio_search_implementation_v2/worker.py +17 -0
auth_manager.py +57 -0
cli/__init__.py +2 -0
cli/commands/__init__.py +1 -0
cli/commands/doctor.py +238 -0
cli/commands/helpers.py +500 -0
cli/commands/init.py +1022 -0
cli/commands/report.py +185 -0
cli/commands/search.py +172 -0
cli/commands/status.py +296 -0
cli/commands/update.py +122 -0
cli/constants.py +5 -0
cli/env.py +60 -0
cli/lifecycle.py +353 -0
cli/main.py +293 -0
cli/paths.py +53 -0
cli/server.py +216 -0
cli/ui.py +165 -0
config.py +500 -0
contextcore-0.1.0.dist-info/METADATA +693 -0
contextcore-0.1.0.dist-info/RECORD +63 -0
contextcore-0.1.0.dist-info/WHEEL +5 -0
contextcore-0.1.0.dist-info/entry_points.txt +2 -0
contextcore-0.1.0.dist-info/licenses/LICENSE +661 -0
contextcore-0.1.0.dist-info/top_level.txt +17 -0
core/__init__.py +16 -0
core/sdk.py +233 -0
detect_paths.py +346 -0
image_search_implementation_v2/__init__.py +1 -0
image_search_implementation_v2/annoy_store.py +210 -0
image_search_implementation_v2/config.py +34 -0
image_search_implementation_v2/db.py +277 -0
image_search_implementation_v2/embedder.py +55 -0
image_search_implementation_v2/index_worker.py +114 -0
image_search_implementation_v2/main.py +42 -0
image_search_implementation_v2/ocr.py +30 -0
image_search_implementation_v2/search.py +258 -0
index_controller/__init__.py +1 -0
index_controller/ignore.py +27 -0
index_controller/thumbnail_manager.py +112 -0
mcp_registration.py +360 -0
mcp_server.py +1391 -0
rclone_service.py +55 -0
register_mcp.py +710 -0
run_index_pipeline.py +614 -0
text_search_implementation_v2/__init__.py +1 -0
text_search_implementation_v2/config.py +8 -0
text_search_implementation_v2/db.py +148 -0
text_search_implementation_v2/extract.py +191 -0
text_search_implementation_v2/index_controller.py +30 -0
text_search_implementation_v2/index_worker.py +237 -0
text_search_implementation_v2/main.py +56 -0
text_search_implementation_v2/search.py +264 -0
unimain.py +3868 -0
video_search_implementation_v2/__init__.py +1 -0
video_search_implementation_v2/runtime.py +216 -0
video_search_implementation_v2/video_index.py +659 -0
video_search_implementation_v2/watcher.py +181 -0

activity/__init__.py ADDED Viewed

	@@ -0,0 +1 @@
1	+ """ContextCore activity helpers package."""

activity/recent_sync.py ADDED Viewed

@@ -0,0 +1,56 @@
+# activity/recent_sync.py
+import json
+import time
+from pathlib import Path
+from threading import Lock
+import sys
+_ROOT = Path(__file__).resolve().parent.parent
+sys.path.insert(0, str(_ROOT))
+from config import get_organized_root
+MAX_ITEMS = 5  # record_sync() truncates the stored history to this many entries
+STATE_PATH = get_organized_root() / ".radxa_state" / "recent_sync.json"  # JSON file read by _load() and written by _save()
+_lock = Lock()  # held by record_sync() and get_recent_syncs() around their access to the state file
+def _load():
+    """Return the stored recent-sync entries, or ``[]`` when none are usable.
+    A missing, unreadable or malformed state file counts as empty history,
+    and so does valid JSON whose top-level value is not a list.
+    """
+    try:
+        # json.dumps() in _save() emits ASCII-only text, so decoding as UTF-8 is always compatible.
+        data = json.loads(STATE_PATH.read_text(encoding="utf-8"))
+    except (OSError, ValueError):
+        # OSError: file missing or unreadable. ValueError: invalid JSON or undecodable bytes.
+        return []
+    # record_sync() filters, prepends to and slices the result, so only a list is usable.
+    return data if isinstance(data, list) else []
+def _save(items):
+    """Write *items* to STATE_PATH as indented JSON, creating the parent directory first."""
+    state_dir = STATE_PATH.parent
+    state_dir.mkdir(parents=True, exist_ok=True)
+    payload = json.dumps(items, indent=2)
+    STATE_PATH.write_text(payload)
+def record_sync(path: str, category: str):
+    """Put *path* at the front of the recent-sync history and persist it.
+    Any earlier entry for the same path is replaced, and the history is cut to MAX_ITEMS entries.
+    """
+    with _lock:
+        history = _load()
+        basename = Path(path).name
+        # Drop the previous entry for this path so it is not listed twice.
+        others = [entry for entry in history if entry["path"] != path]
+        newest = {
+            "path": path,
+            "filename": basename,
+            "category": category,
+            "synced_at": int(time.time()),
+        }
+        _save([newest, *others][:MAX_ITEMS])
+def get_recent_syncs():
+    """Return the stored recent-sync entries, read while holding the module lock."""
+    with _lock:
+        recent = _load()
+    return recent

audio_search_implementation_v2/__init__.py ADDED Viewed

	@@ -0,0 +1 @@
1	+ """Audio indexing and transcription package for ContextCore."""

audio_search_implementation_v2/audio_index.py ADDED Viewed

@@ -0,0 +1,67 @@
+from __future__ import annotations
+import threading
+from pathlib import Path
+from faster_whisper import WhisperModel
+from text_search_implementation_v2.db import get_file_mtime, upsert_file
+AUDIO_EXTS = {".mp3", ".wav", ".m4a", ".aac", ".flac", ".ogg"}  # lower-case suffixes that scan_audio_index() treats as audio
+_whisper_model = None  # WhisperModel instance cached by get_whisper() after the first load
+_whisper_lock = threading.Lock()  # NOTE(review): not acquired anywhere in the visible part of this module - confirm where it is used
+def get_whisper():
+    """Return the module-wide WhisperModel, constructing it on the first call."""
+    global _whisper_model
+    if _whisper_model is not None:
+        return _whisper_model
+    print("Loading Whisper model...")
+    _whisper_model = WhisperModel("small.en", device="cpu", compute_type="int8")
+    return _whisper_model
+def prewarm_whisper() -> tuple[bool, str | None]:
+    """Load the Whisper model ahead of time.
+    Returns ``(True, None)`` on success, or ``(False, message)`` with the text of the exception raised while loading.
+    """
+    try:
+        get_whisper()
+    except Exception as load_error:
+        return False, str(load_error)
+    else:
+        return True, None
+def transcribe_audio(path: Path):
+    """Transcribe the audio file at *path* and return its non-empty segment texts joined by single spaces."""
+    segments, _info = get_whisper().transcribe(str(path))
+    pieces = []
+    for segment in segments:
+        text = segment.text.strip()
+        if text:
+            pieces.append(text)
+    return " ".join(pieces)
+def scan_audio_index(audio_root: Path):
+    """Transcribe and index the new or modified audio files found under *audio_root*.
+    Returns a dict with ``status`` and ``new_audio_indexed``, the number of files indexed by this call.
+    """
+    indexed = 0
+    for candidate in audio_root.rglob("*"):
+        is_audio = candidate.is_file() and candidate.suffix.lower() in AUDIO_EXTS
+        if not is_audio:
+            continue
+        try:
+            modified = candidate.stat().st_mtime
+        except Exception:
+            continue
+        known_mtime = get_file_mtime(str(candidate))
+        # A stored mtime equal to the one on disk means the file was already indexed.
+        unchanged = known_mtime is not None and abs(known_mtime - modified) < 0.001
+        if unchanged:
+            continue
+        print("Transcribing:", candidate)
+        try:
+            text = transcribe_audio(candidate)
+        except Exception as exc:
+            print("Transcription failed:", exc)
+            continue
+        if text:
+            upsert_file(str(candidate), candidate.name, "audio", modified, text)
+            indexed += 1
+    return {"status": "ok", "new_audio_indexed": indexed}

audio_search_implementation_v2/scanner.py ADDED Viewed

@@ -0,0 +1,47 @@
+# audio_search_implementation_v2/scanner.py
+from pathlib import Path
+from faster_whisper import WhisperModel
+from text_search_implementation_v2.db import upsert_file, get_file_mtime
+AUDIO_EXTS = {".mp3", ".wav", ".m4a", ".aac", ".flac", ".ogg"}  # lower-case suffixes that run_audio_scan() treats as audio
+def run_audio_scan(audio_root: Path):
+    """Transcribe and index the new or modified audio files found under *audio_root*.
+    A fresh WhisperModel is loaded for the scan. Files whose stored mtime matches the one on disk
+    are skipped, as are files that fail to transcribe or yield no text.
+    Returns the number of files indexed by this call.
+    """
+    print("🎧 Loading Whisper model...")
+    model = WhisperModel("small.en", device="cpu", compute_type="int8")
+    total_new = 0
+    for p in audio_root.rglob("*"):
+        if not p.is_file() or p.suffix.lower() not in AUDIO_EXTS:
+            continue
+        try:
+            mtime = p.stat().st_mtime
+        except OSError:
+            # The file vanished or became unreadable between listing and stat.
+            continue
+        existing_mtime = get_file_mtime(str(p))
+        if existing_mtime is not None and abs(existing_mtime - mtime) < 0.001:
+            continue
+        print("🎧 Transcribing:", p)
+        try:
+            segments, _ = model.transcribe(str(p))
+            # Drop blank segments: joining them would give a whitespace-only transcript,
+            # which is truthy and would slip past the emptiness check below.
+            transcript = " ".join(filter(None, (seg.text.strip() for seg in segments)))
+        except Exception as e:
+            print("⚠️ Transcription failed:", e)
+            continue
+        if not transcript:
+            continue
+        upsert_file(str(p), p.name, "audio", mtime, transcript)
+        total_new += 1
+    print("🎧 Audio indexing complete. New files:", total_new)
+    return total_new

audio_search_implementation_v2/worker.py ADDED Viewed

@@ -0,0 +1,17 @@
+# audio_search_implementation_v2/worker.py
+import sys
+sys.path.insert(0, str(__import__("pathlib").Path(__file__).resolve().parent.parent))
+from pathlib import Path
+from audio_search_implementation_v2.scanner import run_audio_scan
+from config import get_audio_directories
+if __name__ == "__main__":
+    # Script entry point: scan each configured audio directory that exists on disk.
+    configured_dirs = get_audio_directories()
+    print("🚀 Audio worker started")
+    indexed = sum(run_audio_scan(root) for root in configured_dirs if root.is_dir())
+    print("🚀 Audio worker exiting. Indexed:", indexed)

auth_manager.py ADDED Viewed

@@ -0,0 +1,57 @@
+import subprocess
+import threading
+import uuid
+import re
+import json
+auth_sessions = {}  # session id -> session record; entries are created by start_auth() and updated by _monitor_process()
+def start_auth(storage_type):
+    """Start ``rclone authorize`` for *storage_type* and return the id of the new auth session.
+    The session record is stored in ``auth_sessions`` and a daemon thread running
+    _monitor_process() is started to follow the process output.
+    """
+    command = ["rclone", "authorize", storage_type, "--auth-no-open-browser"]
+    session_id = str(uuid.uuid4())
+    # stderr is merged into stdout so the monitor thread reads a single text stream.
+    process = subprocess.Popen(command, stdout=subprocess.PIPE, stderr=subprocess.STDOUT, text=True)
+    auth_sessions[session_id] = dict(
+        process=process,
+        status="starting",
+        verification_url=None,
+        user_code=None,
+        token=None,
+    )
+    monitor = threading.Thread(target=_monitor_process, args=(session_id,), daemon=True)
+    monitor.start()
+    return session_id
+def _monitor_process(session_id):
+    """Follow the rclone output for *session_id* and update its session record.
+    Each output line is echoed and scanned for the verification URL, the user code and the
+    token JSON. The function returns once the output stream ends and the process has exited.
+    """
+    session = auth_sessions[session_id]
+    process = session["process"]
+    for line in process.stdout:
+        line = line.strip()
+        print("AUTH OUTPUT:", line)
+        # Capture verification URL: store the URL itself, not the log text around it.
+        if "http" in line and "google" in line:
+            url_match = re.search(r"https?://\S+", line)
+            # Fall back to the whole line when "http" appears without a full URL.
+            session["verification_url"] = url_match.group(0) if url_match else line
+            session["status"] = "waiting_for_user"
+        # Capture user code: keep only the matched XXXX-XXXX code, not the whole line.
+        code_match = re.search(r"[A-Z0-9]{4}-[A-Z0-9]{4}", line)
+        if code_match:
+            session["user_code"] = code_match.group(0)
+        # Capture token JSON
+        if line.startswith("{") and "access_token" in line:
+            session["token"] = line
+            session["status"] = "completed"
+    process.wait()

cli/__init__.py ADDED Viewed

	@@ -0,0 +1,2 @@
1	+ # cli/__init__.py
2	+ # ContextCore CLI package

cli/commands/__init__.py ADDED Viewed

	@@ -0,0 +1 @@
1	+ # cli/commands/__init__.py

cli/commands/doctor.py ADDED Viewed

@@ -0,0 +1,238 @@
+# cli/commands/doctor.py
+#
+# contextcore doctor - diagnostic check of the local installation.
+from __future__ import annotations
+import json
+import platform
+import shutil
+import sqlite3
+import subprocess
+import sys
+from pathlib import Path
+from cli.constants import DEFAULT_PORT
+from cli.lifecycle import autostart_status, get_port_usage, index_lock_active, read_index_state
+from cli.paths import get_sdk_root
+from cli.ui import console, error, header, hint, section, success, warning
+def _check(label: str, ok: bool, fix_label: str = "", fix_cmd: str = "") -> bool:
+    """Report the outcome of one check and return *ok* unchanged.
+    A passing check is shown with success(); a failing one with error(), followed by a
+    hint(fix_label, fix_cmd) when *fix_cmd* is non-empty.
+    """
+    if not ok:
+        error(label)
+        if fix_cmd:
+            hint(fix_label, fix_cmd)
+        return ok
+    success(label)
+    return ok
+def run_doctor() -> None:
+    """Run the ``contextcore doctor`` diagnostics and print a report.
+    Sections, in order: runtime (Python, SQLite, sqlite-vec), configuration, autostart, index lock,
+    MCP server, FastAPI server port, Claude Desktop registration, optional models and image-search
+    capabilities. Failed checks in the required sections are counted and summarised at the end;
+    the index-lock, optional-model and image-search sections only print warnings.
+    """
+    header("ContextCore Doctor")
+    console.print("[dim]Checking your ContextCore setup...[/dim]")
+    sdk_root = get_sdk_root()
+    issues = 0
+    section("Runtime")
+    py_ok = sys.version_info >= (3, 10)
+    if not _check(
+        f"Python {sys.version.split()[0]} {'(OK)' if py_ok else '(requires 3.10+)'}",
+        py_ok,
+        "upgrade python",
+        "https://python.org/downloads",
+    ):
+        issues += 1
+    try:
+        with sqlite3.connect(":memory:") as c:
+            c.execute("SELECT 1").fetchone()
+        _check("SQLite accessible", True)
+    except Exception as e:
+        _check(f"SQLite error: {e}", False)
+        issues += 1
+    try:
+        import sqlite_vec  # noqa: F401
+        _check("sqlite-vec installed", True)
+    except ImportError:
+        # Use the running interpreter's pip, like the other install hints below, instead of a
+        # hard-coded Windows virtualenv path.
+        _check("sqlite-vec not installed", False, "install sqlite-vec", f"{sys.executable} -m pip install sqlite-vec")
+        issues += 1
+    section("Configuration")
+    cfg = Path.home() / ".contextcore" / "contextcore.yaml"
+    if _check(
+        f"Config file at {cfg}",
+        cfg.exists(),
+        "run init to create config",
+        "contextcore init",
+    ):
+        try:
+            cfg_lines = cfg.read_text(encoding="utf-8").splitlines()
+        except (OSError, UnicodeDecodeError) as e:
+            # An unreadable config is reported as an issue rather than aborting the remaining checks.
+            error(f"Could not read config: {e}")
+            issues += 1
+            cfg_lines = []
+        # Only the first top-level "organized_root:" line is inspected.
+        for line in cfg_lines:
+            if line.startswith("organized_root:"):
+                val = line.split(":", 1)[1].strip().strip("'\"")
+                root = Path(val)
+                if not _check(
+                    f"organized_root exists: {root}",
+                    root.exists(),
+                    "create the directory or update the config",
+                    f"mkdir \"{root}\"",
+                ):
+                    issues += 1
+                break
+    else:
+        issues += 1
+    section("Autostart")
+    auto = autostart_status()
+    installed = bool(auto.get("installed"))
+    if _check(
+        f"Autostart {'installed' if installed else 'not installed'}",
+        installed,
+        "repair autostart",
+        "contextcore init",
+    ):
+        if auto.get("target"):
+            success(f"Autostart target: {auto.get('target')}")
+    else:
+        issues += 1
+    section("Index Lock")
+    active_lock, state = index_lock_active()
+    if active_lock:
+        success("A full index job is active")
+        if state.get("source"):
+            success(f"Source: {state.get('source')}")
+    else:
+        success("No active full index lock")
+    if state.get("stale_lock_recovered_at"):
+        warning(f"Recovered stale lock at {state.get('stale_lock_recovered_at')}")
+    elif read_index_state().get("active"):
+        warning("Index state says active, but no live lock was found")
+    section("MCP Server")
+    mcp = sdk_root / "mcp_server.py"
+    if _check("mcp_server.py found", mcp.exists(), "reinstall contextcore", "pip install --force-reinstall contextcore"):
+        try:
+            # Text mode so stderr is a str (not a bytes repr) when it is printed below.
+            r = subprocess.run(
+                [sys.executable, "-c", "import mcp_server"],
+                capture_output=True,
+                text=True,
+                errors="replace",
+                cwd=str(sdk_root),
+                timeout=10,
+            )
+            import_ok = r.returncode == 0
+            detail = r.stderr.strip()[-400:]
+        except subprocess.TimeoutExpired:
+            # A hanging import counts as a failed check instead of crashing the doctor run.
+            import_ok = False
+            detail = "import check timed out after 10 seconds"
+        _check(
+            "mcp_server imports cleanly",
+            import_ok,
+            "retry MCP import check",
+            f"cd \"{sdk_root}\" && \"{sys.executable}\" -c \"import mcp_server\"",
+        )
+        if not import_ok:
+            console.print(f"  [dim]{detail}[/dim]")
+            issues += 1
+    else:
+        issues += 1
+    section("FastAPI Server")
+    usage = get_port_usage(DEFAULT_PORT)
+    if usage.get("is_contextcore"):
+        success(f"Server listening on port {DEFAULT_PORT}")
+    elif usage.get("in_use"):
+        pid = usage.get("pid")
+        name = usage.get("process_name") or "unknown"
+        on_windows = platform.system() == "Windows"
+        # Without a PID there is nothing to inspect, so no hint command is offered.
+        if pid and on_windows:
+            inspect_cmd = f"tasklist /FI \"PID eq {pid}\""
+        elif pid:
+            inspect_cmd = f"ps -p {pid} -o pid,comm,args"
+        else:
+            inspect_cmd = ""
+        _check(
+            f"Port {DEFAULT_PORT} is occupied by {name}{f' (PID {pid})' if pid else ''}",
+            False,
+            "inspect the conflicting process",
+            inspect_cmd,
+        )
+        if on_windows and pid:
+            hint("stop it if appropriate", f"taskkill /F /PID {pid}")
+        elif pid:
+            hint("stop it if appropriate", f"kill {pid}")
+        issues += 1
+    else:
+        _check(
+            f"Server listening on port {DEFAULT_PORT}",
+            False,
+            "start the server",
+            "contextcore serve",
+        )
+        issues += 1
+    section("Claude Desktop")
+    plat = platform.system().lower()
+    if plat == "windows":
+        import os
+        claude_cfg = Path(os.environ.get("APPDATA", "~")) / "Claude" / "claude_desktop_config.json"
+    elif plat == "darwin":
+        claude_cfg = Path.home() / "Library" / "Application Support" / "Claude" / "claude_desktop_config.json"
+    else:
+        claude_cfg = Path.home() / ".config" / "Claude" / "claude_desktop_config.json"
+    # Expands the "~" fallback used when APPDATA is not set.
+    claude_cfg = claude_cfg.expanduser()
+    if _check(
+        f"Claude Desktop config found at {claude_cfg}",
+        claude_cfg.exists(),
+        "install Claude Desktop or open it once to create the config",
+        "https://claude.ai/download",
+    ):
+        try:
+            data = json.loads(claude_cfg.read_text(encoding="utf-8"))
+            has_cc = "contextcore" in data.get("mcpServers", {})
+            _check("ContextCore registered in Claude Desktop", has_cc, "re-register", "contextcore register claude-desktop")
+            if not has_cc:
+                issues += 1
+        except Exception as e:
+            error(f"Could not read Claude config: {e}")
+            issues += 1
+    else:
+        issues += 1
+    section("Optional Models")
+    try:
+        import torch  # noqa: F401
+        success("torch installed (image/video search available)")
+    except ImportError:
+        warning("torch not installed - image/video search unavailable")
+        hint("install vision model", "contextcore install clip")
+    try:
+        import faster_whisper  # noqa: F401
+        success("faster-whisper installed (audio search available)")
+    except ImportError:
+        warning("faster-whisper not installed - audio search unavailable")
+        hint("install audio model", "contextcore install audio")
+    section("Image Search Capabilities")
+    try:
+        import pytesseract  # noqa: F401
+        success("pytesseract installed (OCR Python package available)")
+    except ImportError:
+        warning("pytesseract not installed - OCR text extraction disabled")
+        hint("install OCR package", f"{sys.executable} -m pip install pytesseract")
+    tesseract_ok = bool(shutil.which("tesseract"))
+    if tesseract_ok:
+        success("tesseract binary found (OCR runtime available)")
+    else:
+        warning("tesseract binary not found - OCR text extraction disabled")
+        if platform.system() == "Windows":
+            hint("install tesseract", "winget install UB-Mannheim.TesseractOCR")
+        elif platform.system() == "Darwin":
+            hint("install tesseract", "brew install tesseract")
+        else:
+            hint("install tesseract", "sudo apt-get install tesseract-ocr")
+    try:
+        import annoy  # noqa: F401
+        success("annoy installed (semantic image ANN backend available)")
+    except ImportError:
+        warning("annoy not installed - semantic image search disabled (OCR/filename still works)")
+        hint("install annoy", f"{sys.executable} -m pip install annoy")
+    console.print()
+    if issues == 0:
+        console.print("[bold green]All checks passed[/bold green]  ContextCore is healthy.")
+    else:
+        console.print(f"[bold red]{issues} issue{'s' if issues > 1 else ''} found.[/bold red]  Follow the Fix: suggestions above.")
+    console.print()