tricoder-1.2.8-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
tricoder/gpu_utils.py ADDED
@@ -0,0 +1,414 @@
+ """GPU acceleration utilities using CuPy (CUDA) or PyTorch (MPS for Mac)."""
+ import warnings
+ import platform
+ import sys
+ from typing import Optional, Tuple
+
+ import numpy as np
+ from scipy import sparse
+
+ # Try CuPy for CUDA (NVIDIA GPUs)
+ try:
+     import cupy as cp
+     import cupyx.scipy.sparse as cusp
+     CUPY_AVAILABLE = True
+ except ImportError:
+     CUPY_AVAILABLE = False
+     cp = None
+     cusp = None
+
+ # Try PyTorch for MPS (Mac GPUs) or CUDA fallback
+ try:
+     import torch
+     TORCH_AVAILABLE = True
+     TORCH_VERSION = torch.__version__
+ except ImportError:
+     TORCH_AVAILABLE = False
+     TORCH_VERSION = None
+     torch = None
+
+
+ def diagnose_gpu_support() -> dict:
+     """
+     Diagnose GPU support availability and provide helpful information.
+
+     Returns:
+         Dictionary with diagnostic information
+     """
+     diagnostics = {
+         'platform': platform.system(),
+         'is_mac': platform.system() == 'Darwin',
+         'python_version': sys.version,
+         'cupy_available': CUPY_AVAILABLE,
+         'torch_available': TORCH_AVAILABLE,
+         'torch_version': TORCH_VERSION,
+         'gpu_backends': []
+     }
+
+     # Check CuPy/CUDA
+     if CUPY_AVAILABLE:
+         try:
+             _ = cp.array([1, 2, 3])
+             device = cp.cuda.Device(0)
+             device.use()
+             diagnostics['gpu_backends'].append('CUDA (CuPy)')
+         except Exception as e:
+             diagnostics['cupy_error'] = str(e)
+
+     # Check PyTorch MPS (Mac)
+     if TORCH_AVAILABLE and diagnostics['is_mac']:
+         try:
+             if hasattr(torch.backends, 'mps') and hasattr(torch.backends.mps, 'is_available'):
+                 if torch.backends.mps.is_available():
+                     diagnostics['gpu_backends'].append('MPS (Mac)')
+                 else:
+                     diagnostics['mps_unavailable_reason'] = 'MPS backend not available (requires macOS 12.3+ and Apple Silicon)'
+             else:
+                 diagnostics['mps_unavailable_reason'] = f'PyTorch {TORCH_VERSION} does not support MPS (requires PyTorch 1.12+)'
+         except Exception as e:
+             diagnostics['mps_error'] = str(e)
+
+     # Check PyTorch CUDA
+     if TORCH_AVAILABLE:
+         try:
+             if torch.cuda.is_available():
+                 diagnostics['gpu_backends'].append('CUDA (PyTorch)')
+         except Exception:
+             pass
+
+     return diagnostics
+
+
+ class GPUAccelerator:
+     """GPU accelerator with automatic CPU fallback. Supports CUDA (NVIDIA) and MPS (Mac)."""
+
+     def __init__(self, use_gpu: bool = False):
+         """
+         Initialize GPU accelerator.
+
+         Args:
+             use_gpu: Whether to attempt GPU acceleration
+         """
+         self.use_gpu = False
+         self.device_type = None  # 'cuda', 'mps', or None
+         self.device = None
+         self.backend = None  # 'cupy' or 'torch'
+
+         if not use_gpu:
+             return
+
+         # Detect platform and available GPU backends
+         is_mac = platform.system() == 'Darwin'
+
+         # Try CuPy (CUDA) first on non-Mac systems
+         if not is_mac and CUPY_AVAILABLE:
+             try:
+                 _ = cp.array([1, 2, 3])
+                 self.device = cp.cuda.Device(0)
+                 self.device.use()
+                 self.use_gpu = True
+                 self.device_type = 'cuda'
+                 self.backend = 'cupy'
+                 return
+             except Exception:
+                 pass
+
+         # Try PyTorch MPS (Mac GPU)
+         if TORCH_AVAILABLE and is_mac:
+             try:
+                 # Check if MPS backend is available (requires PyTorch 1.12+ and macOS 12.3+)
+                 if hasattr(torch.backends, 'mps') and hasattr(torch.backends.mps, 'is_available'):
+                     if torch.backends.mps.is_available():
+                         self.device = torch.device('mps')
+                         # Test with a small operation
+                         test_tensor = torch.tensor([1.0, 2.0, 3.0], device=self.device)
+                         _ = test_tensor * 2
+                         self.use_gpu = True
+                         self.device_type = 'mps'
+                         self.backend = 'torch'
+                         return
+                     else:
+                         warnings.warn("MPS backend is not available. This requires macOS 12.3+ and Apple Silicon (M1/M2/M3). Falling back to CPU.")
+                 else:
+                     warnings.warn("PyTorch MPS backend not available. Please upgrade PyTorch to version 1.12+ for Mac GPU support. Falling back to CPU.")
+             except Exception as e:
+                 warnings.warn(f"MPS GPU acceleration failed: {e}. Falling back to CPU.")
+
+         # Try PyTorch CUDA as fallback (if available)
+         if TORCH_AVAILABLE and torch.cuda.is_available():
+             try:
+                 self.device = torch.device('cuda')
+                 test_tensor = torch.tensor([1.0, 2.0, 3.0], device=self.device)
+                 _ = test_tensor * 2
+                 self.use_gpu = True
+                 self.device_type = 'cuda'
+                 self.backend = 'torch'
+                 return
+             except Exception:
+                 pass
+
+         # No GPU available (use_gpu was requested, so tell the caller we fell back)
+         warnings.warn("GPU acceleration requested but no GPU backend available. Falling back to CPU.")
+
+     def to_gpu(self, arr: np.ndarray):
+         """Convert numpy array to GPU array."""
+         if not self.use_gpu:
+             return arr
+
+         if self.backend == 'cupy':
+             return cp.asarray(arr)
+         elif self.backend == 'torch':
+             tensor = torch.from_numpy(arr)
+             # MPS has no float64 support, so downcast doubles before moving them
+             if self.device_type == 'mps' and tensor.dtype == torch.float64:
+                 tensor = tensor.float()
+             return tensor.to(self.device)
+         return arr
+
+     def to_cpu(self, arr) -> np.ndarray:
+         """Convert GPU array back to CPU numpy array."""
+         if not self.use_gpu:
+             return arr
+
+         if self.backend == 'cupy' and isinstance(arr, cp.ndarray):
+             return cp.asnumpy(arr)
+         elif self.backend == 'torch' and isinstance(arr, torch.Tensor):
+             return arr.cpu().numpy()
+         return arr
+
+     def sparse_to_gpu(self, sp_matrix: sparse.spmatrix) -> 'cusp.spmatrix':
+         """Convert scipy sparse matrix to CuPy sparse matrix."""
+         # Only the CuPy backend has a sparse counterpart; with the torch
+         # backend (where cusp may be None) scipy matrices stay on the CPU
+         if self.use_gpu and self.backend == 'cupy':
+             if isinstance(sp_matrix, sparse.csr_matrix):
+                 return cusp.csr_matrix(sp_matrix)
+             elif isinstance(sp_matrix, sparse.csc_matrix):
+                 return cusp.csc_matrix(sp_matrix)
+             elif isinstance(sp_matrix, sparse.coo_matrix):
+                 return cusp.coo_matrix(sp_matrix)
+         return sp_matrix
+
+     def sparse_to_cpu(self, sp_matrix) -> sparse.spmatrix:
+         """Convert CuPy sparse matrix back to scipy sparse matrix."""
+         if self.use_gpu and hasattr(sp_matrix, 'get'):
+             # CuPy sparse matrix
+             return sp_matrix.get()
+         return sp_matrix
+
+     def svd(self, matrix: np.ndarray, n_components: int,
+             random_state: Optional[int] = None) -> Tuple[np.ndarray, np.ndarray, np.ndarray]:
+         """
+         Perform Truncated SVD on GPU or CPU.
+
+         Args:
+             matrix: Input matrix (n_samples, n_features)
+             n_components: Number of components
+             random_state: Random seed
+
+         Returns:
+             (U, S, Vt) where U @ diag(S) @ Vt approximates the input
+         """
+         if self.use_gpu:
+             try:
+                 gpu_matrix = self.to_gpu(matrix)
+
+                 if self.backend == 'cupy':
+                     # CuPy SVD
+                     U, S, Vt = cp.linalg.svd(gpu_matrix, full_matrices=False)
+                 elif self.backend == 'torch':
+                     # PyTorch SVD
+                     U, S, Vt = torch.linalg.svd(gpu_matrix, full_matrices=False)
+                 else:
+                     raise ValueError(f"Unknown backend: {self.backend}")
+
+                 # Truncate to n_components
+                 U = U[:, :n_components]
+                 S = S[:n_components]
+                 Vt = Vt[:n_components, :]
+
+                 # Convert back to CPU
+                 return self.to_cpu(U), self.to_cpu(S), self.to_cpu(Vt)
+             except Exception as e:
+                 warnings.warn(f"GPU SVD failed: {e}. Falling back to CPU.")
+                 self.use_gpu = False
+
+         # CPU fallback using sklearn
+         from sklearn.decomposition import TruncatedSVD
+         svd = TruncatedSVD(n_components=n_components, random_state=random_state, n_iter=5)
+         X_transformed = svd.fit_transform(matrix)
+         S = svd.singular_values_
+         Vt = svd.components_
+         # fit_transform returns U @ diag(S); divide S back out so the return
+         # convention (U, S, Vt) matches the GPU branch above
+         U = X_transformed / S
+         return U, S, Vt
+
+     def pca(self, matrix: np.ndarray, n_components: int,
+             random_state: Optional[int] = None) -> Tuple[np.ndarray, np.ndarray, np.ndarray]:
+         """
+         Perform PCA on GPU or CPU.
+
+         Args:
+             matrix: Input matrix (n_samples, n_features)
+             n_components: Number of components
+             random_state: Random seed
+
+         Returns:
+             (transformed, components, mean)
+         """
+         if self.use_gpu:
+             try:
+                 gpu_matrix = self.to_gpu(matrix)
+
+                 # Center the data, then SVD the centered matrix
+                 if self.backend == 'cupy':
+                     mean = cp.mean(gpu_matrix, axis=0)
+                     centered = gpu_matrix - mean
+                     U, S, Vt = cp.linalg.svd(centered, full_matrices=False)
+                 elif self.backend == 'torch':
+                     mean = torch.mean(gpu_matrix, dim=0)
+                     centered = gpu_matrix - mean
+                     U, S, Vt = torch.linalg.svd(centered, full_matrices=False)
+                 else:
+                     raise ValueError(f"Unknown backend: {self.backend}")
+
+                 # Truncate first, then project; U * S broadcasts the same
+                 # result as U @ diag(S) without building the full diagonal
+                 U = U[:, :n_components]
+                 S = S[:n_components]
+                 Vt = Vt[:n_components, :]
+                 transformed = U * S
+
+                 # Convert back to CPU
+                 return self.to_cpu(transformed), self.to_cpu(Vt), self.to_cpu(mean)
+             except Exception as e:
+                 warnings.warn(f"GPU PCA failed: {e}. Falling back to CPU.")
+                 self.use_gpu = False
+
+         # CPU fallback using sklearn
+         from sklearn.decomposition import PCA
+         pca = PCA(n_components=n_components, random_state=random_state)
+         transformed = pca.fit_transform(matrix)
+         return transformed, pca.components_, pca.mean_
+
+     def matmul(self, a, b):
+         """Matrix multiplication on GPU or CPU."""
+         if self.use_gpu:
+             try:
+                 a_gpu = self.to_gpu(a) if isinstance(a, np.ndarray) else a
+                 b_gpu = self.to_gpu(b) if isinstance(b, np.ndarray) else b
+
+                 if self.backend == 'cupy':
+                     result = cp.matmul(a_gpu, b_gpu)
+                 elif self.backend == 'torch':
+                     result = torch.matmul(a_gpu, b_gpu)
+                 else:
+                     raise ValueError(f"Unknown backend: {self.backend}")
+
+                 return self.to_cpu(result)
+             except Exception as e:
+                 warnings.warn(f"GPU matmul failed: {e}. Falling back to CPU.")
+                 self.use_gpu = False
+
+         return np.matmul(a, b)
+
+     def sparse_matmul(self, a, b):
+         """Sparse matrix multiplication on GPU or CPU."""
+         if self.use_gpu:
+             try:
+                 # PyTorch sparse support is limited, so prefer CuPy for sparse ops
+                 if self.backend == 'cupy':
+                     a_gpu = self.sparse_to_gpu(a) if isinstance(a, sparse.spmatrix) else a
+                     b_gpu = self.to_gpu(b) if isinstance(b, np.ndarray) else b
+                     result = a_gpu @ b_gpu
+                     return self.to_cpu(result)
+                 elif self.backend == 'torch':
+                     # PyTorch: densify the sparse operand for now (MPS doesn't support
+                     # sparse well); an already-dense `a` falls through to the CPU path below
+                     if isinstance(a, sparse.spmatrix):
+                         a_dense = self.to_gpu(a.toarray())
+                         b_gpu = self.to_gpu(b) if isinstance(b, np.ndarray) else b
+                         result = torch.matmul(a_dense, b_gpu)
+                         return self.to_cpu(result)
+             except Exception as e:
+                 warnings.warn(f"GPU sparse matmul failed: {e}. Falling back to CPU.")
+                 self.use_gpu = False
+
+         if isinstance(a, sparse.spmatrix):
+             return a @ b
+         return np.matmul(a, b)
+
+     def norm(self, arr: np.ndarray, axis: Optional[int] = None, keepdims: bool = False) -> np.ndarray:
+         """Compute L2 norm on GPU or CPU."""
+         if self.use_gpu:
+             try:
+                 gpu_arr = self.to_gpu(arr)
+
+                 if self.backend == 'cupy':
+                     result = cp.linalg.norm(gpu_arr, axis=axis, keepdims=keepdims)
+                 elif self.backend == 'torch':
+                     result = torch.linalg.norm(gpu_arr, dim=axis, keepdim=keepdims)
+                 else:
+                     raise ValueError(f"Unknown backend: {self.backend}")
+
+                 return self.to_cpu(result)
+             except Exception as e:
+                 warnings.warn(f"GPU norm failed: {e}. Falling back to CPU.")
+                 self.use_gpu = False
+
+         return np.linalg.norm(arr, axis=axis, keepdims=keepdims)
+
+     def sum(self, arr, axis: Optional[int] = None, keepdims: bool = False):
+         """Sum array on GPU or CPU."""
+         if self.use_gpu:
+             try:
+                 gpu_arr = self.to_gpu(arr) if isinstance(arr, np.ndarray) else arr
+
+                 if self.backend == 'cupy':
+                     result = cp.sum(gpu_arr, axis=axis, keepdims=keepdims)
+                 elif self.backend == 'torch':
+                     result = torch.sum(gpu_arr, dim=axis, keepdim=keepdims)
+                 else:
+                     raise ValueError(f"Unknown backend: {self.backend}")
+
+                 # to_cpu already type-checks its input, so this is safe even when cp is None
+                 return self.to_cpu(result)
+             except Exception as e:
+                 warnings.warn(f"GPU sum failed: {e}. Falling back to CPU.")
+                 self.use_gpu = False
+
+         return np.sum(arr, axis=axis, keepdims=keepdims)
+
+     def maximum(self, a, b):
+         """Element-wise maximum on GPU or CPU."""
+         if self.use_gpu:
+             try:
+                 a_gpu = self.to_gpu(a) if isinstance(a, np.ndarray) else a
+                 b_gpu = self.to_gpu(b) if isinstance(b, np.ndarray) else b
+
+                 if self.backend == 'cupy':
+                     result = cp.maximum(a_gpu, b_gpu)
+                 elif self.backend == 'torch':
+                     result = torch.maximum(a_gpu, b_gpu)
+                 else:
+                     raise ValueError(f"Unknown backend: {self.backend}")
+
+                 return self.to_cpu(result)
+             except Exception as e:
+                 warnings.warn(f"GPU maximum failed: {e}. Falling back to CPU.")
+                 self.use_gpu = False
+
+         return np.maximum(a, b)
+
+     def __enter__(self):
+         """Context manager entry."""
+         return self
+
+     def __exit__(self, exc_type, exc_val, exc_tb):
+         """Context manager exit - cleanup GPU memory."""
+         if self.use_gpu:
+             try:
+                 if self.backend == 'cupy':
+                     cp.get_default_memory_pool().free_all_blocks()
+                 elif self.backend == 'torch':
+                     # torch.mps.empty_cache() only exists in newer PyTorch builds
+                     if self.device_type == 'mps' and hasattr(torch, 'mps'):
+                         torch.mps.empty_cache()
+                     elif self.device_type == 'cuda':
+                         torch.cuda.empty_cache()
+             except Exception:
+                 pass
+         return False
+
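Read as a whole, gpu_utils.py picks a backend once in GPUAccelerator.__init__ (CuPy/CUDA on non-Mac machines, then PyTorch/MPS on Macs, then PyTorch/CUDA) and every operation degrades to NumPy/SciPy/scikit-learn when a GPU step fails. A minimal usage sketch follows; the import path mirrors the file location above, but the call site itself is hypothetical and not part of the published package:

    import numpy as np
    from tricoder.gpu_utils import GPUAccelerator, diagnose_gpu_support

    # Report which GPU backends this machine offers
    print(diagnose_gpu_support()['gpu_backends'])

    # The context-manager form frees the GPU memory pool on exit
    with GPUAccelerator(use_gpu=True) as acc:
        X = np.random.rand(1000, 300).astype(np.float32)  # float32 suits MPS
        U, S, Vt = acc.svd(X, n_components=50)
        # Both GPU and CPU paths return (U, S, Vt) with U @ diag(S) @ Vt ~ X
        rel_err = np.linalg.norm(X - (U * S) @ Vt) / np.linalg.norm(X)
        print(f"relative reconstruction error: {rel_err:.4f}")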