featrixsphere 0.2.5563__py3-none-any.whl → 0.2.5978__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,584 @@
+ """
+ FeatrixNotebookHelper for Jupyter notebook visualization.
+
+ Provides visualization methods for training metrics, embedding spaces,
+ and model analysis in Jupyter notebooks.
+ """
+
+ import logging
+ from typing import Dict, Any, Optional, List, Union, Tuple, TYPE_CHECKING
+
+ if TYPE_CHECKING:
+     from .foundational_model import FoundationalModel
+     from .predictor import Predictor
+     from .http_client import ClientContext
+     import matplotlib
+     import plotly
+     import numpy as np
+
+ logger = logging.getLogger(__name__)
+
+
+ class FeatrixNotebookHelper:
+     """
+     Helper class for Jupyter notebook visualization.
+
+     Access via featrix.get_notebook() - no separate import needed!
+
+     Usage:
+         notebook = featrix.get_notebook()
+
+         # Visualize training
+         fig = notebook.training_loss(fm, style='notebook')
+         fig.show()
+
+         # 3D embedding space
+         fig = notebook.embedding_space_3d(fm, interactive=True)
+         fig.show()
+
+         # Training movie
+         movie = notebook.training_movie(fm, notebook_mode=True)
+     """
+
+     def __init__(self, ctx: Optional['ClientContext'] = None):
+         """Initialize notebook helper with client context."""
+         self._ctx = ctx
+
+     def training_loss(
+         self,
+         model: Union['FoundationalModel', 'Predictor'],
+         style: str = 'notebook',
+         show_learning_rate: bool = True,
+         smooth: bool = True,
+         figsize: Tuple[int, int] = (12, 6)
+     ) -> Any:
+         """
+         Plot training loss curves.
+
+         Args:
+             model: FoundationalModel or Predictor to visualize
+             style: Plot style ('notebook', 'paper', 'presentation')
+             show_learning_rate: Show learning rate on secondary axis
+             smooth: Apply smoothing to loss curves
+             figsize: Figure size (width, height)
+
+         Returns:
+             matplotlib Figure
+
+         Example:
+             fig = notebook.training_loss(fm, style='notebook')
+             fig.show()
+         """
+         try:
+             import matplotlib.pyplot as plt
+             import numpy as np
+         except ImportError:
+             raise ImportError("matplotlib is required for training_loss visualization")
+
+         # Get training metrics
+         metrics = model.get_training_metrics() if hasattr(model, 'get_training_metrics') else model.get_metrics()
+
+         # Apply style
+         if style == 'notebook':
+             plt.style.use('seaborn-v0_8-whitegrid')
+         elif style == 'paper':
+             plt.style.use('seaborn-v0_8-paper')
+         elif style == 'presentation':
+             plt.style.use('seaborn-v0_8-talk')
+
+         fig, ax1 = plt.subplots(figsize=figsize)
+
+         # Get loss history
+         loss_history = metrics.get('loss_history', metrics.get('training_loss', []))
+         epochs = list(range(1, len(loss_history) + 1))
+
+         # Apply smoothing if requested
+         if smooth and len(loss_history) > 10:
+             window = min(10, len(loss_history) // 5)
+             loss_smoothed = np.convolve(loss_history, np.ones(window)/window, mode='valid')
+             epochs_smoothed = epochs[window-1:]
+             ax1.plot(epochs, loss_history, alpha=0.3, color='blue', label='Loss (raw)')
+             ax1.plot(epochs_smoothed, loss_smoothed, color='blue', linewidth=2, label='Loss (smoothed)')
+         else:
+             ax1.plot(epochs, loss_history, color='blue', linewidth=2, label='Loss')
+
+         ax1.set_xlabel('Epoch')
+         ax1.set_ylabel('Loss', color='blue')
+         ax1.tick_params(axis='y', labelcolor='blue')
+
+         # Show learning rate if available and requested
+         if show_learning_rate:
+             lr_history = metrics.get('lr_history', metrics.get('learning_rate', []))
+             if lr_history:
+                 ax2 = ax1.twinx()
+                 ax2.plot(epochs[:len(lr_history)], lr_history, color='red', linestyle='--', label='Learning Rate')
+                 ax2.set_ylabel('Learning Rate', color='red')
+                 ax2.tick_params(axis='y', labelcolor='red')
+                 ax2.set_yscale('log')
+
+         # Title
+         model_type = 'FM' if hasattr(model, 'dimensions') else 'Predictor'
+         model_id = getattr(model, 'id', 'unknown')[:8]
+         ax1.set_title(f'{model_type} Training Loss ({model_id}...)')
+
+         fig.tight_layout()
+         return fig
+
+     def embedding_space_3d(
+         self,
+         fm: 'FoundationalModel',
+         sample_size: int = 2000,
+         interactive: bool = True,
+         color_by: Optional[str] = None,
+         figsize: Tuple[int, int] = (800, 600)
+     ) -> Any:
+         """
+         Create 3D visualization of embedding space.
+
+         Args:
+             fm: FoundationalModel to visualize
+             sample_size: Number of points to sample
+             interactive: Use interactive plotly (True) or static matplotlib (False)
+             color_by: Column name to color points by
+             figsize: Figure size (width, height) for plotly
+
+         Returns:
+             plotly Figure (if interactive=True) or matplotlib Figure
+
+         Example:
+             fig = notebook.embedding_space_3d(fm, interactive=True)
+             fig.show()
+         """
+         # Get projections from server
+         projections = fm.get_projections()
+
+         points_3d = projections.get('3d', projections.get('pca_3d', []))
+         labels = projections.get('labels', [])
+         colors = projections.get('colors', projections.get(color_by, []))
+
+         if not points_3d:
+             raise ValueError("No 3D projection data available")
+
+         if interactive:
+             try:
+                 import plotly.graph_objects as go
+             except ImportError:
+                 raise ImportError("plotly is required for interactive 3D visualization")
+
+             x = [p[0] for p in points_3d[:sample_size]]
+             y = [p[1] for p in points_3d[:sample_size]]
+             z = [p[2] for p in points_3d[:sample_size]]
+
+             trace = go.Scatter3d(
+                 x=x, y=y, z=z,
+                 mode='markers',
+                 marker=dict(
+                     size=3,
+                     color=colors[:sample_size] if colors else None,
+                     colorscale='Viridis',
+                     opacity=0.8
+                 ),
+                 text=labels[:sample_size] if labels else None,
+                 hovertemplate='%{text}<br>(%{x:.2f}, %{y:.2f}, %{z:.2f})<extra></extra>'
+             )
+
+             fig = go.Figure(data=[trace])
+             fig.update_layout(
+                 title=f"Embedding Space 3D ({fm.id[:8]}...)",
+                 width=figsize[0],
+                 height=figsize[1],
+                 scene=dict(
+                     xaxis_title='PC1',
+                     yaxis_title='PC2',
+                     zaxis_title='PC3',
+                 )
+             )
+             return fig
+
+         else:
+             try:
+                 import matplotlib.pyplot as plt
+                 from mpl_toolkits.mplot3d import Axes3D
+             except ImportError:
+                 raise ImportError("matplotlib is required for static 3D visualization")
+
+             fig = plt.figure(figsize=(figsize[0]/100, figsize[1]/100))
+             ax = fig.add_subplot(111, projection='3d')
+
+             x = [p[0] for p in points_3d[:sample_size]]
+             y = [p[1] for p in points_3d[:sample_size]]
+             z = [p[2] for p in points_3d[:sample_size]]
+
+             scatter = ax.scatter(x, y, z, c=colors[:sample_size] if colors else None,
+                                  cmap='viridis', alpha=0.6, s=10)
+
+             ax.set_xlabel('PC1')
+             ax.set_ylabel('PC2')
+             ax.set_zlabel('PC3')
+             ax.set_title(f"Embedding Space 3D ({fm.id[:8]}...)")
+
+             if colors:
+                 plt.colorbar(scatter)
+
+             return fig
+
+     def training_movie(
+         self,
+         model: Union['FoundationalModel', 'Predictor'],
+         notebook_mode: bool = True,
+         fps: int = 2,
+         figsize: Tuple[int, int] = (10, 6)
+     ) -> Any:
+         """
+         Create animated training movie.
+
+         Shows how the model evolves during training, visualizing
+         loss curves and optionally embedding space evolution.
+
+         Args:
+             model: FoundationalModel or Predictor to visualize
+             notebook_mode: True for inline Jupyter display, False for animation
+             fps: Frames per second
+             figsize: Figure size
+
+         Returns:
+             IPython.display.HTML animation (if notebook_mode) or matplotlib FuncAnimation
+
+         Example:
+             movie = notebook.training_movie(fm, notebook_mode=True)
+             # Animation displays automatically in Jupyter
+         """
+         try:
+             import matplotlib.pyplot as plt
+             import matplotlib.animation as animation
+             import numpy as np
+         except ImportError:
+             raise ImportError("matplotlib is required for training_movie")
+
+         # Get training metrics
+         metrics = model.get_training_metrics() if hasattr(model, 'get_training_metrics') else model.get_metrics()
+         loss_history = metrics.get('loss_history', metrics.get('training_loss', []))
+
+         if not loss_history:
+             raise ValueError("No training history available")
+
+         fig, ax = plt.subplots(figsize=figsize)
+         ax.set_xlim(0, len(loss_history))
+         ax.set_ylim(0, max(loss_history) * 1.1)
+         ax.set_xlabel('Epoch')
+         ax.set_ylabel('Loss')
+         ax.set_title('Training Progress')
+
+         line, = ax.plot([], [], 'b-', linewidth=2)
+         epoch_text = ax.text(0.02, 0.95, '', transform=ax.transAxes,
+                              fontsize=12, verticalalignment='top')
+
+         def init():
+             line.set_data([], [])
+             epoch_text.set_text('')
+             return line, epoch_text
+
+         def animate(frame):
+             x = list(range(frame + 1))
+             y = loss_history[:frame + 1]
+             line.set_data(x, y)
+             epoch_text.set_text(f'Epoch: {frame + 1}/{len(loss_history)}')
+             return line, epoch_text
+
+         anim = animation.FuncAnimation(
+             fig, animate, init_func=init,
+             frames=len(loss_history), interval=1000//fps,
+             blit=True, repeat=False
+         )
+
+         if notebook_mode:
+             try:
+                 from IPython.display import HTML
+                 plt.close(fig)  # Prevent static display
+                 return HTML(anim.to_jshtml())
+             except ImportError:
+                 return anim
+         else:
+             return anim
+
+     def embedding_evolution(
+         self,
+         fm: 'FoundationalModel',
+         epoch_range: Optional[Tuple[int, int]] = None,
+         interactive: bool = True,
+         sample_size: int = 500
+     ) -> Any:
+         """
+         Visualize embedding evolution over epochs.
+
+         Shows how the embedding space changes during training.
+
+         Args:
+             fm: FoundationalModel to visualize
+             epoch_range: Tuple of (start_epoch, end_epoch) or None for all
+             interactive: Use interactive plotly
+             sample_size: Number of points to sample
+
+         Returns:
+             plotly Figure (if interactive) or matplotlib Figure
+
+         Example:
+             fig = notebook.embedding_evolution(fm, epoch_range=(1, 50))
+             fig.show()
+         """
+         # This requires epoch-by-epoch projection data which may not be available
+         # Return a placeholder for now
+         try:
+             import plotly.graph_objects as go
+         except ImportError:
+             raise ImportError("plotly is required for embedding_evolution")
+
+         # Try to get evolution data
+         try:
+             metrics = fm.get_training_metrics()
+             evolution = metrics.get('embedding_evolution', [])
+         except Exception:
+             evolution = []
+
+         if not evolution:
+             # Create placeholder figure
+             fig = go.Figure()
+             fig.add_annotation(
+                 text="Embedding evolution data not available",
+                 xref="paper", yref="paper",
+                 x=0.5, y=0.5, showarrow=False,
+                 font=dict(size=16)
+             )
+             fig.update_layout(
+                 title="Embedding Evolution (data not available)",
+                 width=800, height=600
+             )
+             return fig
+
+         # If data is available, create animation
+         frames = []
+         for epoch_data in evolution:
+             epoch = epoch_data.get('epoch', 0)
+             points = epoch_data.get('points', [])[:sample_size]
+
+             frame = go.Frame(
+                 data=[go.Scatter(
+                     x=[p[0] for p in points],
+                     y=[p[1] for p in points],
+                     mode='markers',
+                     marker=dict(size=5, opacity=0.6)
+                 )],
+                 name=str(epoch)
+             )
+             frames.append(frame)
+
+         fig = go.Figure(
+             data=frames[0].data if frames else [],
+             frames=frames,
+             layout=go.Layout(
+                 title="Embedding Evolution",
+                 updatemenus=[{
+                     "type": "buttons",
+                     "buttons": [
+                         {"label": "Play", "method": "animate", "args": [None, {"frame": {"duration": 500}}]},
+                         {"label": "Pause", "method": "animate", "args": [[None], {"mode": "immediate"}]}
+                     ]
+                 }],
+                 sliders=[{
+                     "steps": [{"args": [[str(e['epoch'])], {"frame": {"duration": 0}}], "label": str(e['epoch'])}
+                               for e in evolution],
+                     "currentvalue": {"prefix": "Epoch: "}
+                 }]
+             )
+         )
+
+         return fig
+
+     def training_comparison(
+         self,
+         models: List[Union['FoundationalModel', 'Predictor']],
+         labels: Optional[List[str]] = None,
+         figsize: Tuple[int, int] = (12, 6)
+     ) -> Any:
+         """
+         Compare training across multiple models.
+
+         Args:
+             models: List of models to compare
+             labels: Optional labels for each model
+             figsize: Figure size
+
+         Returns:
+             matplotlib Figure
+
+         Example:
+             fig = notebook.training_comparison([fm1, fm2], labels=['v1', 'v2'])
+             fig.show()
+         """
+         try:
+             import matplotlib.pyplot as plt
+             import numpy as np
+         except ImportError:
+             raise ImportError("matplotlib is required for training_comparison")
+
+         fig, ax = plt.subplots(figsize=figsize)
+
+         colors = plt.cm.tab10(np.linspace(0, 1, len(models)))
+
+         for i, model in enumerate(models):
+             metrics = model.get_training_metrics() if hasattr(model, 'get_training_metrics') else model.get_metrics()
+             loss_history = metrics.get('loss_history', metrics.get('training_loss', []))
+
+             label = labels[i] if labels and i < len(labels) else f"Model {i+1}"
+             ax.plot(loss_history, color=colors[i], linewidth=2, label=label)
+
+         ax.set_xlabel('Epoch')
+         ax.set_ylabel('Loss')
+         ax.set_title('Training Comparison')
+         ax.legend()
+         ax.grid(True, alpha=0.3)
+
+         fig.tight_layout()
+         return fig
+
+     def embedding_space_training(
+         self,
+         fm: 'FoundationalModel',
+         style: str = 'notebook',
+         figsize: Tuple[int, int] = (14, 6)
+     ) -> Any:
+         """
+         Plot embedding space training metrics.
+
+         Shows detailed metrics specific to foundational model training.
+
+         Args:
+             fm: FoundationalModel to visualize
+             style: Plot style
+             figsize: Figure size
+
+         Returns:
+             matplotlib Figure
+         """
+         try:
+             import matplotlib.pyplot as plt
+             import numpy as np
+         except ImportError:
+             raise ImportError("matplotlib is required")
+
+         metrics = fm.get_training_metrics()
+
+         fig, axes = plt.subplots(1, 3, figsize=figsize)
+
+         # Loss curve
+         loss = metrics.get('loss_history', [])
+         if loss:
+             axes[0].plot(loss, 'b-', linewidth=2)
+             axes[0].set_title('Training Loss')
+             axes[0].set_xlabel('Epoch')
+             axes[0].set_ylabel('Loss')
+             axes[0].grid(True, alpha=0.3)
+
+         # Learning rate
+         lr = metrics.get('lr_history', [])
+         if lr:
+             axes[1].semilogy(lr, 'r-', linewidth=2)
+             axes[1].set_title('Learning Rate')
+             axes[1].set_xlabel('Epoch')
+             axes[1].set_ylabel('LR')
+             axes[1].grid(True, alpha=0.3)
+
+         # Gradient norm if available
+         grad_norm = metrics.get('grad_norm_history', [])
+         if grad_norm:
+             axes[2].plot(grad_norm, 'g-', linewidth=2)
+             axes[2].set_title('Gradient Norm')
+             axes[2].set_xlabel('Epoch')
+             axes[2].set_ylabel('Norm')
+             axes[2].grid(True, alpha=0.3)
+         else:
+             axes[2].text(0.5, 0.5, 'No gradient data', ha='center', va='center')
+             axes[2].set_title('Gradient Norm')
+
+         fig.suptitle(f'Embedding Space Training ({fm.id[:8]}...)', fontsize=14)
+         fig.tight_layout()
+         return fig
+
+     def single_predictor_training(
+         self,
+         predictor: 'Predictor',
+         style: str = 'notebook',
+         figsize: Tuple[int, int] = (14, 6)
+     ) -> Any:
+         """
+         Plot single predictor training metrics.
+
+         Shows detailed metrics specific to predictor training including
+         accuracy, AUC, and confusion matrix evolution.
+
+         Args:
+             predictor: Predictor to visualize
+             style: Plot style
+             figsize: Figure size
+
+         Returns:
+             matplotlib Figure
+         """
+         try:
+             import matplotlib.pyplot as plt
+             import numpy as np
+         except ImportError:
+             raise ImportError("matplotlib is required")
+
+         metrics = predictor.get_metrics()
+
+         fig, axes = plt.subplots(1, 3, figsize=figsize)
+
+         # Loss curve
+         loss = metrics.get('loss_history', metrics.get('single_predictor', {}).get('loss_history', []))
+         if loss:
+             axes[0].plot(loss, 'b-', linewidth=2)
+             axes[0].set_title('Training Loss')
+             axes[0].set_xlabel('Epoch')
+             axes[0].set_ylabel('Loss')
+             axes[0].grid(True, alpha=0.3)
+
+         # Accuracy
+         accuracy = metrics.get('accuracy_history', metrics.get('single_predictor', {}).get('accuracy_history', []))
+         if accuracy:
+             axes[1].plot(accuracy, 'g-', linewidth=2)
+             axes[1].set_title('Accuracy')
+             axes[1].set_xlabel('Epoch')
+             axes[1].set_ylabel('Accuracy')
+             axes[1].set_ylim(0, 1)
+             axes[1].grid(True, alpha=0.3)
+         else:
+             final_acc = metrics.get('single_predictor', {}).get('accuracy', predictor.accuracy)
+             if final_acc:
+                 axes[1].axhline(y=final_acc, color='g', linewidth=2)
+                 axes[1].set_title(f'Final Accuracy: {final_acc:.4f}')
+             else:
+                 axes[1].text(0.5, 0.5, 'No accuracy data', ha='center', va='center')
+                 axes[1].set_title('Accuracy')
+
+         # AUC
+         auc_history = metrics.get('auc_history', metrics.get('single_predictor', {}).get('auc_history', []))
+         if auc_history:
+             axes[2].plot(auc_history, 'r-', linewidth=2)
+             axes[2].set_title('AUC')
+             axes[2].set_xlabel('Epoch')
+             axes[2].set_ylabel('AUC')
+             axes[2].set_ylim(0, 1)
+             axes[2].grid(True, alpha=0.3)
+         else:
+             final_auc = metrics.get('single_predictor', {}).get('roc_auc', predictor.auc)
+             if final_auc:
+                 axes[2].axhline(y=final_auc, color='r', linewidth=2)
+                 axes[2].set_title(f'Final AUC: {final_auc:.4f}')
+             else:
+                 axes[2].text(0.5, 0.5, 'No AUC data', ha='center', va='center')
+                 axes[2].set_title('AUC')
+
+         fig.suptitle(f'Predictor Training ({predictor.target_column})', fontsize=14)
+         fig.tight_layout()
+         return fig
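
For orientation, a minimal usage sketch of the new helper in a Jupyter cell, based only on the docstrings above. It assumes an initialized featrix client exposing get_notebook() plus already-trained fm (FoundationalModel) and predictor (Predictor) handles; the variable names are illustrative placeholders and the snippet is not part of the packaged file.

    # Minimal usage sketch (illustrative; not part of this package diff).
    # Assumes `featrix` is an initialized client exposing get_notebook(), and that
    # `fm` (FoundationalModel) and `predictor` (Predictor) are trained model handles.
    notebook = featrix.get_notebook()

    # Loss curve with smoothing and a learning-rate overlay (matplotlib Figure).
    fig = notebook.training_loss(fm, style='notebook', show_learning_rate=True)
    fig.show()

    # Interactive 3D projection of the embedding space (plotly Figure); raises
    # ValueError if the server returns no 3D projection data.
    fig3d = notebook.embedding_space_3d(fm, sample_size=1000, interactive=True)
    fig3d.show()

    # Compare loss curves across runs on one matplotlib axis.
    cmp_fig = notebook.training_comparison([fm, predictor], labels=['fm', 'predictor'])

    # Animated loss curve; with notebook_mode=True this returns IPython HTML and
    # renders inline when left as the last expression in a Jupyter cell.
    notebook.training_movie(fm, notebook_mode=True, fps=4)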