explainiverse-0.6.0-py3-none-any.whl → explainiverse-0.7.1-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- explainiverse/__init__.py +1 -1
- explainiverse/adapters/pytorch_adapter.py +88 -25
- explainiverse/core/explanation.py +165 -10
- explainiverse/core/registry.py +18 -0
- explainiverse/engine/suite.py +187 -78
- explainiverse/evaluation/metrics.py +189 -108
- explainiverse/explainers/attribution/lime_wrapper.py +90 -7
- explainiverse/explainers/attribution/shap_wrapper.py +104 -8
- explainiverse/explainers/gradient/__init__.py +12 -0
- explainiverse/explainers/gradient/integrated_gradients.py +189 -76
- explainiverse/explainers/gradient/tcav.py +865 -0
- {explainiverse-0.6.0.dist-info → explainiverse-0.7.1.dist-info}/METADATA +60 -9
- {explainiverse-0.6.0.dist-info → explainiverse-0.7.1.dist-info}/RECORD +15 -14
- {explainiverse-0.6.0.dist-info → explainiverse-0.7.1.dist-info}/LICENSE +0 -0
- {explainiverse-0.6.0.dist-info → explainiverse-0.7.1.dist-info}/WHEEL +0 -0
explainiverse/engine/suite.py
CHANGED
@@ -1,120 +1,194 @@
 # src/explainiverse/engine/suite.py
+"""
+ExplanationSuite - Multi-explainer comparison and evaluation.
+
+Provides utilities for running multiple explainers on the same instances
+and comparing their outputs.
+"""
+
+from typing import Dict, List, Optional, Any, Tuple
+import numpy as np

-from explainiverse.core.explanation import Explanation
-from explainiverse.explainers.attribution.lime_wrapper import LimeExplainer
-from explainiverse.explainers.attribution.shap_wrapper import ShapExplainer
-from explainiverse.evaluation.metrics import compute_roar
-from sklearn.metrics import accuracy_score
-from sklearn.linear_model import LogisticRegression

 class ExplanationSuite:
     """
-
+    Run and compare multiple explainers on the same instances.
+
+    This class provides a unified interface for:
+    - Running multiple explainers on a single instance
+    - Comparing attribution scores side-by-side
+    - Suggesting the best explainer based on model/task characteristics
+    - Evaluating explainers using ROAR (Remove And Retrain)
+
+    Example:
+        >>> from explainiverse import ExplanationSuite, SklearnAdapter
+        >>> suite = ExplanationSuite(
+        ...     model=adapter,
+        ...     explainer_configs=[
+        ...         ("lime", {"training_data": X_train, "feature_names": fnames, "class_names": cnames}),
+        ...         ("shap", {"background_data": X_train[:50], "feature_names": fnames, "class_names": cnames}),
+        ...     ]
+        ... )
+        >>> results = suite.run(X_test[0])
+        >>> suite.compare()
     """

-    def __init__(
+    def __init__(
+        self,
+        model,
+        explainer_configs: List[Tuple[str, Dict[str, Any]]],
+        data_meta: Optional[Dict[str, Any]] = None
+    ):
         """
+        Initialize the ExplanationSuite.
+
         Args:
-            model:
-            explainer_configs:
-
+            model: A model adapter (e.g., SklearnAdapter, PyTorchAdapter)
+            explainer_configs: List of (explainer_name, kwargs) tuples.
+                The explainer_name should match a registered explainer in
+                the default_registry (e.g., "lime", "shap", "treeshap").
+            data_meta: Optional metadata about the task, scope, or preference.
+                Can include "task" ("classification" or "regression").
         """
         self.model = model
         self.configs = explainer_configs
         self.data_meta = data_meta or {}
-        self.explanations = {}
+        self.explanations: Dict[str, Any] = {}
+        self._registry = None
+
+    def _get_registry(self):
+        """Lazy load the registry to avoid circular imports."""
+        if self._registry is None:
+            from explainiverse.core.registry import default_registry
+            self._registry = default_registry
+        return self._registry

-    def run(self, instance):
+    def run(self, instance: np.ndarray) -> Dict[str, Any]:
         """
         Run all configured explainers on a single instance.
+
+        Args:
+            instance: Input instance to explain (1D numpy array)
+
+        Returns:
+            Dictionary mapping explainer names to Explanation objects
         """
+        instance = np.asarray(instance)
+        registry = self._get_registry()
+
         for name, params in self.configs:
-
-
-
+            try:
+                explainer = registry.create(name, model=self.model, **params)
+                explanation = explainer.explain(instance)
+                self.explanations[name] = explanation
+            except Exception as e:
+                print(f"[ExplanationSuite] Warning: Failed to run {name}: {e}")
+                continue
+
         return self.explanations

-    def compare(self):
+    def compare(self) -> None:
         """
-        Print attribution scores side-by-side.
+        Print attribution scores side-by-side for comparison.
         """
-
+        if not self.explanations:
+            print("No explanations to compare. Run suite.run(instance) first.")
+            return
+
+        # Collect all feature names across explanations
+        all_keys = set()
         for explanation in self.explanations.values():
-
+            attrs = explanation.explanation_data.get("feature_attributions", {})
+            all_keys.update(attrs.keys())

         print("\nSide-by-Side Comparison:")
-
-
+        print("-" * 60)
+
+        # Header
+        header = ["Feature"] + list(self.explanations.keys())
+        print(" | ".join(f"{h:>15}" for h in header))
+        print("-" * 60)
+
+        # Rows
+        for key in sorted(all_keys):
+            row = [f"{key:>15}"]
             for name in self.explanations:
-                value = self.explanations[name].explanation_data.get(
-
+                value = self.explanations[name].explanation_data.get(
+                    "feature_attributions", {}
+                ).get(key, None)
+                if value is not None:
+                    row.append(f"{value:>15.4f}")
+                else:
+                    row.append(f"{'—':>15}")
             print(" | ".join(row))

-    def suggest_best(self):
+    def suggest_best(self) -> str:
         """
-        Suggest the best explainer based on model type
+        Suggest the best explainer based on model type and task characteristics.
+
+        Returns:
+            Name of the suggested explainer
         """
-
-
-        else:
-            task = "unknown"
-
-        model = self.model.model
+        task = self.data_meta.get("task", "unknown")
+        model = self.model.model if hasattr(self.model, 'model') else self.model

         # 1. Regression: SHAP preferred due to consistent output
         if task == "regression":
             return "shap"

-        # 2. Model with
+        # 2. Model with predict_proba → SHAP handles probabilistic outputs well
         if hasattr(model, "predict_proba"):
             try:
-
-                if
-
-
-
+                # Check output dimensions
+                if hasattr(model, 'n_features_in_'):
+                    test_input = np.zeros((1, model.n_features_in_))
+                    output = self.model.predict(test_input)
+                    if output.shape[1] > 2:
+                        return "shap"  # Multi-class, SHAP more stable
+                    else:
+                        return "lime"  # Binary, both are okay
             except Exception:
                 return "shap"

-        # 3. Tree-based models → prefer
-
-
+        # 3. Tree-based models → prefer TreeSHAP
+        model_type_str = str(type(model)).lower()
+        if any(tree_type in model_type_str for tree_type in ['tree', 'forest', 'xgb', 'lgbm', 'catboost']):
+            return "treeshap"

-        # 4.
-
-
-    def _load_explainer(self, name, **kwargs):
-        if name == "lime":
-            return LimeExplainer(model=self.model, **kwargs)
-        elif name == "shap":
-            return ShapExplainer(model=self.model, **kwargs)
-        else:
-            raise ValueError(f"Unknown explainer: {name}")
-
+        # 4. Neural networks → prefer gradient methods
+        if 'torch' in model_type_str or 'keras' in model_type_str or 'tensorflow' in model_type_str:
+            return "integrated_gradients"

+        # 5. Default fallback
+        return "lime"

     def evaluate_roar(
         self,
-        X_train,
-        y_train,
-        X_test,
-        y_test,
+        X_train: np.ndarray,
+        y_train: np.ndarray,
+        X_test: np.ndarray,
+        y_test: np.ndarray,
         top_k: int = 2,
         model_class=None,
-        model_kwargs:
-    ):
+        model_kwargs: Optional[Dict] = None
+    ) -> Dict[str, float]:
         """
         Evaluate each explainer using ROAR (Remove And Retrain).

+        ROAR measures explanation quality by retraining the model after
+        removing the top-k important features identified by each explainer.
+        A larger accuracy drop indicates more faithful explanations.
+
         Args:
-            X_train, y_train:
-            X_test, y_test:
-            top_k:
-            model_class:
-
+            X_train, y_train: Training data
+            X_test, y_test: Test data
+            top_k: Number of features to mask
+            model_class: Model constructor with .fit() and .predict()
+                If None, uses the same type as self.model.model
+            model_kwargs: Optional keyword args for new model instance

         Returns:
-            Dict
+            Dict mapping explainer names to accuracy drops
         """
         from explainiverse.evaluation.metrics import compute_roar

@@ -122,22 +196,57 @@ class ExplanationSuite:

         # Default to type(self.model.model) if not provided
         if model_class is None:
-
+            raw_model = self.model.model if hasattr(self.model, 'model') else self.model
+            model_class = type(raw_model)

         roar_scores = {}

         for name, explanation in self.explanations.items():
             print(f"[ROAR] Evaluating explainer: {name}")
-
-
-
-
-
-
-
-
-
-
-
-
-
+            try:
+                roar = compute_roar(
+                    model_class=model_class,
+                    X_train=X_train,
+                    y_train=y_train,
+                    X_test=X_test,
+                    y_test=y_test,
+                    explanations=[explanation],
+                    top_k=top_k,
+                    model_kwargs=model_kwargs
+                )
+                roar_scores[name] = roar
+            except Exception as e:
+                print(f"[ROAR] Failed for {name}: {e}")
+                roar_scores[name] = 0.0
+
+        return roar_scores
+
+    def get_explanation(self, name: str):
+        """
+        Get a specific explanation by explainer name.
+
+        Args:
+            name: Name of the explainer
+
+        Returns:
+            Explanation object or None if not found
+        """
+        return self.explanations.get(name)
+
+    def list_explainers(self) -> List[str]:
+        """
+        List all configured explainer names.
+
+        Returns:
+            List of explainer names
+        """
+        return [name for name, _ in self.configs]
+
+    def list_completed(self) -> List[str]:
+        """
+        List explainers that have been run successfully.
+
+        Returns:
+            List of explainer names with results
+        """
+        return list(self.explanations.keys())