wisent 0.1.1__py3-none-any.whl → 0.5.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of wisent might be problematic.

Files changed (237)
  1. wisent/__init__.py +1 -8
  2. wisent/benchmarks/__init__.py +0 -0
  3. wisent/benchmarks/coding/__init__.py +0 -0
  4. wisent/benchmarks/coding/metrics/__init__.py +0 -0
  5. wisent/benchmarks/coding/metrics/core/__init__.py +0 -0
  6. wisent/benchmarks/coding/metrics/core/atoms.py +36 -0
  7. wisent/benchmarks/coding/metrics/evaluator.py +275 -0
  8. wisent/benchmarks/coding/metrics/passk.py +66 -0
  9. wisent/benchmarks/coding/output_sanitizer/__init__.py +0 -0
  10. wisent/benchmarks/coding/output_sanitizer/core/__init__.py +0 -0
  11. wisent/benchmarks/coding/output_sanitizer/core/atoms.py +27 -0
  12. wisent/benchmarks/coding/output_sanitizer/cpp_sanitizer.py +62 -0
  13. wisent/benchmarks/coding/output_sanitizer/java_sanitizer.py +78 -0
  14. wisent/benchmarks/coding/output_sanitizer/python_sanitizer.py +94 -0
  15. wisent/benchmarks/coding/output_sanitizer/utils.py +107 -0
  16. wisent/benchmarks/coding/providers/__init__.py +18 -0
  17. wisent/benchmarks/coding/providers/core/__init__.py +0 -0
  18. wisent/benchmarks/coding/providers/core/atoms.py +31 -0
  19. wisent/benchmarks/coding/providers/livecodebench/__init__.py +0 -0
  20. wisent/benchmarks/coding/providers/livecodebench/provider.py +53 -0
  21. wisent/benchmarks/coding/safe_docker/__init__.py +0 -0
  22. wisent/benchmarks/coding/safe_docker/core/__init__.py +0 -0
  23. wisent/benchmarks/coding/safe_docker/core/atoms.py +105 -0
  24. wisent/benchmarks/coding/safe_docker/core/runtime.py +118 -0
  25. wisent/benchmarks/coding/safe_docker/entrypoint.py +123 -0
  26. wisent/benchmarks/coding/safe_docker/recipes.py +60 -0
  27. wisent/classifiers/__init__.py +0 -0
  28. wisent/classifiers/core/__init__.py +0 -0
  29. wisent/classifiers/core/atoms.py +747 -0
  30. wisent/classifiers/models/__init__.py +0 -0
  31. wisent/classifiers/models/logistic.py +29 -0
  32. wisent/classifiers/models/mlp.py +47 -0
  33. wisent/cli/__init__.py +0 -0
  34. wisent/cli/classifiers/__init__.py +0 -0
  35. wisent/cli/classifiers/classifier_rotator.py +137 -0
  36. wisent/cli/cli_logger.py +142 -0
  37. wisent/cli/data_loaders/__init__.py +0 -0
  38. wisent/cli/data_loaders/data_loader_rotator.py +96 -0
  39. wisent/cli/evaluators/__init__.py +0 -0
  40. wisent/cli/evaluators/evaluator_rotator.py +148 -0
  41. wisent/cli/steering_methods/__init__.py +0 -0
  42. wisent/cli/steering_methods/steering_rotator.py +110 -0
  43. wisent/cli/wisent_cli/__init__.py +0 -0
  44. wisent/cli/wisent_cli/commands/__init__.py +0 -0
  45. wisent/cli/wisent_cli/commands/help_cmd.py +52 -0
  46. wisent/cli/wisent_cli/commands/listing.py +154 -0
  47. wisent/cli/wisent_cli/commands/train_cmd.py +322 -0
  48. wisent/cli/wisent_cli/main.py +93 -0
  49. wisent/cli/wisent_cli/shell.py +80 -0
  50. wisent/cli/wisent_cli/ui.py +69 -0
  51. wisent/cli/wisent_cli/util/__init__.py +0 -0
  52. wisent/cli/wisent_cli/util/aggregations.py +43 -0
  53. wisent/cli/wisent_cli/util/parsing.py +126 -0
  54. wisent/cli/wisent_cli/version.py +4 -0
  55. wisent/core/__init__.py +27 -0
  56. wisent/core/activations/__init__.py +0 -0
  57. wisent/core/activations/activations_collector.py +338 -0
  58. wisent/core/activations/core/__init__.py +0 -0
  59. wisent/core/activations/core/atoms.py +216 -0
  60. wisent/core/agent/__init__.py +18 -0
  61. wisent/core/agent/budget.py +638 -0
  62. wisent/core/agent/device_benchmarks.py +685 -0
  63. wisent/core/agent/diagnose/__init__.py +55 -0
  64. wisent/core/agent/diagnose/agent_classifier_decision.py +641 -0
  65. wisent/core/agent/diagnose/classifier_marketplace.py +554 -0
  66. wisent/core/agent/diagnose/create_classifier.py +1154 -0
  67. wisent/core/agent/diagnose/response_diagnostics.py +268 -0
  68. wisent/core/agent/diagnose/select_classifiers.py +506 -0
  69. wisent/core/agent/diagnose/synthetic_classifier_option.py +754 -0
  70. wisent/core/agent/diagnose/tasks/__init__.py +33 -0
  71. wisent/core/agent/diagnose/tasks/task_manager.py +1456 -0
  72. wisent/core/agent/diagnose/tasks/task_relevance.py +94 -0
  73. wisent/core/agent/diagnose/tasks/task_selector.py +151 -0
  74. wisent/core/agent/diagnose/test_synthetic_classifier.py +71 -0
  75. wisent/core/agent/diagnose.py +242 -0
  76. wisent/core/agent/steer.py +212 -0
  77. wisent/core/agent/timeout.py +134 -0
  78. wisent/core/autonomous_agent.py +1234 -0
  79. wisent/core/bigcode_integration.py +583 -0
  80. wisent/core/contrastive_pairs/__init__.py +15 -0
  81. wisent/core/contrastive_pairs/core/__init__.py +0 -0
  82. wisent/core/contrastive_pairs/core/atoms.py +45 -0
  83. wisent/core/contrastive_pairs/core/buliders.py +59 -0
  84. wisent/core/contrastive_pairs/core/pair.py +178 -0
  85. wisent/core/contrastive_pairs/core/response.py +152 -0
  86. wisent/core/contrastive_pairs/core/serialization.py +300 -0
  87. wisent/core/contrastive_pairs/core/set.py +133 -0
  88. wisent/core/contrastive_pairs/diagnostics/__init__.py +45 -0
  89. wisent/core/contrastive_pairs/diagnostics/activations.py +53 -0
  90. wisent/core/contrastive_pairs/diagnostics/base.py +73 -0
  91. wisent/core/contrastive_pairs/diagnostics/control_vectors.py +169 -0
  92. wisent/core/contrastive_pairs/diagnostics/coverage.py +79 -0
  93. wisent/core/contrastive_pairs/diagnostics/divergence.py +98 -0
  94. wisent/core/contrastive_pairs/diagnostics/duplicates.py +116 -0
  95. wisent/core/contrastive_pairs/lm_eval_pairs/__init__.py +0 -0
  96. wisent/core/contrastive_pairs/lm_eval_pairs/atoms.py +238 -0
  97. wisent/core/contrastive_pairs/lm_eval_pairs/lm_extractor_manifest.py +8 -0
  98. wisent/core/contrastive_pairs/lm_eval_pairs/lm_extractor_registry.py +132 -0
  99. wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/__init__.py +0 -0
  100. wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/winogrande.py +115 -0
  101. wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_pairs_generation.py +50 -0
  102. wisent/core/data_loaders/__init__.py +0 -0
  103. wisent/core/data_loaders/core/__init__.py +0 -0
  104. wisent/core/data_loaders/core/atoms.py +98 -0
  105. wisent/core/data_loaders/loaders/__init__.py +0 -0
  106. wisent/core/data_loaders/loaders/custom.py +120 -0
  107. wisent/core/data_loaders/loaders/lm_loader.py +218 -0
  108. wisent/core/detection_handling.py +257 -0
  109. wisent/core/download_full_benchmarks.py +1386 -0
  110. wisent/core/evaluators/__init__.py +0 -0
  111. wisent/core/evaluators/oracles/__init__.py +0 -0
  112. wisent/core/evaluators/oracles/interactive.py +73 -0
  113. wisent/core/evaluators/oracles/nlp_evaluator.py +440 -0
  114. wisent/core/evaluators/oracles/user_specified.py +67 -0
  115. wisent/core/hyperparameter_optimizer.py +429 -0
  116. wisent/core/lm_eval_harness_ground_truth.py +1396 -0
  117. wisent/core/log_likelihoods_evaluator.py +321 -0
  118. wisent/core/managed_cached_benchmarks.py +595 -0
  119. wisent/core/mixed_benchmark_sampler.py +364 -0
  120. wisent/core/model_config_manager.py +330 -0
  121. wisent/core/model_persistence.py +317 -0
  122. wisent/core/models/__init__.py +0 -0
  123. wisent/core/models/core/__init__.py +0 -0
  124. wisent/core/models/core/atoms.py +460 -0
  125. wisent/core/models/wisent_model.py +727 -0
  126. wisent/core/multi_steering.py +316 -0
  127. wisent/core/optuna/__init__.py +57 -0
  128. wisent/core/optuna/classifier/__init__.py +25 -0
  129. wisent/core/optuna/classifier/activation_generator.py +349 -0
  130. wisent/core/optuna/classifier/classifier_cache.py +509 -0
  131. wisent/core/optuna/classifier/optuna_classifier_optimizer.py +606 -0
  132. wisent/core/optuna/steering/__init__.py +0 -0
  133. wisent/core/optuna/steering/bigcode_evaluator_wrapper.py +188 -0
  134. wisent/core/optuna/steering/data_utils.py +342 -0
  135. wisent/core/optuna/steering/metrics.py +474 -0
  136. wisent/core/optuna/steering/optuna_pipeline.py +1738 -0
  137. wisent/core/optuna/steering/steering_optimization.py +1111 -0
  138. wisent/core/parser.py +1668 -0
  139. wisent/core/prompts/__init__.py +0 -0
  140. wisent/core/prompts/core/__init__.py +0 -0
  141. wisent/core/prompts/core/atom.py +57 -0
  142. wisent/core/prompts/core/prompt_formater.py +157 -0
  143. wisent/core/prompts/prompt_stratiegies/__init__.py +0 -0
  144. wisent/core/prompts/prompt_stratiegies/direct_completion.py +24 -0
  145. wisent/core/prompts/prompt_stratiegies/instruction_following.py +24 -0
  146. wisent/core/prompts/prompt_stratiegies/multiple_choice.py +29 -0
  147. wisent/core/prompts/prompt_stratiegies/role_playing.py +31 -0
  148. wisent/core/representation.py +5 -0
  149. wisent/core/sample_size_optimizer.py +648 -0
  150. wisent/core/sample_size_optimizer_v2.py +355 -0
  151. wisent/core/save_results.py +277 -0
  152. wisent/core/steering.py +652 -0
  153. wisent/core/steering_method.py +26 -0
  154. wisent/core/steering_methods/__init__.py +0 -0
  155. wisent/core/steering_methods/core/__init__.py +0 -0
  156. wisent/core/steering_methods/core/atoms.py +153 -0
  157. wisent/core/steering_methods/methods/__init__.py +0 -0
  158. wisent/core/steering_methods/methods/caa.py +44 -0
  159. wisent/core/steering_optimizer.py +1297 -0
  160. wisent/core/task_interface.py +132 -0
  161. wisent/core/task_selector.py +189 -0
  162. wisent/core/tasks/__init__.py +175 -0
  163. wisent/core/tasks/aime_task.py +141 -0
  164. wisent/core/tasks/file_task.py +211 -0
  165. wisent/core/tasks/hle_task.py +180 -0
  166. wisent/core/tasks/hmmt_task.py +119 -0
  167. wisent/core/tasks/livecodebench_task.py +201 -0
  168. wisent/core/tasks/livemathbench_task.py +158 -0
  169. wisent/core/tasks/lm_eval_task.py +455 -0
  170. wisent/core/tasks/math500_task.py +84 -0
  171. wisent/core/tasks/polymath_task.py +146 -0
  172. wisent/core/tasks/supergpqa_task.py +220 -0
  173. wisent/core/time_estimator.py +149 -0
  174. wisent/core/timing_calibration.py +174 -0
  175. wisent/core/tracking/__init__.py +54 -0
  176. wisent/core/tracking/latency.py +618 -0
  177. wisent/core/tracking/memory.py +359 -0
  178. wisent/core/trainers/__init__.py +0 -0
  179. wisent/core/trainers/core/__init__.py +11 -0
  180. wisent/core/trainers/core/atoms.py +45 -0
  181. wisent/core/trainers/steering_trainer.py +271 -0
  182. wisent/core/user_model_config.py +158 -0
  183. wisent/opti/__init__.py +0 -0
  184. wisent/opti/core/__init__.py +0 -0
  185. wisent/opti/core/atoms.py +175 -0
  186. wisent/opti/methods/__init__.py +0 -0
  187. wisent/opti/methods/opti_classificator.py +172 -0
  188. wisent/opti/methods/opti_steering.py +138 -0
  189. wisent/synthetic/__init__.py +0 -0
  190. wisent/synthetic/cleaners/__init__.py +0 -0
  191. wisent/synthetic/cleaners/core/__init__.py +0 -0
  192. wisent/synthetic/cleaners/core/atoms.py +58 -0
  193. wisent/synthetic/cleaners/deduper_cleaner.py +53 -0
  194. wisent/synthetic/cleaners/methods/__init__.py +0 -0
  195. wisent/synthetic/cleaners/methods/base_dedupers.py +320 -0
  196. wisent/synthetic/cleaners/methods/base_refusalers.py +286 -0
  197. wisent/synthetic/cleaners/methods/core/__init__.py +0 -0
  198. wisent/synthetic/cleaners/methods/core/atoms.py +47 -0
  199. wisent/synthetic/cleaners/pairs_cleaner.py +90 -0
  200. wisent/synthetic/cleaners/refusaler_cleaner.py +133 -0
  201. wisent/synthetic/db_instructions/__init__.py +0 -0
  202. wisent/synthetic/db_instructions/core/__init__.py +0 -0
  203. wisent/synthetic/db_instructions/core/atoms.py +25 -0
  204. wisent/synthetic/db_instructions/mini_dp.py +37 -0
  205. wisent/synthetic/generators/__init__.py +0 -0
  206. wisent/synthetic/generators/core/__init__.py +0 -0
  207. wisent/synthetic/generators/core/atoms.py +73 -0
  208. wisent/synthetic/generators/diversities/__init__.py +0 -0
  209. wisent/synthetic/generators/diversities/core/__init__.py +0 -0
  210. wisent/synthetic/generators/diversities/core/core.py +68 -0
  211. wisent/synthetic/generators/diversities/methods/__init__.py +0 -0
  212. wisent/synthetic/generators/diversities/methods/fast_diversity.py +249 -0
  213. wisent/synthetic/generators/pairs_generator.py +179 -0
  214. wisent-0.5.2.dist-info/METADATA +67 -0
  215. wisent-0.5.2.dist-info/RECORD +218 -0
  216. {wisent-0.1.1.dist-info → wisent-0.5.2.dist-info}/WHEEL +1 -1
  217. {wisent-0.1.1.dist-info → wisent-0.5.2.dist-info/licenses}/LICENSE +2 -2
  218. wisent/activations/__init__.py +0 -9
  219. wisent/activations/client.py +0 -97
  220. wisent/activations/extractor.py +0 -251
  221. wisent/activations/models.py +0 -95
  222. wisent/client.py +0 -45
  223. wisent/control_vector/__init__.py +0 -9
  224. wisent/control_vector/client.py +0 -85
  225. wisent/control_vector/manager.py +0 -168
  226. wisent/control_vector/models.py +0 -70
  227. wisent/inference/__init__.py +0 -9
  228. wisent/inference/client.py +0 -103
  229. wisent/inference/inferencer.py +0 -250
  230. wisent/inference/models.py +0 -66
  231. wisent/utils/__init__.py +0 -3
  232. wisent/utils/auth.py +0 -30
  233. wisent/utils/http.py +0 -228
  234. wisent/version.py +0 -3
  235. wisent-0.1.1.dist-info/METADATA +0 -142
  236. wisent-0.1.1.dist-info/RECORD +0 -23
  237. {wisent-0.1.1.dist-info → wisent-0.5.2.dist-info}/top_level.txt +0 -0
wisent/core/sample_size_optimizer_v2.py
@@ -0,0 +1,355 @@
+"""
+Simplified Sample Size Optimizer using training-limit and testing-limit flags.
+Supports both classification and steering methods.
+"""
+
+import os
+import json
+import time
+import logging
+from typing import Dict, List, Optional, Any, Tuple
+from datetime import datetime
+import numpy as np
+import matplotlib.pyplot as plt
+
+from ..cli import run_task_pipeline
+from .model_config_manager import ModelConfigManager
+
+logger = logging.getLogger(__name__)
+
+
+class SimplifiedSampleSizeOptimizer:
+    """Simplified sample size optimizer that leverages CLI training/testing limits."""
+
+    def __init__(
+        self,
+        model_name: str,
+        task_name: str,
+        layer: int,
+        method_type: str = "classification",  # "classification" or "steering"
+        sample_sizes: Optional[List[int]] = None,
+        test_size: int = 200,
+        seed: int = 42,
+        verbose: bool = False,
+        **method_kwargs
+    ):
+        """
+        Initialize the optimizer.
+
+        Args:
+            model_name: Model to optimize
+            task_name: Task to optimize for
+            layer: Layer to use
+            method_type: "classification" or "steering"
+            sample_sizes: List of training sample sizes to test
+            test_size: Fixed test set size
+            seed: Random seed for reproducibility
+            verbose: Verbose output
+            **method_kwargs: Additional arguments for the method
+                For classification: token_aggregation, threshold, classifier_type
+                For steering: steering_method, steering_strength, token_targeting_strategy
+        """
+        self.model_name = model_name
+        self.task_name = task_name
+        self.layer = layer
+        self.method_type = method_type
+        self.sample_sizes = sample_sizes or [5, 10, 20, 50, 100, 200, 500]
+        self.test_size = test_size
+        self.seed = seed
+        self.verbose = verbose
+        self.method_kwargs = method_kwargs
+
+        # Results storage
+        self.results = {
+            "sample_sizes": [],
+            "accuracies": [],
+            "f1_scores": [],
+            "training_times": [],
+            "evaluation_times": []
+        }
+
+    def run_single_experiment(self, training_size: int) -> Dict[str, Any]:
+        """
+        Run a single experiment with a specific training size.
+
+        Args:
+            training_size: Number of training samples
+
+        Returns:
+            Dictionary with results
+        """
+        if self.verbose:
+            print(f"\n{'='*60}")
+            print(f"Testing {self.method_type} with {training_size} training samples")
+            print(f"{'='*60}")
+
+        start_time = time.time()
+
+        # Build arguments for run_task_pipeline
+        pipeline_args = {
+            "task_name": self.task_name,
+            "model_name": self.model_name,
+            "layer": str(self.layer),
+            "training_limit": training_size,
+            "testing_limit": self.test_size,
+            "seed": self.seed,
+            "verbose": self.verbose,
+            "split_ratio": 0.8,  # Standard split
+            "limit": training_size + self.test_size + 100,  # Ensure enough data
+        }
+
+        # Add method-specific arguments
+        if self.method_type == "classification":
+            pipeline_args.update({
+                "token_aggregation": self.method_kwargs.get("token_aggregation", "average"),
+                "detection_threshold": self.method_kwargs.get("threshold", 0.5),
+                "classifier_type": self.method_kwargs.get("classifier_type", "logistic"),
+                "steering_mode": False
+            })
+        else:  # steering
+            pipeline_args.update({
+                "steering_mode": True,
+                "steering_method": self.method_kwargs.get("steering_method", "CAA"),
+                "steering_strength": self.method_kwargs.get("steering_strength", 1.0),
+                "token_targeting_strategy": self.method_kwargs.get("token_targeting_strategy", "LAST_TOKEN"),
+                "token_aggregation": self.method_kwargs.get("token_aggregation", "average"),
+            })
+
+        try:
+            # Run the pipeline
+            result = run_task_pipeline(**pipeline_args)
+
+            end_time = time.time()
+            total_time = end_time - start_time
+
+            # Extract metrics based on method type
+            if self.method_type == "classification":
+                accuracy = result.get("test_accuracy", 0.0)
+                f1_score = result.get("test_f1_score", 0.0)
+            else:  # steering
+                # For steering, we look at the evaluation results
+                eval_results = result.get("evaluation_results", {})
+                accuracy = eval_results.get("accuracy", 0.0)
+                # Convert to float if it's a string percentage
+                if isinstance(accuracy, str) and accuracy.endswith('%'):
+                    accuracy = float(accuracy.rstrip('%')) / 100.0
+                f1_score = accuracy  # Use accuracy as proxy for F1 in steering
+
+            return {
+                "accuracy": accuracy,
+                "f1_score": f1_score,
+                "training_time": result.get("training_time", total_time * 0.8),
+                "evaluation_time": total_time * 0.2,
+                "total_time": total_time,
+                "success": True
+            }
+
+        except Exception as e:
+            logger.error(f"Failed to run experiment with {training_size} samples: {e}")
+            return {
+                "accuracy": 0.0,
+                "f1_score": 0.0,
+                "training_time": 0.0,
+                "evaluation_time": 0.0,
+                "total_time": 0.0,
+                "success": False,
+                "error": str(e)
+            }
+
+    def run_optimization(self) -> Dict[str, Any]:
+        """
+        Run the complete optimization process.
+
+        Returns:
+            Dictionary with optimization results
+        """
+        logger.info(f"Starting {self.method_type} sample size optimization...")
+        logger.info(f"Model: {self.model_name}, Task: {self.task_name}, Layer: {self.layer}")
+        logger.info(f"Testing sample sizes: {self.sample_sizes}")
+        logger.info(f"Fixed test size: {self.test_size}")
+
+        # Run experiments for each sample size
+        for sample_size in self.sample_sizes:
+            result = self.run_single_experiment(sample_size)
+
+            if result["success"]:
+                self.results["sample_sizes"].append(sample_size)
+                self.results["accuracies"].append(result["accuracy"])
+                self.results["f1_scores"].append(result["f1_score"])
+                self.results["training_times"].append(result["training_time"])
+                self.results["evaluation_times"].append(result["evaluation_time"])
+
+                if self.verbose:
+                    print(f"\n✓ Tested {sample_size} samples: accuracy={result['accuracy']:.3f}, f1={result['f1_score']:.3f}")
+
+        # Find optimal sample size
+        optimal_idx, optimal_size = self.find_optimal_sample_size()
+
+        return {
+            "optimal_sample_size": optimal_size,
+            "optimal_accuracy": self.results["accuracies"][optimal_idx] if optimal_idx >= 0 else None,
+            "optimal_f1_score": self.results["f1_scores"][optimal_idx] if optimal_idx >= 0 else None,
+            "all_results": self.results,
+            "method_type": self.method_type,
+            "method_kwargs": self.method_kwargs
+        }
+
+    def find_optimal_sample_size(self) -> Tuple[int, int]:
+        """
+        Find the optimal sample size based on accuracy and efficiency.
+
+        Returns:
+            Tuple of (optimal_index, optimal_sample_size)
+        """
+        if not self.results["accuracies"]:
+            return -1, 0
+
+        accuracies = np.array(self.results["accuracies"])
+        sample_sizes = np.array(self.results["sample_sizes"])
+
+        # Find the point of diminishing returns
+        # We want the smallest sample size that achieves near-optimal accuracy
+        max_accuracy = np.max(accuracies)
+        threshold = max_accuracy * 0.95  # Within 95% of best accuracy
+
+        # Find indices where accuracy is above threshold
+        good_indices = np.where(accuracies >= threshold)[0]
+
+        if len(good_indices) > 0:
+            # Choose the smallest sample size among good ones
+            optimal_idx = good_indices[0]
+        else:
+            # If no good indices, choose the best accuracy
+            optimal_idx = np.argmax(accuracies)
+
+        return optimal_idx, sample_sizes[optimal_idx]
+
+    def plot_results(self, save_path: Optional[str] = None) -> None:
+        """
+        Plot the optimization results.
+
+        Args:
+            save_path: Path to save the plot
+        """
+        if not self.results["sample_sizes"]:
+            logger.warning("No results to plot")
+            return
+
+        fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(12, 5))
+
+        # Plot accuracy and F1 score
+        ax1.plot(self.results["sample_sizes"], self.results["accuracies"],
+                 'b-o', label='Accuracy', markersize=8)
+        ax1.plot(self.results["sample_sizes"], self.results["f1_scores"],
+                 'r--s', label='F1 Score', markersize=8)
+
+        # Mark optimal point
+        optimal_idx, optimal_size = self.find_optimal_sample_size()
+        if optimal_idx >= 0:
+            ax1.axvline(x=optimal_size, color='g', linestyle=':', alpha=0.7,
+                        label=f'Optimal: {optimal_size}')
+
+        ax1.set_xlabel('Training Sample Size')
+        ax1.set_ylabel('Score')
+        ax1.set_title(f'{self.method_type.capitalize()} Performance vs Sample Size')
+        ax1.legend()
+        ax1.grid(True, alpha=0.3)
+        ax1.set_xscale('log')
+
+        # Plot training time
+        ax2.plot(self.results["sample_sizes"], self.results["training_times"],
+                 'g-^', label='Training Time', markersize=8)
+        ax2.set_xlabel('Training Sample Size')
+        ax2.set_ylabel('Time (seconds)')
+        ax2.set_title('Training Time vs Sample Size')
+        ax2.legend()
+        ax2.grid(True, alpha=0.3)
+        ax2.set_xscale('log')
+
+        plt.suptitle(f'Sample Size Optimization: {self.model_name} on {self.task_name}')
+        plt.tight_layout()
+
+        if save_path:
+            plt.savefig(save_path, dpi=150, bbox_inches='tight')
+            logger.info(f"Plot saved to {save_path}")
+        else:
+            plt.show()
+
+        plt.close()
+
+
+def optimize_sample_size(
+    model_name: str,
+    task_name: str,
+    layer: int,
+    method_type: str = "classification",
+    sample_sizes: Optional[List[int]] = None,
+    test_size: int = 200,
+    seed: int = 42,
+    verbose: bool = False,
+    save_plot: bool = False,
+    save_to_config: bool = True,
+    **method_kwargs
+) -> Dict[str, Any]:
+    """
+    Convenience function to run sample size optimization.
+
+    Args:
+        model_name: Model to optimize
+        task_name: Task to optimize for
+        layer: Layer to use
+        method_type: "classification" or "steering"
+        sample_sizes: Sample sizes to test
+        test_size: Fixed test set size
+        seed: Random seed
+        verbose: Verbose output
+        save_plot: Whether to save the plot
+        save_to_config: Whether to save results to model config
+        **method_kwargs: Method-specific arguments
+
+    Returns:
+        Optimization results
+    """
+    optimizer = SimplifiedSampleSizeOptimizer(
+        model_name=model_name,
+        task_name=task_name,
+        layer=layer,
+        method_type=method_type,
+        sample_sizes=sample_sizes,
+        test_size=test_size,
+        seed=seed,
+        verbose=verbose,
+        **method_kwargs
+    )
+
+    results = optimizer.run_optimization()
+
+    # Create plot if requested
+    if save_plot:
+        timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
+        plot_dir = f"sample_size_optimization/{model_name}"
+        os.makedirs(plot_dir, exist_ok=True)
+        plot_path = os.path.join(
+            plot_dir,
+            f"{task_name}_{method_type}_layer{layer}_{timestamp}.png"
+        )
+        optimizer.plot_results(plot_path)
+
+    # Save to config if requested
+    if save_to_config and results["optimal_sample_size"] > 0:
+        try:
+            config_manager = ModelConfigManager()
+
+            # For now, just log the optimal sample size
+            # TODO: Implement save_optimal_sample_size in ModelConfigManager
+            logger.info(
+                f"Optimal {method_type} sample size for {model_name} on {task_name}: "
+                f"{results['optimal_sample_size']} (accuracy: {results.get('optimal_accuracy', 'N/A')})"
+            )
+
+            if verbose:
+                print(f"\nšŸ’” Note: To use this optimal sample size, add --limit {results['optimal_sample_size']} to your commands")
+        except Exception as e:
+            logger.warning(f"Could not save to config: {e}")
+
+    return results
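For orientation, a minimal usage sketch of the optimizer module above (not part of the diff: the import path follows the file-list entry wisent/core/sample_size_optimizer_v2.py, and the model name, task name, and layer are placeholders):

    from wisent.core.sample_size_optimizer_v2 import optimize_sample_size

    # Placeholder model/task; layer and sample sizes are illustrative only.
    results = optimize_sample_size(
        model_name="meta-llama/Llama-3.1-8B-Instruct",
        task_name="winogrande",
        layer=15,
        method_type="classification",
        sample_sizes=[10, 50, 200],
        test_size=200,
        save_plot=True,
        classifier_type="logistic",  # forwarded through **method_kwargs
    )
    print(results["optimal_sample_size"], results["optimal_accuracy"])

Note the selection rule in find_optimal_sample_size: it returns the smallest training size whose accuracy is within 95% of the best observed, so the reported optimum favors cheaper runs over marginal accuracy gains.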
wisent/core/save_results.py
@@ -0,0 +1,277 @@
+"""
+Functions for saving wisent-guard evaluation results in various formats.
+"""
+
+import os
+import json
+import csv
+import logging
+from typing import Dict, Any
+
+logger = logging.getLogger(__name__)
+
+
+def save_results_json(results: Dict[str, Any], output_path: str) -> None:
+    """Save results to JSON file."""
+    try:
+        os.makedirs(os.path.dirname(output_path), exist_ok=True)
+
+        with open(output_path, 'w') as f:
+            json.dump(results, f, indent=2, default=str)
+
+        logger.info(f"Results saved to {output_path}")
+
+    except Exception as e:
+        logger.error(f"Failed to save results to {output_path}: {e}")
+
+
+def save_results_csv(results: Dict[str, Any], output_path: str) -> None:
+    """Save results to CSV file."""
+    try:
+        os.makedirs(os.path.dirname(output_path), exist_ok=True)
+
+        # Flatten results for CSV
+        rows = []
+        for task_name, task_results in results.items():
+            if isinstance(task_results, dict):
+                row = {"task": task_name}
+                row.update(task_results)
+                rows.append(row)
+
+        if rows:
+            with open(output_path, 'w', newline='') as f:
+                writer = csv.DictWriter(f, fieldnames=rows[0].keys())
+                writer.writeheader()
+                writer.writerows(rows)
+
+        logger.info(f"CSV results saved to {output_path}")
+
+    except Exception as e:
+        logger.error(f"Failed to save CSV to {output_path}: {e}")
+
+
+def save_classification_results_csv(results: Dict[str, Any], output_path: str) -> None:
+    """
+    Save detailed classification results to CSV file for manual evaluation.
+
+    Exports one row per response with:
+    - For single-layer: question, response, token_scores, overall_prediction, ground_truth
+    - For multi-layer: question, response, token_scores_layer_X (for each layer),
+      aggregated_score_layer_X (for each layer), overall_prediction_layer_X (for each layer), ground_truth
+    """
+    try:
+        os.makedirs(os.path.dirname(output_path), exist_ok=True)
+
+        csv_rows = []
+        all_layers = set()  # Track all layers for multi-layer mode
+        is_multi_layer = False
+
+        # First pass: determine if we have multi-layer data and collect all layers
+        for task_name, task_results in results.items():
+            if not isinstance(task_results, dict) or 'sample_responses' not in task_results:
+                continue
+
+            # Skip steering mode results (they don't have classification data)
+            if task_results.get('steering_mode', False):
+                continue
+
+            sample_responses = task_results['sample_responses']
+
+            for response_data in sample_responses:
+                layer_results = response_data.get('layer_results', {})
+                if layer_results:
+                    is_multi_layer = True
+                    all_layers.update(layer_results.keys())
+
+        # Sort layers for consistent column ordering
+        sorted_layers = sorted(all_layers) if all_layers else []
+
+        # Second pass: create CSV rows
+        for task_name, task_results in results.items():
+            if not isinstance(task_results, dict) or 'sample_responses' not in task_results:
+                continue
+
+            # Skip steering mode results (they don't have classification data)
+            if task_results.get('steering_mode', False):
+                continue
+
+            sample_responses = task_results['sample_responses']
+
+            for response_data in sample_responses:
+                layer_results = response_data.get('layer_results', {})
+
+                # Create base row
+                csv_row = {
+                    'question': response_data.get('question', ''),
+                    'response': response_data.get('response', ''),
+                    'ground_truth': ''  # Empty for user to fill
+                }
+
+                if is_multi_layer and layer_results:
+                    # Multi-layer mode: create columns for each layer
+                    for layer in sorted_layers:
+                        layer_data = layer_results.get(layer, {})
+
+                        # Format token scores as pipe-separated values
+                        token_scores_str = ""
+                        if layer_data.get('token_scores'):
+                            token_scores_formatted = [f"{score:.6f}" for score in layer_data['token_scores']]
+                            token_scores_str = "|".join(token_scores_formatted)
+
+                        # Add layer-specific columns
+                        csv_row[f'token_scores_layer_{layer}'] = token_scores_str
+                        csv_row[f'aggregated_score_layer_{layer}'] = f"{layer_data.get('aggregated_score', 0.0):.6f}"
+                        csv_row[f'overall_prediction_layer_{layer}'] = layer_data.get('classification', 'UNKNOWN')
+
+                elif not is_multi_layer:
+                    # Single-layer mode: use original format
+                    token_scores_str = ""
+                    if response_data.get('token_scores'):
+                        token_scores_formatted = [f"{score:.6f}" for score in response_data['token_scores']]
+                        token_scores_str = "|".join(token_scores_formatted)
+
+                    csv_row['token_scores'] = token_scores_str
+                    csv_row['aggregated_score'] = f"{response_data.get('aggregated_score', 0.0):.6f}"
+                    csv_row['overall_prediction'] = response_data.get('classification', 'UNKNOWN')
+
+                csv_rows.append(csv_row)
+
+        # Only save if we have classification data
+        if csv_rows:
+            # Determine fieldnames based on mode
+            if is_multi_layer:
+                fieldnames = ['question', 'response']
+                for layer in sorted_layers:
+                    fieldnames.extend([
+                        f'token_scores_layer_{layer}',
+                        f'aggregated_score_layer_{layer}',
+                        f'overall_prediction_layer_{layer}'
+                    ])
+                fieldnames.append('ground_truth')
+            else:
+                fieldnames = ['question', 'response', 'token_scores', 'aggregated_score', 'overall_prediction', 'ground_truth']
+
+            with open(output_path, 'w', newline='', encoding='utf-8') as f:
+                writer = csv.DictWriter(f, fieldnames=fieldnames)
+                writer.writeheader()
+                writer.writerows(csv_rows)
+
+            logger.info(f"Classification results CSV saved to {output_path}")
+            print(f"\nšŸ“Š Classification results saved to: {output_path}")
+            print(f" • {len(csv_rows)} responses exported")
+            if is_multi_layer:
+                print(f" • Multi-layer format with columns for layers: {sorted_layers}")
+                print(f" • Token scores, aggregated scores, and predictions saved per layer")
+            else:
+                print(f" • Single-layer format")
+            print(f" • Fill in the 'ground_truth' column with: 'TRUTHFUL' or 'HALLUCINATION'")
+            print(f" • Use for manual evaluation and classifier optimization")
+        else:
+            logger.info("No classification results to export (steering mode or empty results)")

+    except Exception as e:
+        logger.error(f"Failed to save classification CSV to {output_path}: {e}")
+
+
+def create_evaluation_report(results: Dict[str, Any], output_path: str) -> None:
+    """Create a comprehensive evaluation report in markdown format."""
+    try:
+        with open(output_path, 'w') as f:
+            f.write("# Wisent-Guard Evaluation Report\n\n")
+
+            # Summary table
+            f.write("## Summary\n\n")
+            f.write("| Task | Training Accuracy | Evaluation Accuracy | Optimization |\n")
+            f.write("|------|------------------|--------------------|--------------|\n")
+
+            for task_name, task_results in results.items():
+                if task_results is None:
+                    f.write(f"| {task_name} | NULL | NULL | N/A |\n")
+                elif isinstance(task_results, dict) and "error" in task_results:
+                    f.write(f"| {task_name} | ERROR | ERROR | N/A |\n")
+                elif isinstance(task_results, dict):
+                    train_acc = task_results.get("training_results", {}).get("accuracy", "N/A")
+                    eval_acc = task_results.get("evaluation_results", {}).get("accuracy", "N/A")
+                    optimized = "Yes" if task_results.get("optimization_performed", False) else "No"
+
+                    if isinstance(train_acc, float):
+                        train_acc = f"{train_acc:.2%}"
+                    if isinstance(eval_acc, float):
+                        eval_acc = f"{eval_acc:.2%}"
+
+                    f.write(f"| {task_name} | {train_acc} | {eval_acc} | {optimized} |\n")
+
+            # Detailed results for each task
+            for task_name, task_results in results.items():
+                f.write(f"\n## {task_name}\n\n")
+
+                if task_results is None:
+                    f.write(f"**Error**: Task results are None\n")
+                elif isinstance(task_results, dict) and "error" in task_results:
+                    f.write(f"**Error**: {task_results['error']}\n")
+                elif isinstance(task_results, dict):
+                    # Configuration
+                    f.write("### Configuration\n")
+                    f.write(f"- **Model**: {task_results.get('model_name', 'Unknown')}\n")
+                    f.write(f"- **Layer**: {task_results.get('layer', 'Unknown')}\n")
+                    f.write(f"- **Classifier**: {task_results.get('classifier_type', 'Unknown')}\n")
+                    f.write(f"- **Token Aggregation**: {task_results.get('token_aggregation', 'Unknown')}\n")
+                    f.write(f"- **Ground Truth Method**: {task_results.get('ground_truth_method', 'Unknown')}\n")
+
+                    # Training results
+                    if "training_results" in task_results:
+                        train_results = task_results["training_results"]
+                        f.write("\n### Training Results\n")
+                        train_acc = train_results.get('accuracy', 'N/A')
+                        if isinstance(train_acc, float):
+                            f.write(f"- **Accuracy**: {train_acc:.2%}\n")
+                        else:
+                            f.write(f"- **Accuracy**: {train_acc}\n")
+
+                        train_prec = train_results.get('precision', 'N/A')
+                        if isinstance(train_prec, float):
+                            f.write(f"- **Precision**: {train_prec:.2f}\n")
+                        else:
+                            f.write(f"- **Precision**: {train_prec}\n")
+
+                        train_recall = train_results.get('recall', 'N/A')
+                        if isinstance(train_recall, float):
+                            f.write(f"- **Recall**: {train_recall:.2f}\n")
+                        else:
+                            f.write(f"- **Recall**: {train_recall}\n")
+
+                        train_f1 = train_results.get('f1', 'N/A')
+                        if isinstance(train_f1, float):
+                            f.write(f"- **F1 Score**: {train_f1:.2f}\n")
+                        else:
+                            f.write(f"- **F1 Score**: {train_f1}\n")
+
+                    # Evaluation results
+                    if "evaluation_results" in task_results:
+                        eval_results = task_results["evaluation_results"]
+                        f.write("\n### Evaluation Results\n")
+                        eval_acc = eval_results.get('accuracy', 'N/A')
+                        if isinstance(eval_acc, float):
+                            f.write(f"- **Accuracy**: {eval_acc:.2%}\n")
+                        else:
+                            f.write(f"- **Accuracy**: {eval_acc}\n")
+                        f.write(f"- **Total Predictions**: {eval_results.get('total_predictions', 'N/A')}\n")
+                        f.write(f"- **Correct Predictions**: {eval_results.get('correct_predictions', 'N/A')}\n")
+
+                    # Optimization results
+                    if task_results.get("optimization_performed", False):
+                        f.write("\n### Optimization Results\n")
+                        f.write(f"- **Best Layer**: {task_results.get('best_layer', 'Unknown')}\n")
+                        f.write(f"- **Best Aggregation**: {task_results.get('best_aggregation', 'Unknown')}\n")
+                        best_acc = task_results.get('best_accuracy', 'Unknown')
+                        if isinstance(best_acc, float):
+                            f.write(f"- **Best Accuracy**: {best_acc:.2%}\n")
+                        else:
+                            f.write(f"- **Best Accuracy**: {best_acc}\n")
+
+            f.write(f"\n---\n\n*Report generated on {__import__('datetime').datetime.now().strftime('%Y-%m-%d %H:%M:%S')}*\n")
+
+        logger.info(f"Evaluation report saved to {output_path}")
+
+    except Exception as e:
+        logger.error(f"Failed to create report at {output_path}: {e}")