PyPI - wisent - Versions diffs - 0.1.1__py3-none-any.whl → 0.5.2__py3-none-any.whl - Mend

wisent 0.1.1-py3-none-any.whl → 0.5.2-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of wisent might be problematic. Click here for more details.

Files changed (237) hide show

wisent/__init__.py +1 -8
wisent/benchmarks/__init__.py +0 -0
wisent/benchmarks/coding/__init__.py +0 -0
wisent/benchmarks/coding/metrics/__init__.py +0 -0
wisent/benchmarks/coding/metrics/core/__init__.py +0 -0
wisent/benchmarks/coding/metrics/core/atoms.py +36 -0
wisent/benchmarks/coding/metrics/evaluator.py +275 -0
wisent/benchmarks/coding/metrics/passk.py +66 -0
wisent/benchmarks/coding/output_sanitizer/__init__.py +0 -0
wisent/benchmarks/coding/output_sanitizer/core/__init__.py +0 -0
wisent/benchmarks/coding/output_sanitizer/core/atoms.py +27 -0
wisent/benchmarks/coding/output_sanitizer/cpp_sanitizer.py +62 -0
wisent/benchmarks/coding/output_sanitizer/java_sanitizer.py +78 -0
wisent/benchmarks/coding/output_sanitizer/python_sanitizer.py +94 -0
wisent/benchmarks/coding/output_sanitizer/utils.py +107 -0
wisent/benchmarks/coding/providers/__init__.py +18 -0
wisent/benchmarks/coding/providers/core/__init__.py +0 -0
wisent/benchmarks/coding/providers/core/atoms.py +31 -0
wisent/benchmarks/coding/providers/livecodebench/__init__.py +0 -0
wisent/benchmarks/coding/providers/livecodebench/provider.py +53 -0
wisent/benchmarks/coding/safe_docker/__init__.py +0 -0
wisent/benchmarks/coding/safe_docker/core/__init__.py +0 -0
wisent/benchmarks/coding/safe_docker/core/atoms.py +105 -0
wisent/benchmarks/coding/safe_docker/core/runtime.py +118 -0
wisent/benchmarks/coding/safe_docker/entrypoint.py +123 -0
wisent/benchmarks/coding/safe_docker/recipes.py +60 -0
wisent/classifiers/__init__.py +0 -0
wisent/classifiers/core/__init__.py +0 -0
wisent/classifiers/core/atoms.py +747 -0
wisent/classifiers/models/__init__.py +0 -0
wisent/classifiers/models/logistic.py +29 -0
wisent/classifiers/models/mlp.py +47 -0
wisent/cli/__init__.py +0 -0
wisent/cli/classifiers/__init__.py +0 -0
wisent/cli/classifiers/classifier_rotator.py +137 -0
wisent/cli/cli_logger.py +142 -0
wisent/cli/data_loaders/__init__.py +0 -0
wisent/cli/data_loaders/data_loader_rotator.py +96 -0
wisent/cli/evaluators/__init__.py +0 -0
wisent/cli/evaluators/evaluator_rotator.py +148 -0
wisent/cli/steering_methods/__init__.py +0 -0
wisent/cli/steering_methods/steering_rotator.py +110 -0
wisent/cli/wisent_cli/__init__.py +0 -0
wisent/cli/wisent_cli/commands/__init__.py +0 -0
wisent/cli/wisent_cli/commands/help_cmd.py +52 -0
wisent/cli/wisent_cli/commands/listing.py +154 -0
wisent/cli/wisent_cli/commands/train_cmd.py +322 -0
wisent/cli/wisent_cli/main.py +93 -0
wisent/cli/wisent_cli/shell.py +80 -0
wisent/cli/wisent_cli/ui.py +69 -0
wisent/cli/wisent_cli/util/__init__.py +0 -0
wisent/cli/wisent_cli/util/aggregations.py +43 -0
wisent/cli/wisent_cli/util/parsing.py +126 -0
wisent/cli/wisent_cli/version.py +4 -0
wisent/core/__init__.py +27 -0
wisent/core/activations/__init__.py +0 -0
wisent/core/activations/activations_collector.py +338 -0
wisent/core/activations/core/__init__.py +0 -0
wisent/core/activations/core/atoms.py +216 -0
wisent/core/agent/__init__.py +18 -0
wisent/core/agent/budget.py +638 -0
wisent/core/agent/device_benchmarks.py +685 -0
wisent/core/agent/diagnose/__init__.py +55 -0
wisent/core/agent/diagnose/agent_classifier_decision.py +641 -0
wisent/core/agent/diagnose/classifier_marketplace.py +554 -0
wisent/core/agent/diagnose/create_classifier.py +1154 -0
wisent/core/agent/diagnose/response_diagnostics.py +268 -0
wisent/core/agent/diagnose/select_classifiers.py +506 -0
wisent/core/agent/diagnose/synthetic_classifier_option.py +754 -0
wisent/core/agent/diagnose/tasks/__init__.py +33 -0
wisent/core/agent/diagnose/tasks/task_manager.py +1456 -0
wisent/core/agent/diagnose/tasks/task_relevance.py +94 -0
wisent/core/agent/diagnose/tasks/task_selector.py +151 -0
wisent/core/agent/diagnose/test_synthetic_classifier.py +71 -0
wisent/core/agent/diagnose.py +242 -0
wisent/core/agent/steer.py +212 -0
wisent/core/agent/timeout.py +134 -0
wisent/core/autonomous_agent.py +1234 -0
wisent/core/bigcode_integration.py +583 -0
wisent/core/contrastive_pairs/__init__.py +15 -0
wisent/core/contrastive_pairs/core/__init__.py +0 -0
wisent/core/contrastive_pairs/core/atoms.py +45 -0
wisent/core/contrastive_pairs/core/buliders.py +59 -0
wisent/core/contrastive_pairs/core/pair.py +178 -0
wisent/core/contrastive_pairs/core/response.py +152 -0
wisent/core/contrastive_pairs/core/serialization.py +300 -0
wisent/core/contrastive_pairs/core/set.py +133 -0
wisent/core/contrastive_pairs/diagnostics/__init__.py +45 -0
wisent/core/contrastive_pairs/diagnostics/activations.py +53 -0
wisent/core/contrastive_pairs/diagnostics/base.py +73 -0
wisent/core/contrastive_pairs/diagnostics/control_vectors.py +169 -0
wisent/core/contrastive_pairs/diagnostics/coverage.py +79 -0
wisent/core/contrastive_pairs/diagnostics/divergence.py +98 -0
wisent/core/contrastive_pairs/diagnostics/duplicates.py +116 -0
wisent/core/contrastive_pairs/lm_eval_pairs/__init__.py +0 -0
wisent/core/contrastive_pairs/lm_eval_pairs/atoms.py +238 -0
wisent/core/contrastive_pairs/lm_eval_pairs/lm_extractor_manifest.py +8 -0
wisent/core/contrastive_pairs/lm_eval_pairs/lm_extractor_registry.py +132 -0
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/__init__.py +0 -0
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/winogrande.py +115 -0
wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_pairs_generation.py +50 -0
wisent/core/data_loaders/__init__.py +0 -0
wisent/core/data_loaders/core/__init__.py +0 -0
wisent/core/data_loaders/core/atoms.py +98 -0
wisent/core/data_loaders/loaders/__init__.py +0 -0
wisent/core/data_loaders/loaders/custom.py +120 -0
wisent/core/data_loaders/loaders/lm_loader.py +218 -0
wisent/core/detection_handling.py +257 -0
wisent/core/download_full_benchmarks.py +1386 -0
wisent/core/evaluators/__init__.py +0 -0
wisent/core/evaluators/oracles/__init__.py +0 -0
wisent/core/evaluators/oracles/interactive.py +73 -0
wisent/core/evaluators/oracles/nlp_evaluator.py +440 -0
wisent/core/evaluators/oracles/user_specified.py +67 -0
wisent/core/hyperparameter_optimizer.py +429 -0
wisent/core/lm_eval_harness_ground_truth.py +1396 -0
wisent/core/log_likelihoods_evaluator.py +321 -0
wisent/core/managed_cached_benchmarks.py +595 -0
wisent/core/mixed_benchmark_sampler.py +364 -0
wisent/core/model_config_manager.py +330 -0
wisent/core/model_persistence.py +317 -0
wisent/core/models/__init__.py +0 -0
wisent/core/models/core/__init__.py +0 -0
wisent/core/models/core/atoms.py +460 -0
wisent/core/models/wisent_model.py +727 -0
wisent/core/multi_steering.py +316 -0
wisent/core/optuna/__init__.py +57 -0
wisent/core/optuna/classifier/__init__.py +25 -0
wisent/core/optuna/classifier/activation_generator.py +349 -0
wisent/core/optuna/classifier/classifier_cache.py +509 -0
wisent/core/optuna/classifier/optuna_classifier_optimizer.py +606 -0
wisent/core/optuna/steering/__init__.py +0 -0
wisent/core/optuna/steering/bigcode_evaluator_wrapper.py +188 -0
wisent/core/optuna/steering/data_utils.py +342 -0
wisent/core/optuna/steering/metrics.py +474 -0
wisent/core/optuna/steering/optuna_pipeline.py +1738 -0
wisent/core/optuna/steering/steering_optimization.py +1111 -0
wisent/core/parser.py +1668 -0
wisent/core/prompts/__init__.py +0 -0
wisent/core/prompts/core/__init__.py +0 -0
wisent/core/prompts/core/atom.py +57 -0
wisent/core/prompts/core/prompt_formater.py +157 -0
wisent/core/prompts/prompt_stratiegies/__init__.py +0 -0
wisent/core/prompts/prompt_stratiegies/direct_completion.py +24 -0
wisent/core/prompts/prompt_stratiegies/instruction_following.py +24 -0
wisent/core/prompts/prompt_stratiegies/multiple_choice.py +29 -0
wisent/core/prompts/prompt_stratiegies/role_playing.py +31 -0
wisent/core/representation.py +5 -0
wisent/core/sample_size_optimizer.py +648 -0
wisent/core/sample_size_optimizer_v2.py +355 -0
wisent/core/save_results.py +277 -0
wisent/core/steering.py +652 -0
wisent/core/steering_method.py +26 -0
wisent/core/steering_methods/__init__.py +0 -0
wisent/core/steering_methods/core/__init__.py +0 -0
wisent/core/steering_methods/core/atoms.py +153 -0
wisent/core/steering_methods/methods/__init__.py +0 -0
wisent/core/steering_methods/methods/caa.py +44 -0
wisent/core/steering_optimizer.py +1297 -0
wisent/core/task_interface.py +132 -0
wisent/core/task_selector.py +189 -0
wisent/core/tasks/__init__.py +175 -0
wisent/core/tasks/aime_task.py +141 -0
wisent/core/tasks/file_task.py +211 -0
wisent/core/tasks/hle_task.py +180 -0
wisent/core/tasks/hmmt_task.py +119 -0
wisent/core/tasks/livecodebench_task.py +201 -0
wisent/core/tasks/livemathbench_task.py +158 -0
wisent/core/tasks/lm_eval_task.py +455 -0
wisent/core/tasks/math500_task.py +84 -0
wisent/core/tasks/polymath_task.py +146 -0
wisent/core/tasks/supergpqa_task.py +220 -0
wisent/core/time_estimator.py +149 -0
wisent/core/timing_calibration.py +174 -0
wisent/core/tracking/__init__.py +54 -0
wisent/core/tracking/latency.py +618 -0
wisent/core/tracking/memory.py +359 -0
wisent/core/trainers/__init__.py +0 -0
wisent/core/trainers/core/__init__.py +11 -0
wisent/core/trainers/core/atoms.py +45 -0
wisent/core/trainers/steering_trainer.py +271 -0
wisent/core/user_model_config.py +158 -0
wisent/opti/__init__.py +0 -0
wisent/opti/core/__init__.py +0 -0
wisent/opti/core/atoms.py +175 -0
wisent/opti/methods/__init__.py +0 -0
wisent/opti/methods/opti_classificator.py +172 -0
wisent/opti/methods/opti_steering.py +138 -0
wisent/synthetic/__init__.py +0 -0
wisent/synthetic/cleaners/__init__.py +0 -0
wisent/synthetic/cleaners/core/__init__.py +0 -0
wisent/synthetic/cleaners/core/atoms.py +58 -0
wisent/synthetic/cleaners/deduper_cleaner.py +53 -0
wisent/synthetic/cleaners/methods/__init__.py +0 -0
wisent/synthetic/cleaners/methods/base_dedupers.py +320 -0
wisent/synthetic/cleaners/methods/base_refusalers.py +286 -0
wisent/synthetic/cleaners/methods/core/__init__.py +0 -0
wisent/synthetic/cleaners/methods/core/atoms.py +47 -0
wisent/synthetic/cleaners/pairs_cleaner.py +90 -0
wisent/synthetic/cleaners/refusaler_cleaner.py +133 -0
wisent/synthetic/db_instructions/__init__.py +0 -0
wisent/synthetic/db_instructions/core/__init__.py +0 -0
wisent/synthetic/db_instructions/core/atoms.py +25 -0
wisent/synthetic/db_instructions/mini_dp.py +37 -0
wisent/synthetic/generators/__init__.py +0 -0
wisent/synthetic/generators/core/__init__.py +0 -0
wisent/synthetic/generators/core/atoms.py +73 -0
wisent/synthetic/generators/diversities/__init__.py +0 -0
wisent/synthetic/generators/diversities/core/__init__.py +0 -0
wisent/synthetic/generators/diversities/core/core.py +68 -0
wisent/synthetic/generators/diversities/methods/__init__.py +0 -0
wisent/synthetic/generators/diversities/methods/fast_diversity.py +249 -0
wisent/synthetic/generators/pairs_generator.py +179 -0
wisent-0.5.2.dist-info/METADATA +67 -0
wisent-0.5.2.dist-info/RECORD +218 -0
{wisent-0.1.1.dist-info → wisent-0.5.2.dist-info}/WHEEL +1 -1
{wisent-0.1.1.dist-info → wisent-0.5.2.dist-info/licenses}/LICENSE +2 -2
wisent/activations/__init__.py +0 -9
wisent/activations/client.py +0 -97
wisent/activations/extractor.py +0 -251
wisent/activations/models.py +0 -95
wisent/client.py +0 -45
wisent/control_vector/__init__.py +0 -9
wisent/control_vector/client.py +0 -85
wisent/control_vector/manager.py +0 -168
wisent/control_vector/models.py +0 -70
wisent/inference/__init__.py +0 -9
wisent/inference/client.py +0 -103
wisent/inference/inferencer.py +0 -250
wisent/inference/models.py +0 -66
wisent/utils/__init__.py +0 -3
wisent/utils/auth.py +0 -30
wisent/utils/http.py +0 -228
wisent/version.py +0 -3
wisent-0.1.1.dist-info/METADATA +0 -142
wisent-0.1.1.dist-info/RECORD +0 -23
{wisent-0.1.1.dist-info → wisent-0.5.2.dist-info}/top_level.txt +0 -0

wisent/classifiers/models/__init__.py ADDED Viewed

File without changes

wisent/classifiers/models/logistic.py ADDED Viewed

@@ -0,0 +1,29 @@
+from __future__ import annotations
+import torch
+from torch import nn
+from wisent.classifiers.core.atoms import BaseClassifier
+__all__ = ["LogisticClassifier"]
+class LogisticModel(nn.Module):
+    """Single linear layer followed by a sigmoid, yielding one value in (0, 1) per row."""
+    def __init__(self, input_dim: int):
+        super().__init__()
+        self.linear = nn.Linear(input_dim, 1)
+        self.sigmoid = nn.Sigmoid()
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        """Return ``sigmoid(linear(x))``; a 1-D result gets a trailing axis of size 1."""
+        scores = self.linear(x)
+        # Keep the output two-dimensional even when a single unbatched vector was passed in.
+        scores = scores.unsqueeze(1) if scores.ndim == 1 else scores
+        return self.sigmoid(scores)
+class LogisticClassifier(BaseClassifier):
+    """`BaseClassifier` subclass named "logistic" whose network is a `LogisticModel`."""
+    name = "logistic"
+    description = "One-layer logistic regression over dense features"
+    def build_model(self, input_dim: int, **_: object) -> nn.Module:
+        """Create a fresh `LogisticModel` for `input_dim` features; extra keyword arguments are ignored."""
+        model = LogisticModel(input_dim)
+        return model

wisent/classifiers/models/mlp.py ADDED Viewed

@@ -0,0 +1,47 @@
+from __future__ import annotations
+import torch
+from torch import nn
+from wisent.classifiers.core.atoms import BaseClassifier
+__all__ = ["MLPClassifier"]
+class MLPModel(nn.Module):
+    """Feed-forward net: input -> hidden_dim -> hidden_dim // 2 -> 1, ending in a sigmoid."""
+    def __init__(self, input_dim: int, hidden_dim: int = 128, dropout: float = 0.2):
+        super().__init__()
+        half_dim = hidden_dim // 2
+        # Layers are created in the same order as they run, so parameter names stay net.0, net.3, net.6.
+        layers = [
+            nn.Linear(input_dim, hidden_dim),
+            nn.ReLU(),
+            nn.Dropout(dropout),
+            nn.Linear(hidden_dim, half_dim),
+            nn.ReLU(),
+            nn.Dropout(dropout),
+            nn.Linear(half_dim, 1),
+            nn.Sigmoid(),
+        ]
+        self.net = nn.Sequential(*layers)
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        """Run the stack on `x`; a 1-D result gets a trailing axis of size 1."""
+        probs = self.net(x)
+        return probs.unsqueeze(1) if probs.ndim == 1 else probs
+class MLPClassifier(BaseClassifier):
+    """
+    `BaseClassifier` subclass named "mlp" whose network is an `MLPModel`.
+    The hidden width and dropout used by the most recent `build_model` call are
+    remembered so that `model_hyperparams` reports what was actually built.
+    """
+    name = "mlp"
+    description = "Two-layer MLP with dropout and ReLU"
+    def __init__(self, *, hidden_dim: int = 128, **base_kwargs):
+        """Store the default hidden width; all other keyword arguments go to the base class."""
+        super().__init__(**base_kwargs)
+        self._hidden_dim = int(hidden_dim)
+        # Same default as MLPModel; overwritten by build_model when a dropout is supplied.
+        self._dropout = 0.2
+    def build_model(self, input_dim: int, **model_params: object) -> nn.Module:
+        """
+        Build an `MLPModel` for `input_dim` features.
+        Recognised `model_params`: "hidden_dim" (defaults to the stored width) and
+        "dropout" (defaults to the stored rate, initially 0.2). Both are remembered.
+        """
+        hd = int(model_params.get("hidden_dim", self._hidden_dim))
+        # getattr guards instances restored without running __init__.
+        dp = float(model_params.get("dropout", getattr(self, "_dropout", 0.2)))
+        self._hidden_dim = hd
+        self._dropout = dp
+        return MLPModel(input_dim, hidden_dim=hd, dropout=dp)
+    def model_hyperparams(self) -> dict[str, int | float]:
+        """Return the hidden width and dropout of the most recently built model."""
+        return {"hidden_dim": self._hidden_dim, "dropout": getattr(self, "_dropout", 0.2)}

wisent/cli/__init__.py ADDED Viewed

File without changes

wisent/cli/classifiers/__init__.py ADDED Viewed

File without changes

wisent/cli/classifiers/classifier_rotator.py ADDED Viewed

@@ -0,0 +1,137 @@
+from __future__ import annotations
+import importlib
+import importlib.util
+import inspect
+import pkgutil
+from pathlib import Path
+from typing import Any
+from wisent.core.classifiers.core.atoms import BaseClassifier, ClassifierError, ClassifierTrainReport
+__all__ = ["ClassifierRotator"]
+class ClassifierRotator:
+    """
+    Discover, list, and delegate to registered classifiers.
+    The rotator holds one active `BaseClassifier` and forwards `fit`, `predict`,
+    `predict_proba`, `evaluate`, `save_model`, `load_model` and `set_threshold` to it.
+    """
+    # NOTE(review): this module imports BaseClassifier from `wisent.core.classifiers.core.atoms`
+    # while the bundled models import it from `wisent.classifiers.core.atoms` - confirm both
+    # resolve to the same class, otherwise registrations will not be visible here.
+    # Default package scanned for classifier modules. The previous default named
+    # "wisent_guard.core.classifiers.models", a package this distribution does not ship.
+    _DEFAULT_LOCATION = "wisent.classifiers.models"
+    def __init__(
+        self,
+        classifier: str | BaseClassifier | type[BaseClassifier] | None = None,
+        classifiers_location: str | Path = _DEFAULT_LOCATION,
+        autoload: bool = True,
+        **classifier_kwargs: Any,
+    ) -> None:
+        """
+        Args:
+            classifier: name, instance, or subclass to activate; None picks the first registered name.
+            classifiers_location: dotted package path or directory scanned when `autoload` is true.
+            autoload: import classifier modules before resolving `classifier`.
+            **classifier_kwargs: forwarded to the classifier constructor when one is instantiated.
+        """
+        if autoload:
+            self.discover_classifiers(classifiers_location)
+        self._classifier = self._resolve_classifier(classifier, **classifier_kwargs)
+    @staticmethod
+    def discover_classifiers(location: str | Path = _DEFAULT_LOCATION) -> None:
+        """
+        Import all classifier modules so BaseClassifier subclasses self-register.
+        - If `location` is a dotted module path (str without existing FS path),
+          import that package and iterate its __path__ (works with namespace packages).
+        - If `location` is an existing directory (Path/str), import all .py files inside.
+        Raises:
+            ClassifierError: `location` is neither a directory nor an importable dotted path.
+        """
+        loc_path = Path(str(location))
+        if loc_path.exists() and loc_path.is_dir():
+            ClassifierRotator._import_all_py_in_dir(loc_path)
+            return
+        if not isinstance(location, str):
+            raise ClassifierError(
+                f"Invalid classifiers location: {location!r}. Provide a dotted module path or a directory."
+            )
+        try:
+            pkg = importlib.import_module(location)
+        except ModuleNotFoundError as exc:
+            raise ClassifierError(
+                f"Cannot import classifier package {location!r}. "
+                f"Use a dotted path (no leading slash) and ensure your project root is on PYTHONPATH."
+            ) from exc
+        search_paths = list(getattr(pkg, "__path__", []))
+        if not search_paths:
+            # Fall back to the directory of __file__ when the module exposes no __path__.
+            pkg_file = getattr(pkg, "__file__", None)
+            if pkg_file:
+                search_paths = [str(Path(pkg_file).parent)]
+        for _finder, name, _ispkg in pkgutil.iter_modules(search_paths):
+            # Private modules (leading underscore) are skipped.
+            if name.startswith("_"):
+                continue
+            importlib.import_module(f"{location}.{name}")
+    @staticmethod
+    def _import_all_py_in_dir(directory: Path) -> None:
+        """Execute every non-underscore ``*.py`` file in `directory` as a standalone module."""
+        for py in directory.glob("*.py"):
+            if py.name.startswith("_"):
+                continue
+            mod_name = f"_dyn_classifiers_{py.stem}"
+            spec = importlib.util.spec_from_file_location(mod_name, py)
+            if spec and spec.loader:
+                module = importlib.util.module_from_spec(spec)
+                spec.loader.exec_module(module)  # type: ignore[attr-defined]
+    @staticmethod
+    def list_classifiers() -> list[dict[str, Any]]:
+        """Return name / description / qualified class for each registered classifier, sorted by name."""
+        out: list[dict[str, Any]] = [
+            {
+                "name": name,
+                "description": getattr(cls, "description", ""),
+                "class": f"{cls.__module__}.{cls.__name__}",
+            }
+            for name, cls in BaseClassifier.list_registered().items()
+        ]
+        return sorted(out, key=lambda x: x["name"])
+    @staticmethod
+    def _resolve_classifier(
+        classifier: str | BaseClassifier | type[BaseClassifier] | None,
+        **kwargs: Any,
+    ) -> BaseClassifier:
+        """
+        Turn `classifier` into an instance.
+        Raises:
+            ClassifierError: `classifier` is None and nothing is registered.
+            TypeError: `classifier` is of an unsupported type.
+        """
+        if classifier is None:
+            registry = BaseClassifier.list_registered()
+            if not registry:
+                raise ClassifierError("No classifiers registered.")
+            # Deterministic pick: first by name
+            return registry[min(registry)](**kwargs)
+        if isinstance(classifier, BaseClassifier):
+            # An existing instance is used as-is; kwargs are not applied to it.
+            return classifier
+        if inspect.isclass(classifier) and issubclass(classifier, BaseClassifier):
+            return classifier(**kwargs)
+        if isinstance(classifier, str):
+            cls = BaseClassifier.get(classifier)
+            return cls(**kwargs)
+        raise TypeError(
+            "classifier must be None, a name (str), BaseClassifier instance, or BaseClassifier subclass."
+        )
+    def use(self, classifier: str | BaseClassifier | type[BaseClassifier], **kwargs: Any) -> None:
+        """Replace the active classifier."""
+        self._classifier = self._resolve_classifier(classifier, **kwargs)
+    def fit(self, X, y, **kwargs) -> ClassifierTrainReport:
+        """Delegate to the active classifier's `fit`."""
+        return self._classifier.fit(X, y, **kwargs)
+    def predict(self, X):
+        """Delegate to the active classifier's `predict`."""
+        return self._classifier.predict(X)
+    def predict_proba(self, X):
+        """Delegate to the active classifier's `predict_proba`."""
+        return self._classifier.predict_proba(X)
+    def evaluate(self, X, y) -> dict[str, float]:
+        """Delegate to the active classifier's `evaluate`."""
+        return self._classifier.evaluate(X, y)
+    def save_model(self, path: str) -> None:
+        """Delegate to the active classifier's `save_model`."""
+        self._classifier.save_model(path)
+    def load_model(self, path: str) -> None:
+        """Delegate to the active classifier's `load_model`."""
+        self._classifier.load_model(path)
+    def set_threshold(self, threshold: float) -> None:
+        """Delegate to the active classifier's `set_threshold`."""
+        self._classifier.set_threshold(threshold)

wisent/cli/cli_logger.py ADDED Viewed

@@ -0,0 +1,142 @@
+from __future__ import annotations
+import json
+import logging
+import sys
+from datetime import datetime, timezone
+from typing import Any, Mapping
+__all__ = [
+    "setup_logger",
+    "bind",
+    "JsonFormatter",
+    "ContextAdapter",
+    "add_file_handler",
+]
+class JsonFormatter(logging.Formatter):
+    """
+    Minimal JSON formatter with structured fields + extras.
+    Every record attribute that is not a standard `LogRecord` field (and does not
+    start with an underscore) is emitted under the "extra" key.
+    """
+    # Standard LogRecord attributes that must not be reported as user extras.
+    # "message" and "asctime" are set on the record by logging.Formatter.format, so they
+    # appear when another handler has already formatted the same record; "taskName" is
+    # present on every record from Python 3.12 on.
+    _STD = {
+        "name", "msg", "args", "levelname", "levelno", "pathname",
+        "filename", "module", "exc_info", "exc_text", "stack_info",
+        "lineno", "funcName", "created", "msecs", "relativeCreated",
+        "thread", "threadName", "processName", "process",
+        "message", "asctime", "taskName",
+    }
+    def format(self, record: logging.LogRecord) -> str:
+        """Serialize `record` to a single-line JSON string."""
+        payload: dict[str, Any] = {
+            "ts": datetime.fromtimestamp(record.created, tz=timezone.utc).isoformat(),
+            "level": record.levelname,
+            "logger": record.name,
+            "message": record.getMessage(),
+            "file": record.filename,
+            "func": record.funcName,
+            "line": record.lineno,
+        }
+        extras = {
+            k: v for k, v in record.__dict__.items()
+            if k not in self._STD and not k.startswith("_")
+        }
+        if extras:
+            payload["extra"] = extras
+        if record.exc_info:
+            payload["exc"] = self.formatException(record.exc_info)
+        # default=str: a non-JSON extra (Path, datetime, ...) is stringified instead of
+        # raising TypeError inside the handler, which would drop the whole log line.
+        return json.dumps(payload, ensure_ascii=False, default=str)
+class ContextAdapter(logging.LoggerAdapter):
+    """
+    LoggerAdapter that ensures persistent context fields appear in every log entry.
+    """
+    def process(self, msg, kwargs):
+        """
+        Merge the adapter's context into the per-call ``extra`` mapping.
+        The adapter's fields win on key collisions. A new dict is built so the
+        mapping passed by the caller is never mutated, and ``extra=None`` is accepted.
+        """
+        merged = dict(kwargs.get("extra") or {})
+        merged.update(self.extra or {})
+        kwargs["extra"] = merged
+        return msg, kwargs
+class _EnsureContextFilter(logging.Filter):
+    """
+    Fills in fallback values for context attributes missing from a record, so
+    format strings that reference them never fail. It never rejects a record.
+    """
+    def __init__(self, defaults: Mapping[str, Any] | None = None):
+        super().__init__()
+        # Private copy, so later changes to the caller's mapping have no effect.
+        self.defaults = dict(defaults) if defaults else {}
+    def filter(self, record: logging.LogRecord) -> bool:
+        absent = [key for key in self.defaults if not hasattr(record, key)]
+        for key in absent:
+            setattr(record, key, self.defaults[key])
+        return True
+def setup_logger(
+    name: str = "wisent",
+    level: int = logging.INFO,
+    *,
+    json_logs: bool = False,
+    stream = sys.stderr,
+) -> logging.Logger:
+    """
+    Fetch the logger called `name`, set its level, and - only if it has no handlers
+    yet - attach one stream handler (JSON or text) and turn propagation off.
+    Repeated calls therefore never stack up duplicate handlers.
+    """
+    log = logging.getLogger(name)
+    log.setLevel(level)
+    if log.handlers:
+        # Already configured: only the level is refreshed.
+        return log
+    if json_logs:
+        formatter: logging.Formatter = JsonFormatter()
+    else:
+        formatter = logging.Formatter(
+            fmt="%(asctime)s | %(levelname)-8s | %(name)s | %(message)s "
+                "[file=%(filename)s func=%(funcName)s line=%(lineno)d] "
+                "%(task_name)s%(subtask)s",
+            datefmt="%Y-%m-%dT%H:%M:%S%z",
+        )
+    stream_handler = logging.StreamHandler(stream)
+    stream_handler.setFormatter(formatter)
+    # The text format references task_name/subtask, so give them empty defaults.
+    stream_handler.addFilter(_EnsureContextFilter({"task_name": "", "subtask": ""}))
+    log.addHandler(stream_handler)
+    log.propagate = False
+    return log
+def add_file_handler(
+    logger: logging.Logger,
+    filepath: str,
+    *,
+    level: int | None = None,
+    json_logs: bool = False,
+) -> None:
+    """
+    Optionally add a file handler (e.g., for long-running CLI jobs).
+    Args:
+        logger: logger that receives the new handler.
+        filepath: file to write to, opened as UTF-8.
+        level: handler level; None means "use the logger's current level".
+        json_logs: use `JsonFormatter` instead of the text format.
+    """
+    fh = logging.FileHandler(filepath, encoding="utf-8")
+    # Compare against None explicitly: logging.NOTSET is 0 and is a valid explicit level.
+    fh.setLevel(level if level is not None else logger.level)
+    if json_logs:
+        fh.setFormatter(JsonFormatter())
+    else:
+        fh.setFormatter(logging.Formatter(
+            fmt="%(asctime)s | %(levelname)-8s | %(name)s | %(message)s "
+                "[file=%(filename)s func=%(funcName)s line=%(lineno)d] "
+                "%(task_name)s%(subtask)s",
+            datefmt="%Y-%m-%dT%H:%M:%S%z",
+        ))
+    # The text format references task_name/subtask, so give them empty defaults.
+    fh.addFilter(_EnsureContextFilter({"task_name": "", "subtask": ""}))
+    logger.addHandler(fh)
+def bind(
+    logger: logging.Logger | ContextAdapter,
+    **extra: Any
+) -> ContextAdapter:
+    """
+    Wrap `logger` in a ContextAdapter carrying `extra`.
+    When `logger` is already a ContextAdapter, its fields are combined with `extra`
+    (new values win) and the adapter's underlying logger is re-wrapped.
+    """
+    if not isinstance(logger, ContextAdapter):
+        return ContextAdapter(logger, extra)
+    combined = {**logger.extra, **extra}
+    return ContextAdapter(logger.logger, combined)

wisent/cli/data_loaders/__init__.py ADDED Viewed

File without changes

wisent/cli/data_loaders/data_loader_rotator.py ADDED Viewed

@@ -0,0 +1,96 @@
+from __future__ import annotations
+import importlib
+import importlib.util
+import inspect
+import pkgutil
+from pathlib import Path
+from typing import Any, Dict, List, Optional, Type, Union
+from wisent.core.data_loaders.core.atoms import BaseDataLoader, DataLoaderError, LoadDataResult
+class DataLoaderRotator:
+    """
+    Discover/select a data loader and use it to load data.
+    Only loaders whose defining module falls inside the rotator's scope are eligible:
+    the dotted `loaders_location`, plus dynamically imported modules when the location
+    is a directory.
+    """
+    # Default package scanned for loaders. The previous default used the prefix
+    # "wisent_guard.", which never matches modules under "wisent.core.data_loaders".
+    _DEFAULT_LOCATION = "wisent.core.data_loaders.loaders"
+    # Module-name prefix given to files imported from a directory (see discover_loaders).
+    _DYNAMIC_MODULE_PREFIX = "_dyn_dataloaders_"
+    def __init__(
+        self,
+        loader: Union[str, BaseDataLoader, Type[BaseDataLoader], None] = None,
+        loaders_location: Union[str, Path] = _DEFAULT_LOCATION,
+        autoload: bool = True,
+        **default_loader_kwargs: Any,
+    ) -> None:
+        """
+        Args:
+            loader: name, instance, or subclass to activate; None picks the first in-scope name.
+            loaders_location: dotted package path or directory scanned when `autoload` is true.
+            autoload: import loader modules before resolving `loader`.
+            **default_loader_kwargs: forwarded to the loader constructor (or merged into an instance).
+        """
+        self._scope_prefix = (
+            loaders_location if isinstance(loaders_location, str)
+            else Path(loaders_location).as_posix().replace("/", ".")
+        )
+        self._scope_prefixes: tuple[str, ...] = (self._scope_prefix,)
+        if Path(str(loaders_location)).is_dir():
+            # Directory-discovered loaders live in "_dyn_dataloaders_<stem>" modules, which
+            # never start with the path-derived prefix; admit them explicitly.
+            self._scope_prefixes += (self._DYNAMIC_MODULE_PREFIX,)
+        if autoload:
+            self.discover_loaders(loaders_location)
+        self._loader = self._resolve_loader(loader, **default_loader_kwargs)
+    @staticmethod
+    def discover_loaders(location: Union[str, Path]) -> None:
+        """
+        Import loader modules so BaseDataLoader subclasses can register themselves.
+        An existing directory has each non-underscore ``*.py`` file executed; otherwise
+        `location` must be a dotted package path whose non-underscore submodules are imported.
+        Raises:
+            DataLoaderError: `location` is neither an existing directory nor a string.
+        """
+        loc_path = Path(str(location))
+        if loc_path.exists() and loc_path.is_dir():
+            for py in loc_path.glob("*.py"):
+                if py.name.startswith("_"):
+                    continue
+                mod_name = f"{DataLoaderRotator._DYNAMIC_MODULE_PREFIX}{py.stem}"
+                spec = importlib.util.spec_from_file_location(mod_name, py)
+                if spec and spec.loader:
+                    module = importlib.util.module_from_spec(spec)
+                    spec.loader.exec_module(module)  # type: ignore[attr-defined]
+            return
+        if not isinstance(location, str):
+            raise DataLoaderError(f"Invalid loaders location: {location!r}. Provide dotted path or a directory.")
+        pkg = importlib.import_module(location)
+        search_paths = list(getattr(pkg, "__path__", []))
+        if not search_paths:
+            # Fall back to the directory of __file__; skip when it is missing or None
+            # rather than scanning the current working directory.
+            pkg_file = getattr(pkg, "__file__", None)
+            if pkg_file:
+                search_paths = [Path(pkg_file).parent.as_posix()]
+        for _, name, _ in pkgutil.iter_modules(search_paths):
+            if name.startswith("_"):
+                continue
+            importlib.import_module(f"{location}.{name}")
+    def _in_scope(self, cls: type) -> bool:
+        """Return True when `cls` is defined in a module covered by this rotator's scope."""
+        prefixes = getattr(self, "_scope_prefixes", (self._scope_prefix,))
+        return cls.__module__.startswith(prefixes)
+    def _scoped_registry(self) -> dict[str, type[BaseDataLoader]]:
+        """Return the registered loaders that are inside this rotator's scope."""
+        reg = BaseDataLoader.list_registered()
+        return {n: c for n, c in reg.items() if self._in_scope(c)}
+    @staticmethod
+    def list_loaders(scope_prefix: Optional[str] = None) -> List[Dict[str, Any]]:
+        """List name / description / qualified class of registered loaders, sorted by name."""
+        reg = BaseDataLoader.list_registered()
+        if scope_prefix:
+            reg = {n: c for n, c in reg.items() if c.__module__.startswith(scope_prefix)}
+        return [
+            {"name": n, "description": getattr(c, "description", ""), "class": f"{c.__module__}.{c.__name__}"}
+            for n, c in sorted(reg.items(), key=lambda kv: kv[0])
+        ]
+    def _resolve_loader(
+        self,
+        loader: Union[str, BaseDataLoader, Type[BaseDataLoader], None],
+        **kwargs: Any,
+    ) -> BaseDataLoader:
+        """
+        Turn `loader` into an instance.
+        Raises:
+            DataLoaderError: nothing is in scope, the name is unknown, or the class is out of scope.
+            TypeError: `loader` is of an unsupported type.
+        """
+        reg = self._scoped_registry()
+        if loader is None:
+            if not reg:
+                raise DataLoaderError(f"No data loaders registered under {self._scope_prefix!r}.")
+            # Deterministic pick: first by name.
+            return reg[min(reg)](**kwargs)
+        if isinstance(loader, BaseDataLoader):
+            # The instance's own kwargs win over the rotator defaults; tolerate instances
+            # without a `kwargs` attribute, as `load` already does.
+            loader.kwargs = {**kwargs, **getattr(loader, "kwargs", {})}
+            return loader
+        if inspect.isclass(loader) and issubclass(loader, BaseDataLoader):
+            if not self._in_scope(loader):
+                raise DataLoaderError(f"Loader class must live under {self._scope_prefix!r}.")
+            return loader(**kwargs)
+        if isinstance(loader, str):
+            if loader not in reg:
+                raise DataLoaderError(f"Unknown loader {loader!r} in scope {self._scope_prefix!r}.")
+            return reg[loader](**kwargs)
+        raise TypeError("loader must be None, a name (str), BaseDataLoader instance, or BaseDataLoader subclass.")
+    def use(self, loader: Union[str, BaseDataLoader, Type[BaseDataLoader]], **kwargs: Any) -> None:
+        """Replace the active loader."""
+        self._loader = self._resolve_loader(loader, **kwargs)
+    def load(self, **kwargs: Any) -> LoadDataResult:
+        """Call the active loader's `load`, with call-time kwargs overriding the loader's stored ones."""
+        merged = {**getattr(self._loader, "kwargs", {}), **kwargs}
+        return self._loader.load(**merged)

wisent/cli/evaluators/__init__.py ADDED Viewed

File without changes

wisent/cli/evaluators/evaluator_rotator.py ADDED Viewed

@@ -0,0 +1,148 @@
+from __future__ import annotations
+import importlib
+import importlib.util
+import pkgutil
+from pathlib import Path
+from typing import Any, Dict, List, Optional, Sequence, Union, Type
+import inspect
+import logging
+from wisent.core.evaluators.core.atoms import BaseEvaluator, EvalResult, EvaluatorError
+logger = logging.getLogger(__name__)
+class EvaluatorRotator:
+    """
+    Orchestrates evaluator selection and execution with flexible discovery.
+    The rotator holds one active `BaseEvaluator` and an optional default task name
+    that is passed to every evaluation call unless the caller supplies its own.
+    """
+    # NOTE(review): BaseEvaluator is imported from `wisent.core.evaluators.core.atoms`, but the
+    # file list for this release shows only `wisent/core/evaluators/oracles/` - confirm the
+    # atoms module is actually shipped.
+    # Default package scanned for evaluator modules. The previous default named
+    # "wisent_guard.core.evaluators.oracles", a package this distribution does not ship.
+    _DEFAULT_LOCATION = "wisent.core.evaluators.oracles"
+    def __init__(
+        self,
+        evaluator: Union[str, BaseEvaluator, Type[BaseEvaluator], None] = None,
+        task_name: Optional[str] = None,
+        evaluators_location: Union[str, Path] = _DEFAULT_LOCATION,
+        autoload: bool = True,
+    ) -> None:
+        """
+        Args:
+            evaluator: name, instance, or subclass to activate; None prefers "lm_eval".
+            task_name: default `task_name` keyword for `evaluate` / `evaluate_batch`.
+            evaluators_location: dotted package path or directory scanned when `autoload` is true.
+            autoload: import evaluator modules before resolving `evaluator`.
+        """
+        if autoload:
+            self.discover_evaluators(evaluators_location)
+        self._evaluator = self._resolve_evaluator(evaluator)
+        self._task_name = task_name
+    @staticmethod
+    def discover_evaluators(location: Union[str, Path] = _DEFAULT_LOCATION) -> None:
+        """
+        Import all evaluator modules so BaseEvaluator subclasses self-register.
+        - If `location` is a dotted module path (str without existing FS path),
+          import that package and iterate its __path__ (works with namespace packages).
+        - If `location` is an existing directory (Path/str), import all .py files inside.
+        Raises:
+            EvaluatorError: `location` is neither a directory nor an importable dotted path.
+        """
+        loc_path = Path(str(location))
+        if loc_path.exists() and loc_path.is_dir():
+            EvaluatorRotator._import_all_py_in_dir(loc_path)
+            return
+        if not isinstance(location, str):
+            raise EvaluatorError(
+                f"Invalid evaluators location: {location!r}. Provide a dotted module path or a directory."
+            )
+        try:
+            pkg = importlib.import_module(location)
+        except ModuleNotFoundError as exc:
+            raise EvaluatorError(
+                f"Cannot import evaluator package {location!r}. "
+                f"Use dotted path (no leading slash) and ensure your project root is on PYTHONPATH."
+            ) from exc
+        search_paths = list(getattr(pkg, "__path__", []))  # supports namespace pkgs
+        if not search_paths:
+            # Some packages may still have __file__ only
+            pkg_file = getattr(pkg, "__file__", None)
+            if pkg_file:
+                search_paths = [str(Path(pkg_file).parent)]
+        for _finder, name, _ispkg in pkgutil.iter_modules(search_paths):
+            # Private modules (leading underscore) are skipped.
+            if name.startswith("_"):
+                continue
+            importlib.import_module(f"{location}.{name}")
+    @staticmethod
+    def _import_all_py_in_dir(directory: Path) -> None:
+        """Execute every non-underscore ``*.py`` file in `directory` as a standalone module."""
+        for py in directory.glob("*.py"):
+            if py.name.startswith("_"):
+                continue
+            mod_name = f"_dyn_evaluators_{py.stem}"
+            spec = importlib.util.spec_from_file_location(mod_name, py)
+            if spec and spec.loader:
+                module = importlib.util.module_from_spec(spec)
+                spec.loader.exec_module(module)  # type: ignore[attr-defined]
+    @staticmethod
+    def list_evaluators() -> List[Dict[str, Any]]:
+        """Return name / description / task names / qualified class per evaluator, sorted by name."""
+        out: List[Dict[str, Any]] = [
+            {
+                "name": name,
+                "description": getattr(cls, "description", ""),
+                "task_names": list(getattr(cls, "task_names", ())),
+                "class": f"{cls.__module__}.{cls.__name__}",
+            }
+            for name, cls in BaseEvaluator.list_registered().items()
+        ]
+        return sorted(out, key=lambda x: x["name"])
+    @staticmethod
+    def _resolve_evaluator(
+        evaluator: Union[str, BaseEvaluator, Type[BaseEvaluator], None]
+    ) -> BaseEvaluator:
+        """
+        Turn `evaluator` into an instance.
+        Raises:
+            EvaluatorError: `evaluator` is None and nothing is registered.
+            TypeError: `evaluator` is of an unsupported type.
+        """
+        if evaluator is None:
+            registry = BaseEvaluator.list_registered()
+            # Prefer "lm_eval" when present, otherwise the first entry the registry yields.
+            if "lm_eval" in registry:
+                return registry["lm_eval"]()
+            if registry:
+                return next(iter(registry.values()))()
+            raise EvaluatorError("No evaluators registered.")
+        if isinstance(evaluator, BaseEvaluator):
+            return evaluator
+        if inspect.isclass(evaluator) and issubclass(evaluator, BaseEvaluator):
+            return evaluator()
+        if isinstance(evaluator, str):
+            cls = BaseEvaluator.get(evaluator)
+            return cls()
+        raise TypeError(
+            "evaluator must be None, a name (str), BaseEvaluator instance, or BaseEvaluator subclass."
+        )
+    def use(self, evaluator: Union[str, BaseEvaluator, Type[BaseEvaluator]]) -> None:
+        """Replace the active evaluator."""
+        self._evaluator = self._resolve_evaluator(evaluator)
+    def evaluate(self, response: str, expected: Any, **kwargs) -> EvalResult:
+        """Evaluate one response, defaulting `task_name` to the rotator's task name."""
+        kwargs.setdefault("task_name", self._task_name)
+        return self._evaluator.evaluate(response, expected, **kwargs)
+    def evaluate_batch(
+        self, responses: Sequence[str], expected_answers: Sequence[Any], **kwargs
+    ) -> List[EvalResult]:
+        """Evaluate many responses, defaulting `task_name` to the rotator's task name."""
+        kwargs.setdefault("task_name", self._task_name)
+        return self._evaluator.evaluate_batch(responses, expected_answers, **kwargs)
+if __name__ == "__main__":
+    # Smoke test: discover the bundled evaluators and print what got registered.
+    # EvaluatorRotator is already defined in this module, so it is not re-imported
+    # by bare name (that only worked when run from this file's own directory).
+    rot = EvaluatorRotator(
+        evaluators_location="wisent.core.evaluators.oracles",  # << no leading slash
+        autoload=True,
+    )
+    print("Available evaluators:")
+    for ev in rot.list_evaluators():
+        print(f" - {ev['name']}: {ev['description']} (tasks: {', '.join(ev['task_names'])})")
+    # Example usage:
+    # rot.use("nlp")
+    # res = rot.evaluate("The answer is probably 42", expected="The answer is 12")
+    # print(res)

wisent/cli/steering_methods/__init__.py ADDED Viewed

File without changes

wisent 0.1.1__py3-none-any.whl → 0.5.2__py3-none-any.whl

Potentially problematic release.

wisent 0.1.1py3-none-any.whl → 0.5.2py3-none-any.whl