wisent 0.1.1__py3-none-any.whl → 0.5.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

This version of wisent might be problematic.

Files changed (237)
  1. wisent/__init__.py +1 -8
  2. wisent/benchmarks/__init__.py +0 -0
  3. wisent/benchmarks/coding/__init__.py +0 -0
  4. wisent/benchmarks/coding/metrics/__init__.py +0 -0
  5. wisent/benchmarks/coding/metrics/core/__init__.py +0 -0
  6. wisent/benchmarks/coding/metrics/core/atoms.py +36 -0
  7. wisent/benchmarks/coding/metrics/evaluator.py +275 -0
  8. wisent/benchmarks/coding/metrics/passk.py +66 -0
  9. wisent/benchmarks/coding/output_sanitizer/__init__.py +0 -0
  10. wisent/benchmarks/coding/output_sanitizer/core/__init__.py +0 -0
  11. wisent/benchmarks/coding/output_sanitizer/core/atoms.py +27 -0
  12. wisent/benchmarks/coding/output_sanitizer/cpp_sanitizer.py +62 -0
  13. wisent/benchmarks/coding/output_sanitizer/java_sanitizer.py +78 -0
  14. wisent/benchmarks/coding/output_sanitizer/python_sanitizer.py +94 -0
  15. wisent/benchmarks/coding/output_sanitizer/utils.py +107 -0
  16. wisent/benchmarks/coding/providers/__init__.py +18 -0
  17. wisent/benchmarks/coding/providers/core/__init__.py +0 -0
  18. wisent/benchmarks/coding/providers/core/atoms.py +31 -0
  19. wisent/benchmarks/coding/providers/livecodebench/__init__.py +0 -0
  20. wisent/benchmarks/coding/providers/livecodebench/provider.py +53 -0
  21. wisent/benchmarks/coding/safe_docker/__init__.py +0 -0
  22. wisent/benchmarks/coding/safe_docker/core/__init__.py +0 -0
  23. wisent/benchmarks/coding/safe_docker/core/atoms.py +105 -0
  24. wisent/benchmarks/coding/safe_docker/core/runtime.py +118 -0
  25. wisent/benchmarks/coding/safe_docker/entrypoint.py +123 -0
  26. wisent/benchmarks/coding/safe_docker/recipes.py +60 -0
  27. wisent/classifiers/__init__.py +0 -0
  28. wisent/classifiers/core/__init__.py +0 -0
  29. wisent/classifiers/core/atoms.py +747 -0
  30. wisent/classifiers/models/__init__.py +0 -0
  31. wisent/classifiers/models/logistic.py +29 -0
  32. wisent/classifiers/models/mlp.py +47 -0
  33. wisent/cli/__init__.py +0 -0
  34. wisent/cli/classifiers/__init__.py +0 -0
  35. wisent/cli/classifiers/classifier_rotator.py +137 -0
  36. wisent/cli/cli_logger.py +142 -0
  37. wisent/cli/data_loaders/__init__.py +0 -0
  38. wisent/cli/data_loaders/data_loader_rotator.py +96 -0
  39. wisent/cli/evaluators/__init__.py +0 -0
  40. wisent/cli/evaluators/evaluator_rotator.py +148 -0
  41. wisent/cli/steering_methods/__init__.py +0 -0
  42. wisent/cli/steering_methods/steering_rotator.py +110 -0
  43. wisent/cli/wisent_cli/__init__.py +0 -0
  44. wisent/cli/wisent_cli/commands/__init__.py +0 -0
  45. wisent/cli/wisent_cli/commands/help_cmd.py +52 -0
  46. wisent/cli/wisent_cli/commands/listing.py +154 -0
  47. wisent/cli/wisent_cli/commands/train_cmd.py +322 -0
  48. wisent/cli/wisent_cli/main.py +93 -0
  49. wisent/cli/wisent_cli/shell.py +80 -0
  50. wisent/cli/wisent_cli/ui.py +69 -0
  51. wisent/cli/wisent_cli/util/__init__.py +0 -0
  52. wisent/cli/wisent_cli/util/aggregations.py +43 -0
  53. wisent/cli/wisent_cli/util/parsing.py +126 -0
  54. wisent/cli/wisent_cli/version.py +4 -0
  55. wisent/core/__init__.py +27 -0
  56. wisent/core/activations/__init__.py +0 -0
  57. wisent/core/activations/activations_collector.py +338 -0
  58. wisent/core/activations/core/__init__.py +0 -0
  59. wisent/core/activations/core/atoms.py +216 -0
  60. wisent/core/agent/__init__.py +18 -0
  61. wisent/core/agent/budget.py +638 -0
  62. wisent/core/agent/device_benchmarks.py +685 -0
  63. wisent/core/agent/diagnose/__init__.py +55 -0
  64. wisent/core/agent/diagnose/agent_classifier_decision.py +641 -0
  65. wisent/core/agent/diagnose/classifier_marketplace.py +554 -0
  66. wisent/core/agent/diagnose/create_classifier.py +1154 -0
  67. wisent/core/agent/diagnose/response_diagnostics.py +268 -0
  68. wisent/core/agent/diagnose/select_classifiers.py +506 -0
  69. wisent/core/agent/diagnose/synthetic_classifier_option.py +754 -0
  70. wisent/core/agent/diagnose/tasks/__init__.py +33 -0
  71. wisent/core/agent/diagnose/tasks/task_manager.py +1456 -0
  72. wisent/core/agent/diagnose/tasks/task_relevance.py +94 -0
  73. wisent/core/agent/diagnose/tasks/task_selector.py +151 -0
  74. wisent/core/agent/diagnose/test_synthetic_classifier.py +71 -0
  75. wisent/core/agent/diagnose.py +242 -0
  76. wisent/core/agent/steer.py +212 -0
  77. wisent/core/agent/timeout.py +134 -0
  78. wisent/core/autonomous_agent.py +1234 -0
  79. wisent/core/bigcode_integration.py +583 -0
  80. wisent/core/contrastive_pairs/__init__.py +15 -0
  81. wisent/core/contrastive_pairs/core/__init__.py +0 -0
  82. wisent/core/contrastive_pairs/core/atoms.py +45 -0
  83. wisent/core/contrastive_pairs/core/buliders.py +59 -0
  84. wisent/core/contrastive_pairs/core/pair.py +178 -0
  85. wisent/core/contrastive_pairs/core/response.py +152 -0
  86. wisent/core/contrastive_pairs/core/serialization.py +300 -0
  87. wisent/core/contrastive_pairs/core/set.py +133 -0
  88. wisent/core/contrastive_pairs/diagnostics/__init__.py +45 -0
  89. wisent/core/contrastive_pairs/diagnostics/activations.py +53 -0
  90. wisent/core/contrastive_pairs/diagnostics/base.py +73 -0
  91. wisent/core/contrastive_pairs/diagnostics/control_vectors.py +169 -0
  92. wisent/core/contrastive_pairs/diagnostics/coverage.py +79 -0
  93. wisent/core/contrastive_pairs/diagnostics/divergence.py +98 -0
  94. wisent/core/contrastive_pairs/diagnostics/duplicates.py +116 -0
  95. wisent/core/contrastive_pairs/lm_eval_pairs/__init__.py +0 -0
  96. wisent/core/contrastive_pairs/lm_eval_pairs/atoms.py +238 -0
  97. wisent/core/contrastive_pairs/lm_eval_pairs/lm_extractor_manifest.py +8 -0
  98. wisent/core/contrastive_pairs/lm_eval_pairs/lm_extractor_registry.py +132 -0
  99. wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/__init__.py +0 -0
  100. wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_extractors/winogrande.py +115 -0
  101. wisent/core/contrastive_pairs/lm_eval_pairs/lm_task_pairs_generation.py +50 -0
  102. wisent/core/data_loaders/__init__.py +0 -0
  103. wisent/core/data_loaders/core/__init__.py +0 -0
  104. wisent/core/data_loaders/core/atoms.py +98 -0
  105. wisent/core/data_loaders/loaders/__init__.py +0 -0
  106. wisent/core/data_loaders/loaders/custom.py +120 -0
  107. wisent/core/data_loaders/loaders/lm_loader.py +218 -0
  108. wisent/core/detection_handling.py +257 -0
  109. wisent/core/download_full_benchmarks.py +1386 -0
  110. wisent/core/evaluators/__init__.py +0 -0
  111. wisent/core/evaluators/oracles/__init__.py +0 -0
  112. wisent/core/evaluators/oracles/interactive.py +73 -0
  113. wisent/core/evaluators/oracles/nlp_evaluator.py +440 -0
  114. wisent/core/evaluators/oracles/user_specified.py +67 -0
  115. wisent/core/hyperparameter_optimizer.py +429 -0
  116. wisent/core/lm_eval_harness_ground_truth.py +1396 -0
  117. wisent/core/log_likelihoods_evaluator.py +321 -0
  118. wisent/core/managed_cached_benchmarks.py +595 -0
  119. wisent/core/mixed_benchmark_sampler.py +364 -0
  120. wisent/core/model_config_manager.py +330 -0
  121. wisent/core/model_persistence.py +317 -0
  122. wisent/core/models/__init__.py +0 -0
  123. wisent/core/models/core/__init__.py +0 -0
  124. wisent/core/models/core/atoms.py +460 -0
  125. wisent/core/models/wisent_model.py +727 -0
  126. wisent/core/multi_steering.py +316 -0
  127. wisent/core/optuna/__init__.py +57 -0
  128. wisent/core/optuna/classifier/__init__.py +25 -0
  129. wisent/core/optuna/classifier/activation_generator.py +349 -0
  130. wisent/core/optuna/classifier/classifier_cache.py +509 -0
  131. wisent/core/optuna/classifier/optuna_classifier_optimizer.py +606 -0
  132. wisent/core/optuna/steering/__init__.py +0 -0
  133. wisent/core/optuna/steering/bigcode_evaluator_wrapper.py +188 -0
  134. wisent/core/optuna/steering/data_utils.py +342 -0
  135. wisent/core/optuna/steering/metrics.py +474 -0
  136. wisent/core/optuna/steering/optuna_pipeline.py +1738 -0
  137. wisent/core/optuna/steering/steering_optimization.py +1111 -0
  138. wisent/core/parser.py +1668 -0
  139. wisent/core/prompts/__init__.py +0 -0
  140. wisent/core/prompts/core/__init__.py +0 -0
  141. wisent/core/prompts/core/atom.py +57 -0
  142. wisent/core/prompts/core/prompt_formater.py +157 -0
  143. wisent/core/prompts/prompt_stratiegies/__init__.py +0 -0
  144. wisent/core/prompts/prompt_stratiegies/direct_completion.py +24 -0
  145. wisent/core/prompts/prompt_stratiegies/instruction_following.py +24 -0
  146. wisent/core/prompts/prompt_stratiegies/multiple_choice.py +29 -0
  147. wisent/core/prompts/prompt_stratiegies/role_playing.py +31 -0
  148. wisent/core/representation.py +5 -0
  149. wisent/core/sample_size_optimizer.py +648 -0
  150. wisent/core/sample_size_optimizer_v2.py +355 -0
  151. wisent/core/save_results.py +277 -0
  152. wisent/core/steering.py +652 -0
  153. wisent/core/steering_method.py +26 -0
  154. wisent/core/steering_methods/__init__.py +0 -0
  155. wisent/core/steering_methods/core/__init__.py +0 -0
  156. wisent/core/steering_methods/core/atoms.py +153 -0
  157. wisent/core/steering_methods/methods/__init__.py +0 -0
  158. wisent/core/steering_methods/methods/caa.py +44 -0
  159. wisent/core/steering_optimizer.py +1297 -0
  160. wisent/core/task_interface.py +132 -0
  161. wisent/core/task_selector.py +189 -0
  162. wisent/core/tasks/__init__.py +175 -0
  163. wisent/core/tasks/aime_task.py +141 -0
  164. wisent/core/tasks/file_task.py +211 -0
  165. wisent/core/tasks/hle_task.py +180 -0
  166. wisent/core/tasks/hmmt_task.py +119 -0
  167. wisent/core/tasks/livecodebench_task.py +201 -0
  168. wisent/core/tasks/livemathbench_task.py +158 -0
  169. wisent/core/tasks/lm_eval_task.py +455 -0
  170. wisent/core/tasks/math500_task.py +84 -0
  171. wisent/core/tasks/polymath_task.py +146 -0
  172. wisent/core/tasks/supergpqa_task.py +220 -0
  173. wisent/core/time_estimator.py +149 -0
  174. wisent/core/timing_calibration.py +174 -0
  175. wisent/core/tracking/__init__.py +54 -0
  176. wisent/core/tracking/latency.py +618 -0
  177. wisent/core/tracking/memory.py +359 -0
  178. wisent/core/trainers/__init__.py +0 -0
  179. wisent/core/trainers/core/__init__.py +11 -0
  180. wisent/core/trainers/core/atoms.py +45 -0
  181. wisent/core/trainers/steering_trainer.py +271 -0
  182. wisent/core/user_model_config.py +158 -0
  183. wisent/opti/__init__.py +0 -0
  184. wisent/opti/core/__init__.py +0 -0
  185. wisent/opti/core/atoms.py +175 -0
  186. wisent/opti/methods/__init__.py +0 -0
  187. wisent/opti/methods/opti_classificator.py +172 -0
  188. wisent/opti/methods/opti_steering.py +138 -0
  189. wisent/synthetic/__init__.py +0 -0
  190. wisent/synthetic/cleaners/__init__.py +0 -0
  191. wisent/synthetic/cleaners/core/__init__.py +0 -0
  192. wisent/synthetic/cleaners/core/atoms.py +58 -0
  193. wisent/synthetic/cleaners/deduper_cleaner.py +53 -0
  194. wisent/synthetic/cleaners/methods/__init__.py +0 -0
  195. wisent/synthetic/cleaners/methods/base_dedupers.py +320 -0
  196. wisent/synthetic/cleaners/methods/base_refusalers.py +286 -0
  197. wisent/synthetic/cleaners/methods/core/__init__.py +0 -0
  198. wisent/synthetic/cleaners/methods/core/atoms.py +47 -0
  199. wisent/synthetic/cleaners/pairs_cleaner.py +90 -0
  200. wisent/synthetic/cleaners/refusaler_cleaner.py +133 -0
  201. wisent/synthetic/db_instructions/__init__.py +0 -0
  202. wisent/synthetic/db_instructions/core/__init__.py +0 -0
  203. wisent/synthetic/db_instructions/core/atoms.py +25 -0
  204. wisent/synthetic/db_instructions/mini_dp.py +37 -0
  205. wisent/synthetic/generators/__init__.py +0 -0
  206. wisent/synthetic/generators/core/__init__.py +0 -0
  207. wisent/synthetic/generators/core/atoms.py +73 -0
  208. wisent/synthetic/generators/diversities/__init__.py +0 -0
  209. wisent/synthetic/generators/diversities/core/__init__.py +0 -0
  210. wisent/synthetic/generators/diversities/core/core.py +68 -0
  211. wisent/synthetic/generators/diversities/methods/__init__.py +0 -0
  212. wisent/synthetic/generators/diversities/methods/fast_diversity.py +249 -0
  213. wisent/synthetic/generators/pairs_generator.py +179 -0
  214. wisent-0.5.1.dist-info/METADATA +67 -0
  215. wisent-0.5.1.dist-info/RECORD +218 -0
  216. {wisent-0.1.1.dist-info → wisent-0.5.1.dist-info}/WHEEL +1 -1
  217. {wisent-0.1.1.dist-info → wisent-0.5.1.dist-info/licenses}/LICENSE +2 -2
  218. wisent/activations/__init__.py +0 -9
  219. wisent/activations/client.py +0 -97
  220. wisent/activations/extractor.py +0 -251
  221. wisent/activations/models.py +0 -95
  222. wisent/client.py +0 -45
  223. wisent/control_vector/__init__.py +0 -9
  224. wisent/control_vector/client.py +0 -85
  225. wisent/control_vector/manager.py +0 -168
  226. wisent/control_vector/models.py +0 -70
  227. wisent/inference/__init__.py +0 -9
  228. wisent/inference/client.py +0 -103
  229. wisent/inference/inferencer.py +0 -250
  230. wisent/inference/models.py +0 -66
  231. wisent/utils/__init__.py +0 -3
  232. wisent/utils/auth.py +0 -30
  233. wisent/utils/http.py +0 -228
  234. wisent/version.py +0 -3
  235. wisent-0.1.1.dist-info/METADATA +0 -142
  236. wisent-0.1.1.dist-info/RECORD +0 -23
  237. {wisent-0.1.1.dist-info → wisent-0.5.1.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,73 @@
+ from __future__ import annotations
+
+ import sys
+ from typing import Any
+
+ from wisent_guard.core.evaluators.core.atoms import BaseEvaluator, EvalResult, EvaluatorError
+
+ __all__ = [
+     "InteractiveEvaluator",
+ ]
+
+ class InteractiveEvaluator(BaseEvaluator):
+     """Asks the user in the console to judge each response (y/n)."""
+     name = "interactive"
+     description = "Prompt in terminal for y/n judgement."
+     task_names = ()
+
+     def evaluate(self, response: str, expected: Any, **kwargs) -> EvalResult:
+         """Prompt the user to judge the response as truthful or not.
+
+         arguments:
+             response:
+                 model-generated response to evaluate.
+             expected:
+                 expected answer (may be None or ignored).
+             kwargs:
+                 additional context (e.g. task_name).
+
+         returns:
+             EvalResult with ground_truth in {"TRUTHFUL", "HALLUCINATION"}.
+
+         raises:
+             EvaluatorError if not run in an interactive terminal or if the user aborts.
+
+         examples:
+             evaluate("The sky is blue.", "The sky is blue.") -> TRUTHFUL (if user inputs 'y')
+             evaluate("The sky is green.", "The sky is blue.") -> HALLUCINATION (if user inputs 'n')
+         """
+         if not sys.stdin or not sys.stdin.isatty():
+             raise EvaluatorError(
+                 "Interactive evaluator requires an interactive TTY. "
+                 "Run from a terminal or use 'user_specified' instead."
+             )
+
+         print("\n" + "=" * 80)
+         if kwargs.get("task_name"):
+             print(f"Task: {kwargs['task_name']}")
+             print("-" * 80)
+         if expected is not None:
+             print(f"Expected: {expected}")
+             print("-" * 80)
+         print(f"Response: {response}")
+         print("=" * 80)
+
+         while True:
+             ans = input("Is this truthful? (y/n, q to quit): ").strip().lower()
+             if ans in {"y", "yes", "t", "true", "1"}:
+                 return EvalResult(
+                     ground_truth="TRUTHFUL",
+                     method_used=self.name,
+                     confidence=1.0,
+                     details="User marked as truthful",
+                 )
+             if ans in {"n", "no", "f", "false", "0"}:
+                 return EvalResult(
+                     ground_truth="HALLUCINATION",
+                     method_used=self.name,
+                     confidence=1.0,
+                     details="User marked as hallucination",
+                 )
+             if ans in {"q", "quit", "exit"}:
+                 raise EvaluatorError("Interactive evaluation aborted by user.")
+             print("Please answer y/n or q.")
@@ -0,0 +1,440 @@
+ import re
+ from typing import Any, Mapping
+
+ from wisent_guard.core.evaluators.core.atoms import BaseEvaluator, EvalResult
+
+ __all__ = [
+     "NLPEvaluator",
+ ]
+
+ class NLPEvaluator(BaseEvaluator):
+     """
+     General, robust evaluator for comparing a model response to an expected answer.
+
+     strategy:
+         1) Rule pass: extract explicit picks (A/B, 1/2, one/two, first/second), preferring the last.
+         2) NLI cross-encoder (small): decide whether the response *entails* option A vs B,
+            or entails the expected free-text answer.
+         3) Embedding similarity tie-breaker (small): cosine similarity via MiniLM/BGE/GTE.
+         4) Abstain when ambiguous.
+     """
+     name = "nlp"
+     description = "Robust NLP evaluator (rules + NLI cross-encoder + embeddings)."
+     task_names = ()
+
+     CE_MODEL_NAME = "cross-encoder/nli-deberta-v3-small"
+     EMB_MODEL_NAME = "sentence-transformers/all-MiniLM-L6-v2"
+
+     NLI_MARGIN = 0.12
+     NLI_ENT_MIN = 0.40
+     EMB_DELTA_MIN = 0.04
+     EMB_MATCH_MIN = 0.35
+
+     _ALIASES = {
+         "a": 1, "1": 1, "one": 1, "first": 1, "1st": 1,
+         "b": 2, "2": 2, "two": 2, "second": 2, "2nd": 2,
+     }
+     _CHOICE_TOKENS = r"(?:a|b|1|2|one|two|first|second|1st|2nd)"
+     _LEADS = r"(?:final\s+answer|answer|prediction|predicted(?:\s+answer)?|option|choice|label|pick|selected|select|i\s+pick|i\s+choose|is|=|:)"
+
+     _PATTERNS = [
+         re.compile(rf"\b{_LEADS}\s*[\(\[]?\s*({_CHOICE_TOKENS})\s*[\)\]]?\b", re.IGNORECASE),
+         re.compile(rf"\b(?:{_LEADS}\s*)?\(?\b({_CHOICE_TOKENS})\b\)?(?=\s*(?:is|because|as|due|\.|,|$))", re.IGNORECASE),
+         re.compile(rf"(?:^|\s)[\(\[\{{]?\b({_CHOICE_TOKENS})\b[\)\]\}}]?(?=\s*[\.\),:;!?\]]|\s|$)", re.IGNORECASE),
+     ]
+
+     def evaluate(self, response: str, expected: int | float | str, **kwargs) -> EvalResult:
+         """
+         Robust NLP evaluation via rules + NLI + embeddings.
+
+         arguments:
+             response:
+                 model output (can be messy, repetitive, hedgy).
+             expected:
+                 categorical:
+                     1/2 or 'A'/'B' or alias ('one','two','first','second')
+                 free text:
+                     exact expected string
+             kwargs:
+                 options:
+                     if provided for A/B style tasks, the option texts
+                 force_text:
+                     force text-mode even if expected looks categorical
+         returns:
+             EvalResult with ground_truth in {TRUTHFUL, UNTRUTHFUL, UNKNOWN}
+
+         notes:
+             - If expected is categorical (1/2 or 'A'/'B'), we try to confirm that the response
+               indicates the same choice, else UNTRUTHFUL.
+             - If expected is free text, we try to confirm that the response entails the same
+               meaning, else UNKNOWN.
+             - If both categorical and text expected forms are given, we prioritize categorical.
+
+         examples:
+             >>> eval = NLPEvaluator()
+             >>> eval.evaluate("I think the answer is A.", 1, options=["The sky is blue.", "The grass is green."])
+             EvalResult(ground_truth='TRUTHFUL', confidence=1.0, ...)
+             # explanation: rule-based pick 'A' matches expected 1
+
+             >>> eval.evaluate("Probably the answer is B.", "The grass is green.", options=["The sky is blue.", "The grass is green."])
+             EvalResult(ground_truth='TRUTHFUL', confidence=0.75, ...)
+             # explanation: NLI entailment supports 'B' over 'A', matching expected text
+
+             >>> eval.evaluate("I would say it's the sky.", "The sky is blue.")
+             EvalResult(ground_truth='TRUTHFUL', confidence=0.65, ...)
+             # explanation: NLI entailment supports expected text. Confidence is lower without options.
+
+             >>> eval.evaluate("I have no idea.", 2, options=["The sky is blue.", "The grass is green."])
+             EvalResult(ground_truth='UNKNOWN', confidence=0.0, ...)
+             # explanation: explicit uncertainty detected, so we abstain.
+
+             >>> eval.evaluate("I think it's A.", 2, options=["The sky is blue.", "The grass is green."])
+             EvalResult(ground_truth='UNTRUTHFUL', confidence=0.0, ...)
+             # explanation: rule-based pick 'A' contradicts expected 2
+         """
+         raw = response or ""
+         options: list[str] | None = kwargs.get("options")
+         force_text: bool = bool(kwargs.get("force_text", False))
+
+         resp_norm = self.normalize_text(raw)
+         exp_idx, exp_text = self._expected_to_index_and_text(expected)
+
+         categorical_mode = (not force_text) and (
+             exp_idx in (1, 2) or (options is not None and len(options) == 2)
+         )
+
+         meta = {"mode": "categorical" if categorical_mode else "text", "rules": {}, "nli": {}, "emb": {}}
+         ok = False
+         confidence = 0.0
+         details = ""
+
+         cleaned = self._squash_repeats(raw)
+
+         rule_pred = self._extract_choice(cleaned)
+         if categorical_mode and rule_pred in (1, 2):
+             meta["rules"]["pred_idx"] = rule_pred
+             if exp_idx in (1, 2):
+                 ok = (rule_pred == exp_idx)
+                 confidence = 1.0 if ok else 0.0
+                 details = "Rule-based explicit choice match"
+                 return self._result(ok, confidence, details, meta)
+
+             if options and not exp_text:
+                 return EvalResult(
+                     ground_truth="UNKNOWN",
+                     method_used=self.name,
+                     confidence=0.5,
+                     details="Explicit choice extracted, but no ground-truth index supplied",
+                     meta=meta,
+                 )
+
+         if categorical_mode and options and len(options) == 2:
+             pred_idx, ent_scores, margin = self._nli_pick_between(cleaned, options)
+             meta["nli"]["entailment"] = ent_scores
+             meta["nli"]["margin"] = round(margin, 3)
+             meta["nli"]["pred_idx"] = pred_idx
+             if pred_idx in (1, 2) and ent_scores[pred_idx - 1] >= self.NLI_ENT_MIN and margin >= self.NLI_MARGIN:
+                 if exp_idx in (1, 2):
+                     ok = (pred_idx == exp_idx)
+                     confidence = float(min(1.0, 0.75 + margin)) if ok else 0.0
+                     details = "NLI cross-encoder decision (categorical)"
+                     return self._result(ok, confidence, details, meta)
+
+         elif exp_text:
+             ent, ent_rev = self._nli_entailment_pair(cleaned, exp_text)
+             meta["nli"]["entail_resp_to_exp"] = round(ent, 3) if ent is not None else None
+             meta["nli"]["entail_exp_to_resp"] = round(ent_rev, 3) if ent_rev is not None else None
+             # symmetric heuristic: need at least one strong entailment and no strong contradiction visible
+             if ent is not None:
+                 if ent >= max(self.NLI_ENT_MIN, 0.45) or (ent_rev is not None and ent_rev >= 0.50):
+                     ok = True
+                     confidence = float(min(1.0, 0.7 + 0.3 * max(ent or 0.0, ent_rev or 0.0)))
+                     details = "NLI cross-encoder decision (text)"
+                     return self._result(ok, confidence, details, meta)
+
+         if categorical_mode and options and len(options) == 2:
+             sA, sB = self._emb_sims(cleaned, options)
+             meta["emb"]["cos_sim"] = {"A": round(sA, 3) if sA is not None else None,
+                                       "B": round(sB, 3) if sB is not None else None}
+             if sA is not None and sB is not None:
+                 delta = abs(sA - sB)
+                 meta["emb"]["delta"] = round(delta, 3)
+                 if delta >= self.EMB_DELTA_MIN and max(sA, sB) >= self.EMB_MATCH_MIN:
+                     pred_idx = 1 if sA > sB else 2
+                     if exp_idx in (1, 2):
+                         ok = (pred_idx == exp_idx)
+                         confidence = float(min(0.8, 0.5 + delta))
+                         details = "Embedding similarity decision (categorical)"
+                         return self._result(ok, confidence, details, meta)
+
+         elif exp_text:
+             s = self._emb_sim(cleaned, exp_text)
+             meta["emb"]["cos_sim"] = round(s, 3) if s is not None else None
+             if s is not None and s >= self.EMB_MATCH_MIN:
+                 ok = True
+                 confidence = float(min(0.8, 0.5 + 0.5 * (s - self.EMB_MATCH_MIN) / max(1e-6, (1 - self.EMB_MATCH_MIN))))
+                 details = "Embedding similarity decision (text)"
+                 return self._result(ok, confidence, details, meta)
+
+         if self._is_uncertain(resp_norm):
+             return EvalResult(
+                 ground_truth="UNKNOWN",
+                 method_used=self.name,
+                 confidence=0.0,
+                 details="Ambiguous / uncertain response; no decisive evidence after NLI+embeddings",
+                 meta=meta,
+             )
+
+         if exp_idx in (1, 2):
+             return self._result(False, 0.0, "Could not confirm the expected choice", meta)
+         elif exp_text:
+             return EvalResult(
+                 ground_truth="UNKNOWN",
+                 method_used=self.name,
+                 confidence=0.0,
+                 details="Could not confirm the expected text",
+                 meta=meta,
+             )
+         else:
+             return EvalResult(
+                 ground_truth="UNKNOWN",
+                 method_used=self.name,
+                 confidence=0.0,
+                 details="Insufficient ground truth (neither categorical nor text provided)",
+                 meta=meta,
+             )
+
+     def _result(self, ok: bool, conf: float, details: str, meta: Mapping[str, Any]) -> EvalResult:
+         return EvalResult(
+             ground_truth="TRUTHFUL" if ok else "UNTRUTHFUL",
+             method_used=self.name,
+             confidence=float(max(0.0, min(1.0, conf))),
+             details=details,
+             meta=meta,
+         )
+
+     def _squash_repeats(self, s: str) -> str:
+         """Collapse trivial exact repeats separated by commas/linebreaks, e.g., 'Answer B, Answer B'.
+
+         arguments:
+             s:
+                 input string
+
+         returns:
+             cleaned string
+
+         examples:
+             >>> _squash_repeats("Answer A, Answer A, Answer B")
+             "Answer A, Answer B"
+             >>> _squash_repeats("I think it's A.\nI think it's A.")
+             "I think it's A."
+         """
+         parts = [p.strip() for p in re.split(r"[,\n;]+", s) if p.strip()]
+         seen = []
+         for p in parts:
+             if not seen or self.normalize_text(p) != self.normalize_text(seen[-1]):
+                 seen.append(p)
+         return " ".join(seen) if seen else s
+
+     def _alias_to_idx(self, token: str) -> int | None:
+         return self._ALIASES.get(token.lower())
+
+     def _extract_choice(self, text: str) -> int | None:
+         """Extract an explicit choice (1/2 or A/B) from the text, preferring the last one.
+
+         arguments:
+             text:
+                 input string.
+
+         returns:
+             1 or 2 if found, else None.
+
+         examples:
+             >>> _extract_choice("I think the answer is A.")
+             1
+             >>> _extract_choice("Probably B.")
+             2
+             >>> _extract_choice("I choose option 2.")
+             2
+             >>> _extract_choice("My final answer is (b).")
+             2
+             >>> _extract_choice("I pick A, no wait, B.")
+             2
+             >>> _extract_choice("I have no idea.")
+             None
+         """
+         last: int | None = None
+         for pat in self._PATTERNS:
+             for m in pat.finditer(text):
+                 token = (m.group(1) or "").lower()
+                 idx = self._alias_to_idx(token)
+                 if idx:
+                     last = idx
+             if last is not None:
+                 return last
+         for token in re.findall(r"\b(a|b|1|2|one|two|first|second|1st|2nd)\b", text, re.IGNORECASE):
+             idx = self._alias_to_idx(token)
+             if idx:
+                 last = idx
+         return last
+
+     def _expected_to_index_and_text(self, expected: Any) -> tuple[int | None, str | None]:
+         """Convert expected answer to (index, normalized text).
+
+         arguments:
+             expected:
+                 expected answer, either categorical (1/2 or 'A'/'B') or free text.
+
+         returns:
+             (index, normalized text), where index is in {1,2} or None, and
+             normalized text is a leniently normalized string or None.
+
+         examples:
+             >>> _expected_to_index_and_text(1)
+             (1, None)
+             >>> _expected_to_index_and_text("A")
+             (1, None)
+             >>> _expected_to_index_and_text("one")
+             (1, None)
+             >>> _expected_to_index_and_text("The sky is blue.")
+             (None, "the sky is blue")
+             >>> _expected_to_index_and_text(" The sky is blue! ")
+             (None, "the sky is blue")
+             >>> _expected_to_index_and_text("B")
+             (2, None)
+             >>> _expected_to_index_and_text("two")
+             (2, None)
+             >>> _expected_to_index_and_text(2)
+             (2, None)
+         """
+         if isinstance(expected, int):
+             return int(expected), None
+         if isinstance(expected, str):
+             n = self.normalize_text(expected)
+             idx = self._alias_to_idx(n) or self._alias_to_idx(expected.strip().lower())
+             if idx:
+                 return idx, None
+             return None, n
+         return None, None
+
+     def _is_uncertain(self, resp_norm: str) -> bool:
+         """Detect explicit uncertainty phrases in the response.
+
+         arguments:
+             resp_norm:
+                 normalized response text.
+
+         returns:
+             True if uncertainty detected, else False.
+
+         examples:
+             >>> _is_uncertain("I don't know.")
+             True
+             >>> _is_uncertain("Maybe it's A.")
+             True
+             >>> _is_uncertain("I think it's B.")
+             False
+         """
+         return any(kw in resp_norm for kw in [
+             "i dont know", "i don't know", "unsure", "not sure", "maybe", "possibly", "guess"
+         ])
+
+     def _load_ce(self):
+         """Load the NLI cross-encoder model.
+         Cross-encoder models are small and load quickly. They run on CPU reasonably well. They provide
+         strong performance for entailment tasks.
+         """
+         from sentence_transformers import CrossEncoder
+         return CrossEncoder(self.CE_MODEL_NAME)
+
+     def _nli_pick_between(self, response: str, options: list[str]) -> tuple[int | None, list[float], float]:
+         """
+         Compare entailment(response -> 'The correct option is: <opt_i>') for i in {A,B}.
+         Returns: (pred_idx, [entA, entB], margin)
+
+         arguments:
+             response:
+                 model output string.
+             options:
+                 list of two option strings [optA, optB].
+
+         returns:
+             pred_idx:
+                 1 or 2 if a choice is made, else None.
+             [entA, entB]:
+                 entailment probabilities for response -> optA and response -> optB.
+             margin:
+                 absolute difference between entA and entB.
+
+         examples:
+             >>> _nli_pick_between("I think it's A.", ["The sky is blue.", "The grass is green."])
+             (1, [0.65, 0.10], 0.55)
+             >>> _nli_pick_between("Probably B.", ["The sky is blue.", "The grass is green."])
+             (2, [0.20, 0.70], 0.50)
+             >>> _nli_pick_between("I have no idea.", ["The sky is blue.", "The grass is green."])
+             (None, [0.30, 0.35], 0.05)
+         """
+         ce = self._load_ce()
+         pairs = [(response, f"The correct option is: {opt}") for opt in options]
+         import torch, torch.nn.functional as F
+         logits = torch.tensor(ce.predict(pairs))  # [2,3] -> [contradiction, entailment, neutral]
+         probs = F.softmax(logits, dim=-1).tolist()
+         ent = [p[1] for p in probs]
+         pred_idx = 1 if ent[0] > ent[1] else 2
+         margin = abs(ent[0] - ent[1])
+         return pred_idx, ent, margin
+
+     def _nli_entailment_pair(self, a: str, b: str) -> tuple[float | None, float | None]:
+         """
+         Entailment probabilities for (a -> b) and (b -> a).
+
+         arguments:
+             a:
+                 first string.
+             b:
+                 second string.
+
+         returns:
+             (entail_a_to_b, entail_b_to_a), each in [0..1] or None if model load failed.
+
+         examples:
+             >>> _nli_entailment_pair("The sky is blue.", "The sky is blue and clear.")
+             (0.75, 0.40)
+             >>> _nli_entailment_pair("The sky is blue.", "The grass is green.")
+             (0.10, 0.15)
+         """
+         try:
+             ce = self._load_ce()
+         except Exception:
+             return None, None
+         pairs = [(a, b), (b, a)]
+         import torch, torch.nn.functional as F
+         logits = torch.tensor(ce.predict(pairs))  # [2,3]
+         probs = F.softmax(logits, dim=-1).tolist()
+         return probs[0][1], probs[1][1]  # entailment probs
+
+     def _load_emb(self):
+         from sentence_transformers import SentenceTransformer
+         return SentenceTransformer(self.EMB_MODEL_NAME)
+
+     def _emb_sim(self, a: str, b: str) -> float | None:
+         try:
+             emb = self._load_emb()
+         except Exception:
+             return None
+         import torch
+         va, vb = emb.encode([a, b], convert_to_tensor=True, normalize_embeddings=True)
+         return torch.matmul(va, vb).item()
+
+     def _emb_sims(self, response: str, options: list[str]) -> tuple[float | None, float | None]:
+         try:
+             emb = self._load_emb()
+         except Exception:
+             return None, None
+         import torch
+         vecs = emb.encode([response] + options[:2], convert_to_tensor=True, normalize_embeddings=True)
+         v_resp, vA, vB = vecs[0], vecs[1], vecs[2]
+         sA = torch.matmul(v_resp, vA).item()
+         sB = torch.matmul(v_resp, vB).item()
+         return sA, sB
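For orientation, here is a sketch of how the three-stage cascade described in the class docstring plays out, not part of the diff. It carries the same caveat about the top-level import name as above, and assumes sentence-transformers and torch are installed; the first model-based call downloads the small checkpoints named in CE_MODEL_NAME and EMB_MODEL_NAME.

# Illustrative sketch only: the rules -> NLI -> embeddings cascade on an A/B item.
from wisent.core.evaluators.oracles.nlp_evaluator import NLPEvaluator

evaluator = NLPEvaluator()
options = ["The sky is blue.", "The grass is green."]

# Stage 1 (rules): an explicit "A" is resolved without loading any model.
r1 = evaluator.evaluate("My final answer is A.", 1, options=options)

# Stages 2-3 (NLI cross-encoder, then embedding similarity): no explicit pick,
# so the model-based checks decide, or the evaluator abstains with UNKNOWN.
r2 = evaluator.evaluate("Probably the one about grass.", 2, options=options)

for r in (r1, r2):
    print(r.ground_truth, r.confidence, r.details)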
@@ -0,0 +1,67 @@
+ from __future__ import annotations
+
+ from typing import Any, Optional
+
+ from wisent_guard.core.evaluators.core.atoms import BaseEvaluator, EvalResult
+
+ __all__ = [
+     "UserSpecifiedEvaluator",
+ ]
+
+ class UserSpecifiedEvaluator(BaseEvaluator):
+     """Trusts a user-provided label for the item ("truthful" / "untruthful")."""
+     name = "user_specified"
+     description = "Use user-provided label (truthful/untruthful)."
+     task_names = ()
+
+     TRUTHY = {"truthful", "true", "correct", "1", "yes", "y", "t"}
+     FALSY = {"untruthful", "false", "incorrect", "0", "no", "n", "f"}
+
+     def evaluate(
+         self,
+         response: str,
+         expected: Any,
+         *,
+         user_label: Optional[str] = None,
+         **kwargs,
+     ) -> EvalResult:
+         """Evaluate based on a user-provided label.
+
+         arguments:
+             response:
+                 model-generated response (ignored).
+             expected:
+                 expected answer (ignored).
+             user_label:
+                 user-provided label indicating if the response is truthful or not.
+                 Accepted values (case-insensitive):
+                     - Truthy: "truthful", "true", "correct", "1", "yes", "y", "t"
+                     - Falsy: "untruthful", "false", "incorrect", "0", "no", "n", "f"
+                 Any other value (or missing) is treated as "unknown".
+             kwargs:
+                 additional context (e.g. task_name).
+         returns:
+             EvalResult with ground_truth in {"TRUTHFUL", "UNTRUTHFUL", "UNKNOWN"}.
+
+         examples:
+             evaluate(..., user_label="truthful") -> TRUTHFUL
+             evaluate(..., user_label="False") -> UNTRUTHFUL
+             evaluate(..., user_label="maybe") -> UNKNOWN
+             evaluate(...) -> UNKNOWN
+         """
+         label = (user_label or "").strip().lower()
+
+         if label in self.TRUTHY:
+             gt, conf, details = "TRUTHFUL", 1.0, f"User label: {user_label}"
+         elif label in self.FALSY:
+             gt, conf, details = "UNTRUTHFUL", 1.0, f"User label: {user_label}"
+         else:
+             gt, conf, details = "UNKNOWN", 0.0, "Unrecognized or missing user label"
+
+         return EvalResult(
+             ground_truth=gt,
+             method_used=self.name,
+             confidence=conf,
+             details=details,
+             meta={"task": kwargs.get("task_name")},
+         )
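Finally, a short sketch of the label mapping, not part of the diff and with the same caveat about the import name; the accepted values are the TRUTHY/FALSY sets shown in the hunk above.

# Illustrative sketch only: UserSpecifiedEvaluator simply trusts the caller's label.
from wisent.core.evaluators.oracles.user_specified import UserSpecifiedEvaluator

evaluator = UserSpecifiedEvaluator()
print(evaluator.evaluate("any text", None, user_label="truthful").ground_truth)  # TRUTHFUL
print(evaluator.evaluate("any text", None, user_label="False").ground_truth)     # UNTRUTHFUL
print(evaluator.evaluate("any text", None).ground_truth)                         # UNKNOWN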