PyPI - agent_os_kernel - Versions diffs - 3.1.0__py3-none-any.whl - Mend

agent_os_kernel 3.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (337) hide show

agent_control_plane/__init__.py +662 -0
agent_control_plane/a2a_adapter.py +543 -0
agent_control_plane/adapter.py +417 -0
agent_control_plane/agent_hibernation.py +394 -0
agent_control_plane/agent_kernel.py +470 -0
agent_control_plane/compliance.py +720 -0
agent_control_plane/constraint_graphs.py +478 -0
agent_control_plane/control_plane.py +854 -0
agent_control_plane/example_executors.py +195 -0
agent_control_plane/execution_engine.py +231 -0
agent_control_plane/flight_recorder.py +846 -0
agent_control_plane/governance_layer.py +435 -0
agent_control_plane/hf_utils.py +563 -0
agent_control_plane/interfaces/__init__.py +55 -0
agent_control_plane/interfaces/kernel_interface.py +361 -0
agent_control_plane/interfaces/plugin_interface.py +497 -0
agent_control_plane/interfaces/protocol_interfaces.py +387 -0
agent_control_plane/kernel_space.py +1009 -0
agent_control_plane/langchain_adapter.py +424 -0
agent_control_plane/lifecycle.py +3113 -0
agent_control_plane/mcp_adapter.py +653 -0
agent_control_plane/ml_safety.py +563 -0
agent_control_plane/multimodal.py +727 -0
agent_control_plane/mute_agent.py +422 -0
agent_control_plane/observability.py +787 -0
agent_control_plane/orchestrator.py +482 -0
agent_control_plane/plugin_registry.py +750 -0
agent_control_plane/policy_engine.py +954 -0
agent_control_plane/process_isolation.py +777 -0
agent_control_plane/shadow_mode.py +310 -0
agent_control_plane/signals.py +493 -0
agent_control_plane/supervisor_agents.py +430 -0
agent_control_plane/time_travel_debugger.py +557 -0
agent_control_plane/tool_registry.py +452 -0
agent_control_plane/vfs.py +697 -0
agent_kernel/__init__.py +69 -0
agent_kernel/analyzer.py +435 -0
agent_kernel/auditor.py +36 -0
agent_kernel/completeness_auditor.py +237 -0
agent_kernel/detector.py +203 -0
agent_kernel/kernel.py +744 -0
agent_kernel/memory_manager.py +85 -0
agent_kernel/models.py +374 -0
agent_kernel/nudge_mechanism.py +263 -0
agent_kernel/outcome_analyzer.py +338 -0
agent_kernel/patcher.py +582 -0
agent_kernel/semantic_analyzer.py +316 -0
agent_kernel/semantic_purge.py +349 -0
agent_kernel/simulator.py +449 -0
agent_kernel/teacher.py +85 -0
agent_kernel/triage.py +152 -0
agent_os/__init__.py +409 -0
agent_os/_adversarial_impl.py +200 -0
agent_os/_circuit_breaker_impl.py +232 -0
agent_os/_mcp_metrics.py +193 -0
agent_os/adversarial.py +20 -0
agent_os/agents_compat.py +490 -0
agent_os/audit_logger.py +135 -0
agent_os/base_agent.py +651 -0
agent_os/circuit_breaker.py +34 -0
agent_os/cli/__init__.py +659 -0
agent_os/cli/cmd_audit.py +128 -0
agent_os/cli/cmd_init.py +152 -0
agent_os/cli/cmd_policy.py +41 -0
agent_os/cli/cmd_policy_gen.py +180 -0
agent_os/cli/cmd_validate.py +258 -0
agent_os/cli/mcp_scan.py +265 -0
agent_os/cli/output.py +192 -0
agent_os/cli/policy_checker.py +330 -0
agent_os/compat.py +74 -0
agent_os/constraint_graph.py +234 -0
agent_os/content_governance.py +140 -0
agent_os/context_budget.py +305 -0
agent_os/credential_redactor.py +224 -0
agent_os/diff_policy.py +89 -0
agent_os/egress_policy.py +159 -0
agent_os/escalation.py +276 -0
agent_os/event_bus.py +124 -0
agent_os/exceptions.py +180 -0
agent_os/execution_context_policy.py +141 -0
agent_os/github_enterprise.py +96 -0
agent_os/health.py +20 -0
agent_os/integrations/__init__.py +279 -0
agent_os/integrations/a2a_adapter.py +279 -0
agent_os/integrations/agent_lightning/__init__.py +30 -0
agent_os/integrations/anthropic_adapter.py +420 -0
agent_os/integrations/autogen_adapter.py +620 -0
agent_os/integrations/base.py +1137 -0
agent_os/integrations/compat.py +229 -0
agent_os/integrations/config.py +98 -0
agent_os/integrations/conversation_guardian.py +957 -0
agent_os/integrations/crewai_adapter.py +467 -0
agent_os/integrations/drift_detector.py +425 -0
agent_os/integrations/dry_run.py +124 -0
agent_os/integrations/escalation.py +582 -0
agent_os/integrations/gemini_adapter.py +364 -0
agent_os/integrations/google_adk_adapter.py +633 -0
agent_os/integrations/guardrails_adapter.py +394 -0
agent_os/integrations/health.py +197 -0
agent_os/integrations/langchain_adapter.py +654 -0
agent_os/integrations/llamafirewall.py +343 -0
agent_os/integrations/llamaindex_adapter.py +188 -0
agent_os/integrations/logging.py +191 -0
agent_os/integrations/maf_adapter.py +631 -0
agent_os/integrations/mistral_adapter.py +365 -0
agent_os/integrations/openai_adapter.py +816 -0
agent_os/integrations/openai_agents_sdk.py +406 -0
agent_os/integrations/policy_compose.py +171 -0
agent_os/integrations/profiling.py +144 -0
agent_os/integrations/pydantic_ai_adapter.py +420 -0
agent_os/integrations/rate_limiter.py +130 -0
agent_os/integrations/rbac.py +143 -0
agent_os/integrations/registry.py +113 -0
agent_os/integrations/scope_guard.py +303 -0
agent_os/integrations/semantic_kernel_adapter.py +769 -0
agent_os/integrations/smolagents_adapter.py +629 -0
agent_os/integrations/templates.py +178 -0
agent_os/integrations/token_budget.py +134 -0
agent_os/integrations/tool_aliases.py +190 -0
agent_os/integrations/webhooks.py +177 -0
agent_os/lite.py +208 -0
agent_os/mcp_gateway.py +385 -0
agent_os/mcp_message_signer.py +273 -0
agent_os/mcp_protocols.py +161 -0
agent_os/mcp_response_scanner.py +232 -0
agent_os/mcp_security.py +924 -0
agent_os/mcp_session_auth.py +231 -0
agent_os/mcp_sliding_rate_limiter.py +184 -0
agent_os/memory_guard.py +409 -0
agent_os/metrics.py +134 -0
agent_os/mute.py +428 -0
agent_os/mute_agent.py +209 -0
agent_os/policies/__init__.py +77 -0
agent_os/policies/async_evaluator.py +275 -0
agent_os/policies/backends.py +670 -0
agent_os/policies/bridge.py +169 -0
agent_os/policies/budget.py +85 -0
agent_os/policies/cli.py +294 -0
agent_os/policies/conflict_resolution.py +270 -0
agent_os/policies/data_classification.py +252 -0
agent_os/policies/evaluator.py +239 -0
agent_os/policies/policy_schema.json +228 -0
agent_os/policies/rate_limiting.py +145 -0
agent_os/policies/schema.py +115 -0
agent_os/policies/shared.py +331 -0
agent_os/prompt_injection.py +694 -0
agent_os/providers.py +182 -0
agent_os/py.typed +0 -0
agent_os/retry.py +81 -0
agent_os/reversibility.py +251 -0
agent_os/sandbox.py +432 -0
agent_os/sandbox_provider.py +140 -0
agent_os/secure_codegen.py +525 -0
agent_os/security_skills.py +538 -0
agent_os/semantic_policy.py +422 -0
agent_os/server/__init__.py +15 -0
agent_os/server/__main__.py +25 -0
agent_os/server/app.py +277 -0
agent_os/server/models.py +104 -0
agent_os/shift_left_metrics.py +130 -0
agent_os/stateless.py +742 -0
agent_os/supervisor.py +148 -0
agent_os/task_outcome.py +148 -0
agent_os/transparency.py +181 -0
agent_os/trust_root.py +128 -0
agent_os_kernel-3.1.0.dist-info/METADATA +1269 -0
agent_os_kernel-3.1.0.dist-info/RECORD +337 -0
agent_os_kernel-3.1.0.dist-info/WHEEL +4 -0
agent_os_kernel-3.1.0.dist-info/entry_points.txt +2 -0
agent_os_kernel-3.1.0.dist-info/licenses/LICENSE +21 -0
agent_os_observability/__init__.py +27 -0
agent_os_observability/dashboards.py +898 -0
agent_os_observability/metrics.py +398 -0
agent_os_observability/server.py +223 -0
agent_os_observability/tracer.py +232 -0
agent_primitives/__init__.py +24 -0
agent_primitives/failures.py +84 -0
agent_primitives/py.typed +0 -0
amb_core/__init__.py +177 -0
amb_core/adapters/__init__.py +57 -0
amb_core/adapters/aws_sqs_broker.py +376 -0
amb_core/adapters/azure_servicebus_broker.py +340 -0
amb_core/adapters/kafka_broker.py +260 -0
amb_core/adapters/nats_broker.py +285 -0
amb_core/adapters/rabbitmq_broker.py +235 -0
amb_core/adapters/redis_broker.py +262 -0
amb_core/broker.py +145 -0
amb_core/bus.py +481 -0
amb_core/cloudevents.py +509 -0
amb_core/dlq.py +345 -0
amb_core/hf_utils.py +536 -0
amb_core/memory_broker.py +410 -0
amb_core/models.py +141 -0
amb_core/persistence.py +529 -0
amb_core/schema.py +294 -0
amb_core/tracing.py +358 -0
atr/__init__.py +640 -0
atr/access.py +348 -0
atr/composition.py +645 -0
atr/decorator.py +357 -0
atr/executor.py +384 -0
atr/health.py +557 -0
atr/hf_utils.py +449 -0
atr/injection.py +422 -0
atr/metrics.py +440 -0
atr/policies.py +403 -0
atr/py.typed +2 -0
atr/registry.py +452 -0
atr/schema.py +480 -0
atr/tools/safe/__init__.py +75 -0
atr/tools/safe/calculator.py +467 -0
atr/tools/safe/datetime_tool.py +443 -0
atr/tools/safe/file_reader.py +402 -0
atr/tools/safe/http_client.py +316 -0
atr/tools/safe/json_parser.py +374 -0
atr/tools/safe/text_tool.py +537 -0
atr/tools/safe/toolkit.py +175 -0
caas/__init__.py +162 -0
caas/api/__init__.py +7 -0
caas/api/server.py +1328 -0
caas/caching.py +834 -0
caas/cli.py +210 -0
caas/conversation.py +223 -0
caas/decay.py +72 -0
caas/detection/__init__.py +9 -0
caas/detection/detector.py +238 -0
caas/enrichment.py +130 -0
caas/gateway/__init__.py +27 -0
caas/gateway/trust_gateway.py +474 -0
caas/hf_utils.py +479 -0
caas/ingestion/__init__.py +23 -0
caas/ingestion/processors.py +253 -0
caas/ingestion/structure_parser.py +188 -0
caas/models.py +356 -0
caas/pragmatic_truth.py +444 -0
caas/routing/__init__.py +10 -0
caas/routing/heuristic_router.py +58 -0
caas/storage/__init__.py +9 -0
caas/storage/store.py +389 -0
caas/triad.py +213 -0
caas/tuning/__init__.py +9 -0
caas/tuning/tuner.py +329 -0
caas/vfs/__init__.py +14 -0
caas/vfs/filesystem.py +452 -0
cmvk/__init__.py +218 -0
cmvk/audit.py +402 -0
cmvk/benchmarks.py +478 -0
cmvk/constitutional.py +904 -0
cmvk/hf_utils.py +301 -0
cmvk/metrics.py +473 -0
cmvk/profiles.py +300 -0
cmvk/py.typed +0 -0
cmvk/types.py +12 -0
cmvk/verification.py +956 -0
emk/__init__.py +89 -0
emk/causal.py +352 -0
emk/hf_utils.py +421 -0
emk/indexer.py +83 -0
emk/py.typed +0 -0
emk/schema.py +204 -0
emk/sleep_cycle.py +347 -0
emk/store.py +281 -0
iatp/__init__.py +166 -0
iatp/attestation.py +461 -0
iatp/cli.py +317 -0
iatp/hf_utils.py +472 -0
iatp/ipc_pipes.py +580 -0
iatp/main.py +412 -0
iatp/models/__init__.py +447 -0
iatp/policy_engine.py +337 -0
iatp/py.typed +2 -0
iatp/recovery.py +321 -0
iatp/security/__init__.py +270 -0
iatp/sidecar/__init__.py +519 -0
iatp/telemetry/__init__.py +164 -0
iatp/tests/__init__.py +1 -0
iatp/tests/test_attestation.py +370 -0
iatp/tests/test_cli.py +131 -0
iatp/tests/test_ed25519_attestation.py +211 -0
iatp/tests/test_models.py +130 -0
iatp/tests/test_policy_engine.py +347 -0
iatp/tests/test_recovery.py +281 -0
iatp/tests/test_security.py +222 -0
iatp/tests/test_sidecar.py +167 -0
iatp/tests/test_telemetry.py +175 -0
mcp_kernel_server/__init__.py +28 -0
mcp_kernel_server/cli.py +274 -0
mcp_kernel_server/resources.py +217 -0
mcp_kernel_server/server.py +564 -0
mcp_kernel_server/tools.py +1174 -0
mute_agent/__init__.py +68 -0
mute_agent/core/__init__.py +1 -0
mute_agent/core/execution_agent.py +166 -0
mute_agent/core/handshake_protocol.py +201 -0
mute_agent/core/reasoning_agent.py +238 -0
mute_agent/knowledge_graph/__init__.py +1 -0
mute_agent/knowledge_graph/graph_elements.py +65 -0
mute_agent/knowledge_graph/multidimensional_graph.py +170 -0
mute_agent/knowledge_graph/subgraph.py +224 -0
mute_agent/listener/__init__.py +43 -0
mute_agent/listener/adapters/__init__.py +31 -0
mute_agent/listener/adapters/base_adapter.py +189 -0
mute_agent/listener/adapters/caas_adapter.py +344 -0
mute_agent/listener/adapters/control_plane_adapter.py +436 -0
mute_agent/listener/adapters/iatp_adapter.py +332 -0
mute_agent/listener/adapters/scak_adapter.py +251 -0
mute_agent/listener/listener.py +610 -0
mute_agent/listener/state_observer.py +436 -0
mute_agent/listener/threshold_config.py +313 -0
mute_agent/super_system/__init__.py +1 -0
mute_agent/super_system/router.py +204 -0
mute_agent/visualization/__init__.py +10 -0
mute_agent/visualization/graph_debugger.py +502 -0
nexus/README.md +60 -0
nexus/__init__.py +51 -0
nexus/arbiter.py +359 -0
nexus/client.py +466 -0
nexus/dmz.py +444 -0
nexus/escrow.py +430 -0
nexus/exceptions.py +286 -0
nexus/pyproject.toml +36 -0
nexus/registry.py +393 -0
nexus/reputation.py +425 -0
nexus/schemas/__init__.py +51 -0
nexus/schemas/compliance.py +276 -0
nexus/schemas/escrow.py +251 -0
nexus/schemas/manifest.py +225 -0
nexus/schemas/receipt.py +208 -0
nexus/tests/__init__.py +0 -0
nexus/tests/conftest.py +146 -0
nexus/tests/test_arbiter.py +192 -0
nexus/tests/test_dmz.py +194 -0
nexus/tests/test_escrow.py +276 -0
nexus/tests/test_exceptions.py +225 -0
nexus/tests/test_registry.py +232 -0
nexus/tests/test_reputation.py +328 -0
nexus/tests/test_schemas.py +295 -0

agent_kernel/semantic_analyzer.py ADDED Viewed

@@ -0,0 +1,316 @@
+# Copyright (c) Microsoft Corporation.
+# Licensed under the MIT License.
+"""
+Semantic Analyzer - Advanced refusal detection beyond regex patterns.
+This module analyzes agent responses to classify "refusal" vs
+"compliance" behavior by combining indicator-phrase scoring with tool
+execution context and response length, rather than relying on a single
+regex match.
+"""
+import logging
+from typing import Optional, List
+from .models import SemanticAnalysis
+logger = logging.getLogger(__name__)
+class SemanticAnalyzer:
+    """
+    Analyzes agent responses semantically to detect refusal patterns.
+    Unlike regex-based detection, this analyzes the semantic meaning
+    to catch subtle forms of giving up like:
+    - "I'm afraid those records are elusive at the moment."
+    - "The information seems to be unavailable."
+    - "It appears there's nothing to show."
+    This is inspired by "Refusal Benchmarking" in AI safety research.
+    """
+    def __init__(self):
+        """Initialize the semantic analyzer."""
+        self.refusal_indicators = self._load_refusal_indicators()
+        self.compliance_indicators = self._load_compliance_indicators()
+    def _load_refusal_indicators(self) -> List[str]:
+        """Load semantic indicators of refusal/giving up."""
+        return [
+            # Direct refusal phrases
+            "cannot", "can't", "unable", "impossible", "won't",
+            "don't have", "doesn't exist", "not available", "unavailable",
+            # Evasive/elusive language
+            "elusive", "appears to be", "seems to be", "might be",
+            "could be", "perhaps", "possibly", "unclear",
+            # Uncertainty/hedging
+            "I'm afraid", "unfortunately", "regrettably", "sadly",
+            "it seems", "it appears", "looks like",
+            # Empty/negative results
+            "no data", "no results", "no information", "nothing found",
+            "zero results", "empty", "none available",
+            # Insufficient effort indicators
+            "not sure", "uncertain", "don't know", "can't tell",
+            "hard to say", "difficult to determine"
+        ]
+    def _load_compliance_indicators(self) -> List[str]:
+        """Load semantic indicators of compliance/success."""
+        return [
+            # Action completion
+            "found", "discovered", "located", "identified", "retrieved",
+            "obtained", "extracted", "collected",
+            # Data presentation
+            "here is", "here are", "the results", "the data shows",
+            "according to", "based on", "from the",
+            # Quantity indicators
+            "total", "count", "number of", "records", "entries",
+            "items", "results show",
+            # Confidence indicators
+            "successfully", "confirmed", "verified", "validated"
+        ]
+    def analyze(
+        self,
+        agent_response: str,
+        user_prompt: str,
+        tool_telemetry: Optional[List] = None
+    ) -> SemanticAnalysis:
+        """
+        Perform semantic analysis on agent response.
+        Args:
+            agent_response: The agent's response to analyze
+            user_prompt: The original user prompt for context
+            tool_telemetry: Optional tool execution telemetry
+        Returns:
+            SemanticAnalysis with classification and confidence
+        """
+        response_lower = agent_response.lower()
+        prompt_lower = user_prompt.lower()
+        # Calculate refusal and compliance scores
+        refusal_score = self._calculate_refusal_score(response_lower)
+        compliance_score = self._calculate_compliance_score(response_lower)
+        # Check for tool execution context
+        tool_context_score = self._analyze_tool_context(tool_telemetry)
+        # Determine if this is a refusal
+        is_refusal = self._determine_refusal(
+            refusal_score,
+            compliance_score,
+            tool_context_score,
+            response_lower
+        )
+        # Calculate confidence based on multiple signals
+        confidence = self._calculate_confidence(
+            refusal_score,
+            compliance_score,
+            tool_context_score,
+            response_lower
+        )
+        # Determine semantic category
+        category = self._determine_category(
+            is_refusal,
+            refusal_score,
+            compliance_score
+        )
+        # Generate reasoning explanation
+        reasoning = self._generate_reasoning(
+            is_refusal,
+            refusal_score,
+            compliance_score,
+            tool_context_score,
+            response_lower
+        )
+        return SemanticAnalysis(
+            is_refusal=is_refusal,
+            refusal_confidence=confidence,
+            semantic_category=category,
+            reasoning=reasoning
+        )
+    def _calculate_refusal_score(self, response: str) -> float:
+        """Calculate refusal score based on indicators present."""
+        matches = sum(1 for indicator in self.refusal_indicators if indicator in response)
+        # Normalize to 0-1 range
+        return min(matches / 3.0, 1.0)  # 3+ matches = 1.0
+    def _calculate_compliance_score(self, response: str) -> float:
+        """Calculate compliance score based on indicators present."""
+        matches = sum(1 for indicator in self.compliance_indicators if indicator in response)
+        # Normalize to 0-1 range
+        return min(matches / 3.0, 1.0)  # 3+ matches = 1.0
+    def _analyze_tool_context(self, tool_telemetry: Optional[List]) -> float:
+        """
+        Analyze tool execution context.
+        Returns a score indicating likelihood of laziness:
+        - 0.0: Tools called and returned data (not lazy)
+        - 0.5: Tools called but empty results (might be lazy)
+        - 1.0: Tools not called (likely lazy)
+        """
+        if not tool_telemetry:
+            return 0.7  # No telemetry suggests possible laziness
+        from .models import ToolExecutionStatus
+        # Check if any tools were called
+        called_tools = [t for t in tool_telemetry if t.tool_status != ToolExecutionStatus.NOT_CALLED]
+        if not called_tools:
+            return 1.0  # No tools called - clear laziness
+        # Check if tools returned empty results
+        empty_results = [t for t in called_tools if t.tool_status == ToolExecutionStatus.EMPTY_RESULT]
+        if len(empty_results) == len(called_tools):
+            return 0.3  # All tools returned empty - likely legitimate
+        # Mix of results
+        return 0.5
+    def _determine_refusal(
+        self,
+        refusal_score: float,
+        compliance_score: float,
+        tool_context_score: float,
+        response: str
+    ) -> bool:
+        """
+        Determine if response indicates refusal.
+        Uses multiple signals to make decision:
+        - Refusal language
+        - Lack of compliance language
+        - Tool execution context
+        - Response length
+        """
+        # Short responses with refusal language
+        if len(response) < 50 and refusal_score > 0.3:
+            return True
+        # High refusal score and low compliance
+        if refusal_score > 0.5 and compliance_score < 0.2:
+            return True
+        # High tool laziness (not called) + some refusal language
+        if tool_context_score > 0.7 and refusal_score > 0.2:
+            return True
+        # Moderate refusal with no compliance
+        if refusal_score > 0.3 and compliance_score == 0.0:
+            return True
+        return False
+    def _calculate_confidence(
+        self,
+        refusal_score: float,
+        compliance_score: float,
+        tool_context_score: float,
+        response: str
+    ) -> float:
+        """
+        Calculate confidence in the refusal detection.
+        Higher confidence when:
+        - Clear refusal indicators
+        - Clear tool context (called or not)
+        - Low ambiguity
+        """
+        # Base confidence from score differences
+        score_diff = abs(refusal_score - compliance_score)
+        base_confidence = min(score_diff + 0.5, 1.0)
+        # Boost confidence if tool context is clear
+        if tool_context_score < 0.3 or tool_context_score > 0.7:
+            base_confidence = min(base_confidence + 0.1, 1.0)
+        # Reduce confidence for very short responses (ambiguous)
+        if len(response) < 20:
+            base_confidence *= 0.8
+        # Boost confidence for very clear patterns
+        if refusal_score > 0.7 or compliance_score > 0.7:
+            base_confidence = min(base_confidence + 0.15, 1.0)
+        return round(base_confidence, 2)
+    def _determine_category(
+        self,
+        is_refusal: bool,
+        refusal_score: float,
+        compliance_score: float
+    ) -> str:
+        """Determine semantic category of response."""
+        if is_refusal:
+            return "refusal"
+        if compliance_score > 0.5:
+            return "compliance"
+        if refusal_score > 0.2 and compliance_score > 0.2:
+            return "unclear"
+        return "error"
+    def _generate_reasoning(
+        self,
+        is_refusal: bool,
+        refusal_score: float,
+        compliance_score: float,
+        tool_context_score: float,
+        response: str
+    ) -> str:
+        """Generate human-readable reasoning for the classification."""
+        if is_refusal:
+            reasons = []
+            if refusal_score > 0.5:
+                reasons.append(f"Strong refusal language detected (score: {refusal_score:.2f})")
+            elif refusal_score > 0.3:
+                reasons.append(f"Moderate refusal indicators present (score: {refusal_score:.2f})")
+            if compliance_score < 0.2:
+                reasons.append(f"Low compliance indicators (score: {compliance_score:.2f})")
+            if tool_context_score > 0.7:
+                reasons.append("Tools not called or minimal usage")
+            elif tool_context_score > 0.4:
+                reasons.append("Tools returned empty results")
+            if len(response) < 50:
+                reasons.append("Response is brief, suggesting minimal effort")
+            return "Response indicates refusal/give-up: " + "; ".join(reasons)
+        else:
+            reasons = []
+            if compliance_score > 0.5:
+                reasons.append(f"Strong compliance indicators (score: {compliance_score:.2f})")
+            elif compliance_score > 0.2:
+                reasons.append(f"Some compliance indicators present (score: {compliance_score:.2f})")
+            if tool_context_score < 0.3:
+                reasons.append("Tools executed and returned data")
+            if refusal_score < 0.2:
+                reasons.append("Minimal refusal language")
+            return "Response indicates compliance/success: " + "; ".join(reasons)

agent_kernel/semantic_purge.py ADDED Viewed

@@ -0,0 +1,349 @@
+# Copyright (c) Microsoft Corporation.
+# Licensed under the MIT License.
+"""
+Semantic Purge - Scale by Subtraction for patch lifecycle management.
+Implements the "Taxonomy of Lessons" to prevent context bloat:
+- Type A (Syntax/Capability): High decay - likely model defects, purge on upgrade
+- Type B (Business/Context): Zero decay - world truths, retain forever
+This allows reducing context usage by 40-60% over the agent's lifetime.
+"""
+import logging
+from typing import List, Dict, Optional
+from datetime import datetime
+from .models import (
+    CorrectionPatch, ClassifiedPatch, PatchDecayType,
+    CognitiveGlitch, CompletenessAudit
+)
+logger = logging.getLogger(__name__)
+class PatchClassifier:
+    """
+    Classifies patches into Type A (Syntax) vs Type B (Business).
+    This is the "Taxonomy of Lessons" that determines lifecycle.
+    """
+    def __init__(self):
+        self.syntax_indicators = [
+            "output json", "format", "syntax", "parse", "validation error",
+            "type mismatch", "parameter type", "limit 10", "use uuid",
+            "tool definition", "schema injection", "parameter checking"
+        ]
+        self.business_indicators = [
+            "fiscal year", "project", "entity", "business rule", "policy",
+            "archived", "deprecated", "does not exist", "negative constraint",
+            "company", "organization", "domain", "customer", "workflow"
+        ]
+    def classify_patch(
+        self,
+        patch: CorrectionPatch,
+        current_model_version: str
+    ) -> ClassifiedPatch:
+        """
+        Classify a patch as Type A or Type B.
+        Args:
+            patch: The correction patch to classify
+            current_model_version: Current model version (e.g., "gpt-4o", "gpt-5")
+        Returns:
+            ClassifiedPatch with decay type and metadata
+        """
+        logger.info(f"Classifying patch {patch.patch_id}")
+        # Analyze patch content to determine type
+        decay_type = self._determine_decay_type(patch)
+        # Determine if should purge on upgrade
+        should_purge = (decay_type == PatchDecayType.SYNTAX_CAPABILITY)
+        # Build metadata
+        metadata = self._build_decay_metadata(patch, decay_type)
+        classified = ClassifiedPatch(
+            base_patch=patch,
+            decay_type=decay_type,
+            created_at_model_version=current_model_version,
+            decay_metadata=metadata,
+            should_purge_on_upgrade=should_purge
+        )
+        logger.info(f"Classified as {decay_type.value} (purge on upgrade: {should_purge})")
+        return classified
+    def _determine_decay_type(self, patch: CorrectionPatch) -> PatchDecayType:
+        """
+        Determine if patch is Type A (Syntax) or Type B (Business).
+        Type A - Syntax/Capability (HIGH DECAY):
+        - Model-specific issues (JSON formatting, type errors)
+        - Tool usage errors (wrong parameter types)
+        - Syntax errors, validation issues
+        - Query construction problems
+        - These are likely fixed in newer model versions
+        Type B - Business/Context (ZERO DECAY):
+        - Company-specific rules ("Fiscal year starts in July")
+        - Entity existence ("Project_Alpha is deprecated")
+        - Policy violations (medical advice restrictions)
+        - Domain knowledge (archived locations, workflows)
+        - These are world truths that models can't learn
+        """
+        # Check diagnosis first (most reliable indicator)
+        if patch.diagnosis:
+            glitch = patch.diagnosis.cognitive_glitch
+            # Tool misuse is almost always Type A (model capability issue)
+            if glitch == CognitiveGlitch.TOOL_MISUSE:
+                return PatchDecayType.SYNTAX_CAPABILITY
+            # Policy violations are Type B (business rules)
+            if glitch == CognitiveGlitch.POLICY_VIOLATION:
+                return PatchDecayType.BUSINESS_CONTEXT
+            # Hallucinations about entities are Type B (world knowledge)
+            if glitch == CognitiveGlitch.HALLUCINATION:
+                return PatchDecayType.BUSINESS_CONTEXT
+            # Schema mismatches depend on content
+            if glitch == CognitiveGlitch.SCHEMA_MISMATCH:
+                # Check if it's about company-specific schema
+                content_str = str(patch.patch_content).lower()
+                if any(indicator in content_str for indicator in self.business_indicators):
+                    return PatchDecayType.BUSINESS_CONTEXT
+                return PatchDecayType.SYNTAX_CAPABILITY
+        # Analyze patch content
+        content_str = str(patch.patch_content).lower()
+        # Count indicators
+        syntax_score = sum(1 for ind in self.syntax_indicators if ind in content_str)
+        business_score = sum(1 for ind in self.business_indicators if ind in content_str)
+        # Check for specific patterns
+        if patch.patch_type == "system_prompt":
+            rule = patch.patch_content.get("rule", "")
+            rule_lower = rule.lower()
+            # Schema injection and parameter checking are Type A
+            if "schema injection" in rule_lower or "parameter type" in rule_lower:
+                return PatchDecayType.SYNTAX_CAPABILITY
+            # Constitutional rules about domains are Type B
+            if "constitutional" in rule_lower or "refuse" in rule_lower:
+                return PatchDecayType.BUSINESS_CONTEXT
+            # Entity-specific negative constraints are Type B
+            if "does not exist" in rule_lower or "deprecated" in rule_lower:
+                return PatchDecayType.BUSINESS_CONTEXT
+        # RAG memory patches are typically Type B (business context)
+        if patch.patch_type == "rag_memory":
+            negative_constraint = patch.patch_content.get("negative_constraint")
+            if negative_constraint:
+                return PatchDecayType.BUSINESS_CONTEXT
+        # Score-based classification
+        if business_score > syntax_score:
+            return PatchDecayType.BUSINESS_CONTEXT
+        elif syntax_score > 0:
+            return PatchDecayType.SYNTAX_CAPABILITY
+        # Default to business context (safer - won't accidentally purge important rules)
+        return PatchDecayType.BUSINESS_CONTEXT
+    def _build_decay_metadata(self, patch: CorrectionPatch, decay_type: PatchDecayType) -> Dict:
+        """Build metadata for decay management."""
+        metadata = {
+            "classification_reason": self._get_classification_reason(patch, decay_type),
+            "estimated_lifetime": "until_upgrade" if decay_type == PatchDecayType.SYNTAX_CAPABILITY else "permanent",
+            "priority": "low" if decay_type == PatchDecayType.SYNTAX_CAPABILITY else "high"
+        }
+        if decay_type == PatchDecayType.SYNTAX_CAPABILITY:
+            metadata["purge_trigger"] = "model_version_upgrade"
+            metadata["expected_fix_in"] = "next_model_generation"
+        else:
+            metadata["purge_trigger"] = "manual_review_only"
+            metadata["rag_storage_recommended"] = True
+        return metadata
+    def _get_classification_reason(self, patch: CorrectionPatch, decay_type: PatchDecayType) -> str:
+        """Get human-readable reason for classification."""
+        if patch.diagnosis:
+            glitch = patch.diagnosis.cognitive_glitch.value
+            if decay_type == PatchDecayType.SYNTAX_CAPABILITY:
+                return f"Model capability issue ({glitch}) - likely fixed in upgraded models"
+            else:
+                return f"Domain/business knowledge ({glitch}) - requires permanent retention"
+        return "Content-based classification"
+class SemanticPurge:
+    """
+    Manages patch lifecycle and purging.
+    This is "Scale by Subtraction" - reducing context by purging temporary wisdom.
+    """
+    def __init__(self):
+        self.classifier = PatchClassifier()
+        self.classified_patches: Dict[str, ClassifiedPatch] = {}
+        self.purge_history: List[Dict] = []
+    def register_patch(
+        self,
+        patch: CorrectionPatch,
+        current_model_version: str
+    ) -> ClassifiedPatch:
+        """
+        Register a patch with classification for lifecycle management.
+        Args:
+            patch: The correction patch
+            current_model_version: Current model version
+        Returns:
+            ClassifiedPatch with metadata
+        """
+        classified = self.classifier.classify_patch(patch, current_model_version)
+        self.classified_patches[patch.patch_id] = classified
+        logger.info(f"Registered patch {patch.patch_id} as {classified.decay_type.value}")
+        return classified
+    def purge_on_upgrade(
+        self,
+        old_model_version: str,
+        new_model_version: str
+    ) -> Dict[str, List[str]]:
+        """
+        Purge Type A patches when model version upgrades.
+        This is the "Purge Event" - async purging to reclaim tokens.
+        Args:
+            old_model_version: Previous model version
+            new_model_version: New model version
+        Returns:
+            Dictionary with purged and retained patch IDs
+        """
+        logger.info(f"🗑️  PURGE EVENT: Model upgrade {old_model_version} → {new_model_version}")
+        purged_patches = []
+        retained_patches = []
+        for patch_id, classified in self.classified_patches.items():
+            if classified.should_purge_on_upgrade:
+                # This is Type A (Syntax) - likely fixed in new model
+                purged_patches.append(patch_id)
+                logger.info(f"   Purging Type A patch {patch_id}: {classified.decay_metadata.get('classification_reason', '')}")
+            else:
+                # This is Type B (Business) - retain forever
+                retained_patches.append(patch_id)
+        # Record purge event
+        purge_event = {
+            "timestamp": datetime.utcnow(),
+            "old_version": old_model_version,
+            "new_version": new_model_version,
+            "purged_count": len(purged_patches),
+            "retained_count": len(retained_patches),
+            "purged_patches": purged_patches,
+            "tokens_reclaimed": self._estimate_tokens_reclaimed(purged_patches)
+        }
+        self.purge_history.append(purge_event)
+        # Remove purged patches
+        for patch_id in purged_patches:
+            del self.classified_patches[patch_id]
+        logger.info(f"✓ Purged {len(purged_patches)} Type A patches")
+        logger.info(f"✓ Retained {len(retained_patches)} Type B patches")
+        logger.info(f"✓ Estimated tokens reclaimed: {purge_event['tokens_reclaimed']}")
+        return {
+            "purged": purged_patches,
+            "retained": retained_patches,
+            "stats": {
+                "purged_count": len(purged_patches),
+                "retained_count": len(retained_patches),
+                "tokens_reclaimed": purge_event["tokens_reclaimed"]
+            }
+        }
+    def _estimate_tokens_reclaimed(self, purged_patch_ids: List[str]) -> int:
+        """
+        Estimate tokens reclaimed by purging patches.
+        Rough estimate: each patch uses 50-200 tokens depending on complexity.
+        """
+        return len(purged_patch_ids) * 100  # Average 100 tokens per patch
+    def get_purge_stats(self) -> Dict:
+        """Get statistics about purging activity."""
+        total_patches = len(self.classified_patches)
+        type_a_count = sum(1 for p in self.classified_patches.values()
+                          if p.decay_type == PatchDecayType.SYNTAX_CAPABILITY)
+        type_b_count = sum(1 for p in self.classified_patches.values()
+                          if p.decay_type == PatchDecayType.BUSINESS_CONTEXT)
+        total_purged = sum(event["purged_count"] for event in self.purge_history)
+        total_tokens_reclaimed = sum(event["tokens_reclaimed"] for event in self.purge_history)
+        return {
+            "current_patches": total_patches,
+            "type_a_syntax": type_a_count,
+            "type_b_business": type_b_count,
+            "purge_events": len(self.purge_history),
+            "total_purged": total_purged,
+            "total_tokens_reclaimed": total_tokens_reclaimed,
+            "estimated_savings": f"{(type_a_count / (total_patches or 1)) * 100:.1f}% can be purged on upgrade"
+        }
+    def get_purgeable_patches(self) -> List[ClassifiedPatch]:
+        """Get list of patches that would be purged on upgrade."""
+        return [
+            p for p in self.classified_patches.values()
+            if p.should_purge_on_upgrade
+        ]
+    def get_permanent_patches(self) -> List[ClassifiedPatch]:
+        """Get list of permanent (Type B) patches."""
+        return [
+            p for p in self.classified_patches.values()
+            if not p.should_purge_on_upgrade
+        ]
+    def register_completeness_audit(
+        self,
+        audit: CompletenessAudit,
+        current_model_version: str
+    ):
+        """
+        Register a competence patch from completeness audit.
+        Competence patches are always Type B (business context) because they
+        represent gaps in domain knowledge, not model defects.
+        """
+        # Create a synthetic patch for the competence lesson
+        # In a real system, this would be integrated with the patcher
+        logger.info(f"Registering competence patch from audit {audit.audit_id}")
+        logger.info(f"   Lesson: {audit.competence_patch[:80]}...")
+        # Competence patches are always Type B - domain knowledge
+        # These represent what the agent didn't know about the domain/business