cognitive-modules 0.4.0-py3-none-any.whl → 0.5.1-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- cognitive/__init__.py +1 -1
- cognitive/cli.py +173 -18
- cognitive/loader.py +191 -14
- cognitive/mcp_server.py +245 -0
- cognitive/migrate.py +624 -0
- cognitive/runner.py +443 -80
- cognitive/server.py +294 -0
- cognitive/validator.py +380 -122
- {cognitive_modules-0.4.0.dist-info → cognitive_modules-0.5.1.dist-info}/METADATA +194 -177
- cognitive_modules-0.5.1.dist-info/RECORD +18 -0
- cognitive_modules-0.4.0.dist-info/RECORD +0 -15
- {cognitive_modules-0.4.0.dist-info → cognitive_modules-0.5.1.dist-info}/WHEEL +0 -0
- {cognitive_modules-0.4.0.dist-info → cognitive_modules-0.5.1.dist-info}/entry_points.txt +0 -0
- {cognitive_modules-0.4.0.dist-info → cognitive_modules-0.5.1.dist-info}/licenses/LICENSE +0 -0
- {cognitive_modules-0.4.0.dist-info → cognitive_modules-0.5.1.dist-info}/top_level.txt +0 -0
cognitive/runner.py
CHANGED
@@ -1,11 +1,17 @@
 """
 Module Runner - Execute cognitive modules with validation.
-Supports v2 envelope format
+Supports v2.2 envelope format with Control/Data plane separation.
+
+v2.2 Features:
+- meta (Control Plane): confidence, risk, explain
+- data (Data Plane): business payload + rationale
+- Repair pass for schema validation failures
+- Auto-wrap v2.1 payloads to v2.2 envelope
 """
 
 import json
 from pathlib import Path
-from typing import Optional, TypedDict, Union
+from typing import Optional, TypedDict, Union, Literal
 
 import jsonschema
 import yaml
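For reference, the Control/Data plane split described in the new docstring yields envelopes shaped like the sketch below. This is an illustrative instance of the `EnvelopeSuccessV22`/`EnvelopeMeta` types added later in this diff; the field values are invented.

```python
# Illustrative v2.2 success envelope (values are examples, not package output).
envelope = {
    "ok": True,
    "meta": {                       # Control Plane
        "confidence": 0.9,          # float in 0-1
        "risk": "low",              # one of: none, low, medium, high
        "explain": "Short summary, at most 280 characters.",
    },
    "data": {                       # Data Plane: business payload + rationale
        "changes": [{"risk": "low"}],
        "rationale": "Longer free-form reasoning can live here.",
    },
}
```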
@@ -15,25 +21,112 @@ from .loader import load_module
 from .providers import call_llm
 
 
+# =============================================================================
+# Type Definitions (v2.2)
+# =============================================================================
+
+RiskLevel = Literal["none", "low", "medium", "high"]
+
+class EnvelopeMeta(TypedDict, total=False):
+    """Control plane metadata - unified across all modules."""
+    confidence: float  # 0-1
+    risk: RiskLevel
+    explain: str  # max 280 chars
+    trace_id: str
+    model: str
+    latency_ms: float
+
+
 class EnvelopeError(TypedDict):
     code: str
     message: str
 
 
-class
-    ok:
+class EnvelopeSuccessV22(TypedDict):
+    ok: Literal[True]
+    meta: EnvelopeMeta
+    data: dict
+
+
+class EnvelopeFailureV22(TypedDict, total=False):
+    ok: Literal[False]
+    meta: EnvelopeMeta
+    error: EnvelopeError
+    partial_data: Optional[dict]
+
+
+EnvelopeResponseV22 = Union[EnvelopeSuccessV22, EnvelopeFailureV22]
+
+
+# Legacy types for compatibility
+class EnvelopeSuccessV21(TypedDict):
+    ok: Literal[True]
     data: dict
 
 
-class
-    ok:
+class EnvelopeFailureV21(TypedDict, total=False):
+    ok: Literal[False]
     error: EnvelopeError
     partial_data: Optional[dict]
 
 
-EnvelopeResponse = Union[
+EnvelopeResponse = Union[EnvelopeResponseV22, EnvelopeSuccessV21, EnvelopeFailureV21]
+
+
+# =============================================================================
+# Risk Aggregation
+# =============================================================================
+
+RISK_LEVELS = {"none": 0, "low": 1, "medium": 2, "high": 3}
+RISK_NAMES = ["none", "low", "medium", "high"]
+
+RiskRule = Literal["max_changes_risk", "max_issues_risk", "explicit"]
 
 
+def aggregate_risk_from_list(items: list[dict]) -> RiskLevel:
+    """Compute max risk from list of items with risk field."""
+    if not items:
+        return "medium"  # Default conservative
+
+    max_level = 0
+    for item in items:
+        risk = item.get("risk", "medium")
+        level = RISK_LEVELS.get(risk, 2)
+        max_level = max(max_level, level)
+
+    return RISK_NAMES[max_level]
+
+
+def aggregate_risk(
+    data: dict,
+    risk_rule: RiskRule = "max_changes_risk"
+) -> RiskLevel:
+    """
+    Compute aggregated risk based on risk_rule.
+
+    Rules:
+    - max_changes_risk: max(data.changes[*].risk) - default
+    - max_issues_risk: max(data.issues[*].risk) - for review modules
+    - explicit: return "medium", module should set risk explicitly
+    """
+    if risk_rule == "max_changes_risk":
+        changes = data.get("changes", [])
+        return aggregate_risk_from_list(changes)
+    elif risk_rule == "max_issues_risk":
+        issues = data.get("issues", [])
+        return aggregate_risk_from_list(issues)
+    elif risk_rule == "explicit":
+        return "medium"  # Module should override
+    else:
+        # Fallback to changes
+        changes = data.get("changes", [])
+        return aggregate_risk_from_list(changes)
+
+
+# =============================================================================
+# Schema Validation
+# =============================================================================
+
 def validate_data(data: dict, schema: dict, label: str = "Data") -> list[str]:
     """Validate data against schema. Returns list of errors."""
     errors = []
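A quick sketch of how the new risk-aggregation helpers behave; the import path is assumed from the wheel layout (`cognitive/runner.py`) and the payload is invented.

```python
# Usage sketch for the new risk helpers; import path assumed, data invented.
from cognitive.runner import aggregate_risk, aggregate_risk_from_list

data = {"changes": [{"risk": "low"}, {"risk": "high"}, {}]}  # missing risk defaults to "medium"

print(aggregate_risk_from_list(data["changes"]))            # -> "high"
print(aggregate_risk(data, risk_rule="max_changes_risk"))   # -> "high"
print(aggregate_risk({}, risk_rule="max_changes_risk"))     # -> "medium" (empty list is conservative)
```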
@@ -48,9 +141,193 @@ def validate_data(data: dict, schema: dict, label: str = "Data") -> list[str]:
     return errors
 
 
+# =============================================================================
+# Repair Pass (v2.2)
+# =============================================================================
+
+def repair_envelope(
+    data: dict,
+    meta_schema: Optional[dict] = None,
+    max_explain_length: int = 280,
+    risk_rule: RiskRule = "max_changes_risk"
+) -> dict:
+    """
+    Attempt to repair envelope format issues without changing semantics.
+
+    Repairs (lossless only):
+    - Missing meta fields (fill with conservative defaults)
+    - Truncate explain if too long
+    - Trim whitespace from string fields
+
+    Does NOT repair:
+    - Invalid enum values (treated as validation failure)
+    """
+    repaired = dict(data)
+
+    # Ensure meta exists
+    if "meta" not in repaired:
+        repaired["meta"] = {}
+
+    meta = repaired["meta"]
+    data_payload = repaired.get("data", {})
+
+    # Repair confidence
+    if "confidence" not in meta:
+        # Try to extract from data (v2.1 compatibility)
+        meta["confidence"] = data_payload.get("confidence", 0.5)
+
+    # Ensure confidence is in valid range
+    if isinstance(meta.get("confidence"), (int, float)):
+        meta["confidence"] = max(0.0, min(1.0, float(meta["confidence"])))
+
+    # Repair risk - use configurable aggregation rule
+    if "risk" not in meta:
+        meta["risk"] = aggregate_risk(data_payload, risk_rule)
+
+    # Trim whitespace from risk (lossless), but do NOT invent new values
+    if isinstance(meta.get("risk"), str):
+        meta["risk"] = meta["risk"].strip().lower()
+        # If invalid after trim, leave as-is (validation will catch it)
+
+    # Repair explain
+    if "explain" not in meta:
+        # Try to extract from rationale
+        rationale = data_payload.get("rationale", "")
+        if rationale:
+            meta["explain"] = str(rationale)[:max_explain_length]
+        else:
+            meta["explain"] = "No explanation provided"
+
+    # Trim whitespace from explain (lossless)
+    if isinstance(meta.get("explain"), str):
+        meta["explain"] = meta["explain"].strip()
+
+    # Truncate explain if too long
+    if len(meta.get("explain", "")) > max_explain_length:
+        meta["explain"] = meta["explain"][:max_explain_length - 3] + "..."
+
+    return repaired
+
+
+def repair_error_envelope(
+    data: dict,
+    max_explain_length: int = 280
+) -> dict:
+    """Repair error envelope format."""
+    repaired = dict(data)
+
+    # Ensure meta exists for errors
+    if "meta" not in repaired:
+        repaired["meta"] = {}
+
+    meta = repaired["meta"]
+
+    # Set default meta for errors
+    if "confidence" not in meta:
+        meta["confidence"] = 0.0
+    if "risk" not in meta:
+        meta["risk"] = "high"
+    if "explain" not in meta:
+        error = repaired.get("error", {})
+        meta["explain"] = error.get("message", "An error occurred")[:max_explain_length]
+
+    return repaired
+
+
+# =============================================================================
+# Envelope Detection & Conversion
+# =============================================================================
+
+def is_envelope_response(data: dict) -> bool:
+    """Check if response is in envelope format (v2.1 or v2.2)."""
+    return isinstance(data.get("ok"), bool)
+
+
+def is_v22_envelope(data: dict) -> bool:
+    """Check if response is in v2.2 envelope format (has meta)."""
+    return is_envelope_response(data) and "meta" in data
+
+
+def wrap_v21_to_v22(v21_response: dict) -> EnvelopeResponseV22:
+    """
+    Convert v2.1 envelope to v2.2 envelope.
+    Adds meta field by extracting/computing from data.
+    """
+    if is_v22_envelope(v21_response):
+        return v21_response  # Already v2.2
+
+    if v21_response.get("ok") is True:
+        data = v21_response.get("data", {})
+
+        # Extract or compute meta fields
+        confidence = data.get("confidence", 0.5)
+        rationale = data.get("rationale", "")
+
+        return {
+            "ok": True,
+            "meta": {
+                "confidence": confidence,
+                "risk": aggregate_risk(data),  # Uses default max_changes_risk
+                "explain": rationale[:280] if rationale else "No explanation provided"
+            },
+            "data": data
+        }
+    else:
+        error = v21_response.get("error", {"code": "UNKNOWN", "message": "Unknown error"})
+
+        return {
+            "ok": False,
+            "meta": {
+                "confidence": 0.0,
+                "risk": "high",
+                "explain": error.get("message", "An error occurred")[:280]
+            },
+            "error": error,
+            "partial_data": v21_response.get("partial_data")
+        }
+
+
+def convert_legacy_to_envelope(data: dict, is_error: bool = False) -> EnvelopeResponseV22:
+    """Convert legacy format (no envelope) to v2.2 envelope."""
+    if is_error or "error" in data:
+        error = data.get("error", {})
+        error_msg = error.get("message", str(error)) if isinstance(error, dict) else str(error)
+
+        return {
+            "ok": False,
+            "meta": {
+                "confidence": 0.0,
+                "risk": "high",
+                "explain": error_msg[:280]
+            },
+            "error": {
+                "code": error.get("code", "UNKNOWN") if isinstance(error, dict) else "UNKNOWN",
+                "message": error_msg
+            },
+            "partial_data": None
+        }
+    else:
+        # Legacy success response - data is the payload itself
+        confidence = data.get("confidence", 0.5)
+        rationale = data.get("rationale", "")
+
+        return {
+            "ok": True,
+            "meta": {
+                "confidence": confidence,
+                "risk": aggregate_risk(data),  # Uses default max_changes_risk
+                "explain": rationale[:280] if rationale else "No explanation provided"
+            },
+            "data": data
+        }
+
+
+# =============================================================================
+# Prompt Building
+# =============================================================================
+
 def substitute_arguments(text: str, input_data: dict) -> str:
     """Substitute $ARGUMENTS and $N placeholders in text."""
-    # Get arguments
     args_value = input_data.get("$ARGUMENTS", input_data.get("query", input_data.get("code", "")))
 
     # Replace $ARGUMENTS
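To make the auto-wrap and repair behavior concrete, here is a hedged sketch using the functions added above; the import path and payloads are assumptions, and the commented results follow from the code as shown.

```python
# Sketch of v2.1 -> v2.2 wrapping and the lossless repair pass; inputs invented.
from cognitive.runner import wrap_v21_to_v22, repair_envelope

v21 = {"ok": True, "data": {"confidence": 0.8, "rationale": "Looks fine.", "changes": []}}
v22 = wrap_v21_to_v22(v21)
# v22["meta"] -> {"confidence": 0.8, "risk": "medium", "explain": "Looks fine."}
# ("medium" because data["changes"] is empty and the default rule is conservative)

broken = {"ok": True, "data": {"rationale": "x" * 500}}      # no meta at all
fixed = repair_envelope(broken)
assert fixed["meta"]["confidence"] == 0.5                    # conservative default
assert len(fixed["meta"]["explain"]) <= 280                  # truncated from rationale
```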
@@ -66,7 +343,7 @@ def substitute_arguments(text: str, input_data: dict) -> str:
     return text
 
 
-def build_prompt(module: dict, input_data: dict, use_envelope: bool = False) -> str:
+def build_prompt(module: dict, input_data: dict, use_envelope: bool = False, use_v22: bool = False) -> str:
     """Build the complete prompt for the LLM."""
     # Substitute $ARGUMENTS in prompt
     prompt = substitute_arguments(module["prompt"], input_data)
@@ -82,13 +359,23 @@ def build_prompt(module: dict, input_data: dict, use_envelope: bool = False) ->
     ]
 
     if use_envelope:
-
-
-
-
-
-
-
+        if use_v22:
+            parts.extend([
+                "\n## Response Format (Envelope v2.2)\n",
+                "You MUST wrap your response in the v2.2 envelope format with separate meta and data:\n",
+                "- Success: { \"ok\": true, \"meta\": { \"confidence\": 0.9, \"risk\": \"low\", \"explain\": \"short summary\" }, \"data\": { ...payload... } }\n",
+                "- Error: { \"ok\": false, \"meta\": { \"confidence\": 0.0, \"risk\": \"high\", \"explain\": \"error summary\" }, \"error\": { \"code\": \"ERROR_CODE\", \"message\": \"...\" } }\n",
+                "Note: meta.explain must be ≤280 characters. data.rationale can be longer for detailed reasoning.\n",
+                "Return ONLY valid JSON.\n",
+            ])
+        else:
+            parts.extend([
+                "\n## Response Format (Envelope)\n",
+                "You MUST wrap your response in the envelope format:\n",
+                "- Success: { \"ok\": true, \"data\": { ...your output... } }\n",
+                "- Error: { \"ok\": false, \"error\": { \"code\": \"ERROR_CODE\", \"message\": \"...\" } }\n",
+                "Return ONLY valid JSON.\n",
+            ])
     else:
         parts.extend([
             "\n## Instructions\n",
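For comparison with the success envelope shown earlier, the error branch of the new v2.2 prompt instructions asks the model for a payload like the following; the error code and message are invented for illustration.

```python
# Illustrative v2.2 error envelope matching the prompt instructions above.
error_envelope = {
    "ok": False,
    "meta": {
        "confidence": 0.0,
        "risk": "high",
        "explain": "Input could not be analyzed.",       # invented example text
    },
    "error": {"code": "ANALYSIS_FAILED", "message": "The snippet is not valid Python."},
    "partial_data": None,
}
```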
@@ -99,6 +386,10 @@ def build_prompt(module: dict, input_data: dict, use_envelope: bool = False) ->
     return "".join(parts)
 
 
+# =============================================================================
+# LLM Response Parsing
+# =============================================================================
+
 def parse_llm_response(response: str) -> dict:
     """Parse LLM response, handling potential markdown code blocks."""
     text = response.strip()
@@ -117,44 +408,9 @@ def parse_llm_response(response: str) -> dict:
     return json.loads(text)
 
 
-
-
-
-
-
-def parse_envelope_response(data: dict) -> EnvelopeResponse:
-    """Parse and normalize envelope response."""
-    if data.get("ok") is True:
-        return {
-            "ok": True,
-            "data": data.get("data", {})
-        }
-    else:
-        return {
-            "ok": False,
-            "error": data.get("error", {"code": "UNKNOWN", "message": "Unknown error"}),
-            "partial_data": data.get("partial_data")
-        }
-
-
-def convert_to_envelope(data: dict, is_error: bool = False) -> EnvelopeResponse:
-    """Convert legacy format to envelope format."""
-    if is_error or "error" in data:
-        error = data.get("error", {})
-        return {
-            "ok": False,
-            "error": {
-                "code": error.get("code", "UNKNOWN"),
-                "message": error.get("message", str(error))
-            },
-            "partial_data": None
-        }
-    else:
-        return {
-            "ok": True,
-            "data": data
-        }
-
+# =============================================================================
+# Main Runner
+# =============================================================================
 
 def run_module(
     name_or_path: str,
@@ -163,10 +419,12 @@
     validate_output: bool = True,
     model: Optional[str] = None,
     use_envelope: Optional[bool] = None,
-
+    use_v22: Optional[bool] = None,
+    enable_repair: bool = True,
+) -> EnvelopeResponseV22:
     """
     Run a cognitive module with the given input.
-    Returns envelope format response.
+    Returns v2.2 envelope format response.
 
     Args:
         name_or_path: Module name or path to module directory
@@ -175,10 +433,15 @@
         validate_output: Whether to validate output against schema
         model: Optional model override
         use_envelope: Force envelope format (auto-detect if None)
+        use_v22: Force v2.2 envelope format (auto-detect if None)
+        enable_repair: Enable repair pass for validation failures
 
     Returns:
-
+        EnvelopeResponseV22 with ok=True/False, meta, and data/error
     """
+    import time
+    start_time = time.time()
+
     # Find module path
     path = Path(name_or_path)
     if path.exists() and path.is_dir():
@@ -188,6 +451,11 @@
     if not module_path:
         return {
            "ok": False,
+            "meta": {
+                "confidence": 1.0,
+                "risk": "high",
+                "explain": f"Module '{name_or_path}' not found."
+            },
            "error": {"code": "MODULE_NOT_FOUND", "message": f"Module not found: {name_or_path}"},
            "partial_data": None
        }
@@ -195,57 +463,118 @@
     # Load module (auto-detects format)
     module = load_module(module_path)
 
-    # Determine
+    # Determine envelope version
+    compat = module.get("compat", {})
+    is_v22_module = module.get("tier") is not None or "meta_schema" in module
+
     should_use_envelope = use_envelope
     if should_use_envelope is None:
-        # Auto-detect: use envelope for v2 format or if output.envelope is True
         output_contract = module.get("output_contract", {})
         should_use_envelope = (
             module.get("format") == "v2" or
             output_contract.get("envelope", False)
         )
 
+    should_use_v22 = use_v22
+    if should_use_v22 is None:
+        should_use_v22 = is_v22_module or compat.get("runtime_auto_wrap", False)
+
     # Validate input
-    if validate_input and module
+    if validate_input and module.get("input_schema"):
         errors = validate_data(input_data, module["input_schema"], "Input")
         if errors:
            return {
                "ok": False,
+                "meta": {
+                    "confidence": 1.0,
+                    "risk": "none",
+                    "explain": "Input validation failed."
+                },
                "error": {"code": "INVALID_INPUT", "message": str(errors)},
                "partial_data": None
            }
 
     # Build prompt and call LLM
-    full_prompt = build_prompt(
+    full_prompt = build_prompt(
+        module,
+        input_data,
+        use_envelope=should_use_envelope,
+        use_v22=should_use_v22
+    )
     response = call_llm(full_prompt, model=model)
 
+    # Calculate latency
+    latency_ms = (time.time() - start_time) * 1000
+
     # Parse response
     try:
         output_data = parse_llm_response(response)
     except json.JSONDecodeError as e:
         return {
            "ok": False,
+            "meta": {
+                "confidence": 0.0,
+                "risk": "high",
+                "explain": "Failed to parse LLM response as JSON."
+            },
            "error": {"code": "PARSE_ERROR", "message": f"Failed to parse JSON: {e}"},
            "partial_data": None
        }
 
-    #
-    if
-        result =
+    # Convert to v2.2 envelope
+    if is_v22_envelope(output_data):
+        result = output_data
+    elif is_envelope_response(output_data):
+        # v2.1 envelope -> v2.2
+        result = wrap_v21_to_v22(output_data)
     else:
-        #
-        result =
+        # Legacy format -> v2.2
+        result = convert_legacy_to_envelope(output_data)
 
-    #
-    if
-
-
-
-
-
-
-
-
+    # Add latency to meta
+    if "meta" in result:
+        result["meta"]["latency_ms"] = latency_ms
+        if model:
+            result["meta"]["model"] = model
+
+    # Validate and potentially repair
+    if result.get("ok") and validate_output:
+        # Get data schema (support both "data" and "output" aliases)
+        data_schema = module.get("data_schema") or module.get("output_schema")
+        meta_schema = module.get("meta_schema")
+
+        # Get risk_rule from module.yaml meta config
+        meta_config = module.get("metadata", {}).get("meta", {})
+        risk_rule = meta_config.get("risk_rule", "max_changes_risk")
+
+        if data_schema:
+            data_to_validate = result.get("data", {})
+            errors = validate_data(data_to_validate, data_schema, "Data")
+
+            if errors and enable_repair:
+                # Attempt repair pass
+                result = repair_envelope(result, meta_schema, risk_rule=risk_rule)
+
+                # Re-validate after repair
+                errors = validate_data(result.get("data", {}), data_schema, "Data")
+
+            if errors:
+                return {
+                    "ok": False,
+                    "meta": {
+                        "confidence": 0.0,
+                        "risk": "high",
+                        "explain": "Schema validation failed after repair attempt."
+                    },
+                    "error": {"code": "SCHEMA_VALIDATION_FAILED", "message": str(errors)},
+                    "partial_data": result.get("data")
+                }
+
+        # Validate meta if schema exists
+        if meta_schema:
+            meta_errors = validate_data(result.get("meta", {}), meta_schema, "Meta")
+            if meta_errors and enable_repair:
+                result = repair_envelope(result, meta_schema, risk_rule=risk_rule)
 
     return result
 
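An end-to-end sketch of the reworked `run_module` flow. The module name, input payload, and printed fields are illustrative, and a configured LLM provider for `call_llm` is assumed to be available.

```python
# Illustrative call of the new runner; "code-review" and the input are made up.
from cognitive.runner import run_module

result = run_module(
    "code-review",
    {"code": "def add(a, b): return a + b"},
    use_v22=True,         # force the v2.2 envelope; otherwise auto-detected
    enable_repair=True,   # attempt the lossless repair pass on schema failures
)

if result["ok"]:
    print(result["meta"]["confidence"], result["meta"]["risk"])
    print(result["data"])
else:
    print(result["error"]["code"], result["meta"]["explain"])
```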
@@ -267,10 +596,44 @@ def run_module_legacy(
         validate_input=validate_input,
         validate_output=validate_output,
         model=model,
-        use_envelope=False
+        use_envelope=False,
+        use_v22=False
     )
 
-    if result
-        return result
+    if result.get("ok"):
+        return result.get("data", {})
     else:
-
+        error = result.get("error", {})
+        raise ValueError(f"{error.get('code', 'UNKNOWN')}: {error.get('message', 'Unknown error')}")
+
+
+# =============================================================================
+# Convenience Functions
+# =============================================================================
+
+def extract_meta(result: EnvelopeResponseV22) -> EnvelopeMeta:
+    """Extract meta from v2.2 envelope for routing/logging."""
+    return result.get("meta", {
+        "confidence": 0.5,
+        "risk": "medium",
+        "explain": "No meta available"
+    })
+
+
+def should_escalate(result: EnvelopeResponseV22, confidence_threshold: float = 0.7) -> bool:
+    """Determine if result should be escalated to human review based on meta."""
+    meta = extract_meta(result)
+
+    # Escalate if low confidence
+    if meta.get("confidence", 0) < confidence_threshold:
+        return True
+
+    # Escalate if high risk
+    if meta.get("risk") == "high":
+        return True
+
+    # Escalate if error
+    if not result.get("ok"):
+        return True
+
+    return False