PyPI - capiscio-sdk - Versions diffs - 0.2.0__py3-none-any.whl - Mend

capiscio-sdk 0.2.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (26) hide show

capiscio_sdk/__init__.py +42 -0
capiscio_sdk/config.py +114 -0
capiscio_sdk/errors.py +69 -0
capiscio_sdk/executor.py +216 -0
capiscio_sdk/infrastructure/__init__.py +5 -0
capiscio_sdk/infrastructure/cache.py +73 -0
capiscio_sdk/infrastructure/rate_limiter.py +110 -0
capiscio_sdk/py.typed +0 -0
capiscio_sdk/scoring/__init__.py +42 -0
capiscio_sdk/scoring/availability.py +299 -0
capiscio_sdk/scoring/compliance.py +314 -0
capiscio_sdk/scoring/trust.py +340 -0
capiscio_sdk/scoring/types.py +353 -0
capiscio_sdk/types.py +234 -0
capiscio_sdk/validators/__init__.py +18 -0
capiscio_sdk/validators/agent_card.py +444 -0
capiscio_sdk/validators/certificate.py +384 -0
capiscio_sdk/validators/message.py +360 -0
capiscio_sdk/validators/protocol.py +162 -0
capiscio_sdk/validators/semver.py +202 -0
capiscio_sdk/validators/signature.py +234 -0
capiscio_sdk/validators/url_security.py +269 -0
capiscio_sdk-0.2.0.dist-info/METADATA +221 -0
capiscio_sdk-0.2.0.dist-info/RECORD +26 -0
capiscio_sdk-0.2.0.dist-info/WHEEL +4 -0
capiscio_sdk-0.2.0.dist-info/licenses/LICENSE +190 -0

capiscio_sdk/scoring/trust.py ADDED Viewed

@@ -0,0 +1,340 @@
+"""Trust scorer for security and authenticity signals.
+Calculates trust score (0-100) based on:
+- Cryptographic signatures (40 points)
+- Provider information (25 points)
+- Security configuration (20 points)
+- Documentation and transparency (15 points)
+Applies confidence multiplier based on signature state:
+- Valid signature: 1.0x (full confidence)
+- No signature: 0.6x (unverified claims)
+- Invalid signature: 0.4x (active distrust)
+"""
+from typing import Any, Dict, List
+from ..types import ValidationIssue
+from .types import (
+    TrustScore,
+    TrustBreakdown,
+    SignaturesBreakdown,
+    ProviderBreakdown,
+    SecurityBreakdown,
+    DocumentationBreakdown,
+    get_trust_rating,
+    get_trust_confidence_multiplier,
+)
+class TrustScorer:
+    """Calculates trust scores for security and authenticity signals."""
+    def score_agent_card(
+        self,
+        card_data: Dict[str, Any],
+        issues: List[ValidationIssue],
+        skip_signature_verification: bool = False
+    ) -> TrustScore:
+        """Calculate trust score for an agent card.
+        Args:
+            card_data: Agent card data dictionary
+            issues: List of validation issues found
+            skip_signature_verification: Whether signature verification was skipped
+        Returns:
+            TrustScore with detailed breakdown
+        """
+        # Calculate each component
+        signatures = self._score_signatures(card_data, issues, skip_signature_verification)
+        provider = self._score_provider(card_data, issues)
+        security = self._score_security(card_data, issues)
+        documentation = self._score_documentation(card_data)
+        # Calculate raw score
+        raw_score = (
+            signatures.score +
+            provider.score +
+            security.score +
+            documentation.score
+        )
+        raw_score = max(0, min(100, raw_score))
+        # Apply confidence multiplier
+        confidence_multiplier = get_trust_confidence_multiplier(
+            has_valid_signature=signatures.has_valid_signature,
+            has_invalid_signature=signatures.has_invalid_signature
+        )
+        total = int(raw_score * confidence_multiplier)
+        # Create breakdown
+        breakdown = TrustBreakdown(
+            signatures=signatures,
+            provider=provider,
+            security=security,
+            documentation=documentation
+        )
+        # Extract issue messages
+        issue_messages = [
+            issue.message for issue in issues
+            if self._is_trust_issue(issue)
+        ]
+        return TrustScore(
+            total=total,
+            raw_score=raw_score,
+            confidence_multiplier=confidence_multiplier,
+            rating=get_trust_rating(total),
+            breakdown=breakdown,
+            issues=issue_messages,
+            partial_validation=skip_signature_verification
+        )
+    def _score_signatures(
+        self,
+        card_data: Dict[str, Any],
+        issues: List[ValidationIssue],
+        skip_verification: bool
+    ) -> SignaturesBreakdown:
+        """Score cryptographic signatures (40 points).
+        Args:
+            card_data: Agent card data
+            issues: Validation issues
+            skip_verification: Whether verification was skipped
+        Returns:
+            SignaturesBreakdown with signature metrics
+        """
+        score = 0
+        tested = not skip_verification
+        has_valid = False
+        multiple_sigs = False
+        covers_all = False
+        is_recent = False
+        has_invalid = False
+        has_expired = False
+        if tested:
+            # Check for valid signature (25 points)
+            has_valid = not self._has_issue_code(issues, [
+                "SIGNATURE_VERIFICATION_FAILED",
+                "MISSING_SIGNATURE"
+            ])
+            if has_valid:
+                score += 25
+            # Check for invalid signature
+            has_invalid = self._has_issue_code(issues, "SIGNATURE_VERIFICATION_FAILED")
+            # Check for expired signature
+            has_expired = self._has_issue_code(issues, "SIGNATURE_EXPIRED")
+            # Check for multiple signatures (5 points)
+            signatures = card_data.get("signatures", [])
+            if isinstance(signatures, list) and len(signatures) > 1:
+                multiple_sigs = True
+                score += 5
+            # Check if signature covers all fields (5 points)
+            # In practice, this would verify the JWS payload includes all card fields
+            if has_valid and not self._has_issue_code(issues, "INCOMPLETE_SIGNATURE_COVERAGE"):
+                covers_all = True
+                score += 5
+            # Check if signature is recent (5 points)
+            # Signatures less than 90 days old
+            if has_valid and not has_expired:
+                is_recent = True
+                score += 5
+        return SignaturesBreakdown(
+            score=score,
+            max_score=40,
+            tested=tested,
+            has_valid_signature=has_valid,
+            multiple_signatures=multiple_sigs,
+            covers_all_fields=covers_all,
+            is_recent=is_recent,
+            has_invalid_signature=has_invalid,
+            has_expired_signature=has_expired
+        )
+    def _score_provider(
+        self,
+        card_data: Dict[str, Any],
+        issues: List[ValidationIssue]
+    ) -> ProviderBreakdown:
+        """Score provider information (25 points).
+        Args:
+            card_data: Agent card data
+            issues: Validation issues
+        Returns:
+            ProviderBreakdown with provider metrics
+        """
+        score = 0
+        provider = card_data.get("provider", {})
+        # Ensure provider is a dict (defensive coding for validation errors)
+        if not isinstance(provider, dict):
+            provider = {}
+        # Check for organization (10 points)
+        has_org = bool(provider.get("organization"))
+        if has_org:
+            score += 10
+        # Check for provider URL (10 points)
+        has_url = bool(provider.get("url"))
+        if has_url:
+            score += 10
+        # Check if URL is reachable (5 points)
+        # This would require network test, so we check if no related errors
+        url_reachable = None
+        if has_url and not self._has_issue_code(issues, ["PROVIDER_URL_UNREACHABLE"]):
+            url_reachable = True
+            score += 5
+        elif has_url:
+            url_reachable = False
+        return ProviderBreakdown(
+            score=score,
+            max_score=25,
+            tested=True,
+            has_organization=has_org,
+            has_url=has_url,
+            url_reachable=url_reachable
+        )
+    def _score_security(
+        self,
+        card_data: Dict[str, Any],
+        issues: List[ValidationIssue]
+    ) -> SecurityBreakdown:
+        """Score security configuration (20 points).
+        Args:
+            card_data: Agent card data
+            issues: Validation issues
+        Returns:
+            SecurityBreakdown with security metrics
+        """
+        score = 0
+        # Check HTTPS only (10 points)
+        has_http = self._has_issue_code(issues, ["INSECURE_URL", "HTTP_URL_FOUND"])
+        https_only = not has_http
+        if https_only:
+            score += 10
+        # Check for security schemes (5 points)
+        capabilities = card_data.get("capabilities", {})
+        # Ensure capabilities is a dict (defensive coding for validation errors)
+        if not isinstance(capabilities, dict):
+            capabilities = {}
+        security_schemes = capabilities.get("securitySchemes", [])
+        has_security_schemes = bool(security_schemes)
+        if has_security_schemes:
+            score += 5
+        # Check for strong auth (5 points)
+        # OAuth2, API Key, or other authentication
+        has_strong_auth = False
+        if has_security_schemes:
+            for scheme in security_schemes:
+                scheme_type = scheme.get("type", "").lower()
+                if scheme_type in ["oauth2", "apikey", "http"]:
+                    has_strong_auth = True
+                    break
+        if has_strong_auth:
+            score += 5
+        return SecurityBreakdown(
+            score=score,
+            max_score=20,
+            https_only=https_only,
+            has_security_schemes=has_security_schemes,
+            has_strong_auth=has_strong_auth,
+            has_http_urls=has_http
+        )
+    def _score_documentation(self, card_data: Dict[str, Any]) -> DocumentationBreakdown:
+        """Score documentation and transparency (15 points).
+        Args:
+            card_data: Agent card data
+        Returns:
+            DocumentationBreakdown with documentation metrics
+        """
+        score = 0
+        # Check for documentation URL (5 points)
+        has_docs = bool(card_data.get("documentationUrl"))
+        if has_docs:
+            score += 5
+        # Check for terms of service (5 points)
+        has_tos = bool(card_data.get("termsOfService"))
+        if has_tos:
+            score += 5
+        # Check for privacy policy (5 points)
+        has_privacy = bool(card_data.get("privacyPolicy"))
+        if has_privacy:
+            score += 5
+        return DocumentationBreakdown(
+            score=score,
+            max_score=15,
+            has_documentation_url=has_docs,
+            has_terms_of_service=has_tos,
+            has_privacy_policy=has_privacy
+        )
+    def _is_trust_issue(self, issue: ValidationIssue) -> bool:
+        """Check if issue is trust-related.
+        Args:
+            issue: Validation issue to check
+        Returns:
+            True if trust-related
+        """
+        trust_codes = {
+            "SIGNATURE_VERIFICATION_FAILED",
+            "MISSING_SIGNATURE",
+            "SIGNATURE_EXPIRED",
+            "INCOMPLETE_SIGNATURE_COVERAGE",
+            "INSECURE_URL",
+            "HTTP_URL_FOUND",
+            "PROVIDER_URL_UNREACHABLE",
+            "SSRF_RISK",
+            "PRIVATE_IP",
+        }
+        return issue.code in trust_codes
+    def _has_issue_code(
+        self,
+        issues: List[ValidationIssue],
+        codes: str | List[str]
+    ) -> bool:
+        """Check if any issue has given code(s).
+        Args:
+            issues: List of validation issues
+            codes: Single code or list of codes to check
+        Returns:
+            True if any issue matches
+        """
+        if isinstance(codes, str):
+            codes = [codes]
+        code_set = set(codes)
+        return any(issue.code in code_set for issue in issues)

capiscio_sdk/scoring/types.py ADDED Viewed

@@ -0,0 +1,353 @@
+"""Type definitions for multi-dimensional scoring system.
+Defines the three core score types (Compliance, Trust, Availability),
+their breakdown structures, rating enums, and helper functions.
+"""
+from dataclasses import dataclass, field
+from enum import Enum
+from typing import List, Optional
+# ============================================================================
+# Rating Enums
+# ============================================================================
+class ComplianceRating(str, Enum):
+    """Compliance score rating levels.
+    Members are also ``str`` instances, so each compares equal to its label
+    text. The thresholds noted per member are the ones applied by
+    ``get_compliance_rating``.
+    """
+    PERFECT = "Perfect"  # score == 100
+    EXCELLENT = "Excellent"  # score >= 90 (and not exactly 100)
+    GOOD = "Good"  # score >= 75
+    FAIR = "Fair"  # score >= 60
+    POOR = "Poor"  # anything lower
+class TrustRating(str, Enum):
+    """Trust score rating levels.
+    Members are also ``str`` instances, so each compares equal to its label
+    text. The thresholds noted per member are the ones applied by
+    ``get_trust_rating`` to the score after the confidence multiplier.
+    """
+    HIGHLY_TRUSTED = "Highly Trusted"  # score >= 80
+    TRUSTED = "Trusted"  # score >= 60
+    MODERATE_TRUST = "Moderate Trust"  # score >= 40
+    LOW_TRUST = "Low Trust"  # score >= 20
+    UNTRUSTED = "Untrusted"  # anything lower
+class AvailabilityRating(str, Enum):
+    """Availability score rating levels.
+    Members are also ``str`` instances, so each compares equal to its label
+    text. The thresholds noted per member are the ones applied by
+    ``get_availability_rating``.
+    """
+    FULLY_AVAILABLE = "Fully Available"  # score >= 95
+    AVAILABLE = "Available"  # score >= 80
+    DEGRADED = "Degraded"  # score >= 60
+    UNSTABLE = "Unstable"  # score >= 40
+    UNAVAILABLE = "Unavailable"  # anything lower
+# ============================================================================
+# Breakdown Structures
+# ============================================================================
+@dataclass
+class CoreFieldsBreakdown:
+    """Breakdown for core required fields scoring.
+    Only ``score`` is required; every other field has a default.
+    """
+    score: int  # points awarded for this component
+    max_score: int = 60  # ceiling for this component
+    # default_factory gives every instance its own list (no shared mutable default).
+    # Presumably the names of core fields found / not found - confirm against the compliance scorer.
+    present: List[str] = field(default_factory=list)
+    missing: List[str] = field(default_factory=list)
+@dataclass
+class SkillsQualityBreakdown:
+    """Breakdown for skills quality scoring.
+    Only ``score`` is required; the flags default to False and the counter to 0.
+    """
+    score: int  # points awarded for this component
+    max_score: int = 20  # ceiling for this component
+    # Flag and counter meanings follow their names; the code that fills them
+    # is not part of this module - confirm against the compliance scorer.
+    skills_present: bool = False
+    all_skills_have_required_fields: bool = False
+    all_skills_have_tags: bool = False
+    issue_count: int = 0
+@dataclass
+class FormatComplianceBreakdown:
+    """Breakdown for format compliance scoring.
+    Only ``score`` is required; every validity flag defaults to False.
+    """
+    score: int  # points awarded for this component
+    max_score: int = 15  # ceiling for this component
+    # One flag per format check; the code that sets them is not part of this
+    # module - confirm exact semantics against the compliance scorer.
+    valid_semver: bool = False
+    valid_protocol_version: bool = False
+    valid_url: bool = False
+    valid_transports: bool = False
+    valid_mime_types: bool = False
+@dataclass
+class DataQualityBreakdown:
+    """Breakdown for data quality scoring.
+    Only ``score`` is required; every flag defaults to False.
+    """
+    score: int  # points awarded for this component
+    max_score: int = 5  # ceiling for this component
+    # Flags are phrased positively (True is the good state); the code that
+    # sets them is not part of this module - confirm against the compliance scorer.
+    no_duplicate_skill_ids: bool = False
+    field_lengths_valid: bool = False
+    no_ssrf_risks: bool = False
+@dataclass
+class ComplianceBreakdown:
+    """Complete compliance score breakdown (100 points total).
+    The default ceilings of the four parts add up to 100 (60 + 20 + 15 + 5).
+    All four parts are required.
+    """
+    core_fields: CoreFieldsBreakdown  # default ceiling 60
+    skills_quality: SkillsQualityBreakdown  # default ceiling 20
+    format_compliance: FormatComplianceBreakdown  # default ceiling 15
+    data_quality: DataQualityBreakdown  # default ceiling 5
+@dataclass
+class SignaturesBreakdown:
+    """Breakdown for signature validation scoring.
+    Only ``score`` is required; every flag defaults to False, which is also
+    the state of an untested signature component.
+    """
+    score: int  # points awarded for this component
+    max_score: int = 40  # ceiling for this component
+    tested: bool = False  # whether signature verification was part of the run
+    has_valid_signature: bool = False
+    multiple_signatures: bool = False
+    covers_all_fields: bool = False
+    is_recent: bool = False
+    # The two flags below record negative findings; has_invalid_signature is
+    # one of the inputs of get_trust_confidence_multiplier.
+    has_invalid_signature: bool = False
+    has_expired_signature: bool = False
+@dataclass
+class ProviderBreakdown:
+    """Breakdown for provider information scoring.
+    Only ``score`` is required; every other field has a default.
+    """
+    score: int  # points awarded for this component
+    max_score: int = 25  # ceiling for this component
+    tested: bool = False
+    has_organization: bool = False
+    has_url: bool = False
+    # Tri-state: None leaves reachability undetermined, True/False record a verdict.
+    url_reachable: Optional[bool] = None
+@dataclass
+class SecurityBreakdown:
+    """Breakdown for security configuration scoring.
+    Only ``score`` is required; every flag defaults to False.
+    """
+    score: int  # points awarded for this component
+    max_score: int = 20  # ceiling for this component
+    https_only: bool = False
+    has_security_schemes: bool = False
+    has_strong_auth: bool = False
+    # NOTE(review): looks like the inverse of https_only - confirm both are always set together.
+    has_http_urls: bool = False
+@dataclass
+class DocumentationBreakdown:
+    """Breakdown for documentation and transparency scoring.
+    Only ``score`` is required; every flag defaults to False.
+    """
+    score: int  # points awarded for this component
+    max_score: int = 15  # ceiling for this component
+    # One flag per transparency artefact the card may declare.
+    has_documentation_url: bool = False
+    has_terms_of_service: bool = False
+    has_privacy_policy: bool = False
+@dataclass
+class TrustBreakdown:
+    """Complete trust score breakdown (100 points before multiplier).
+    The default ceilings of the four parts add up to 100 (40 + 25 + 20 + 15).
+    All four parts are required.
+    """
+    signatures: SignaturesBreakdown  # default ceiling 40
+    provider: ProviderBreakdown  # default ceiling 25
+    security: SecurityBreakdown  # default ceiling 20
+    documentation: DocumentationBreakdown  # default ceiling 15
+@dataclass
+class PrimaryEndpointBreakdown:
+    """Breakdown for primary endpoint scoring.
+    Only ``score`` is required; every other field has a default.
+    """
+    score: int  # points awarded for this component
+    max_score: int = 50  # ceiling for this component
+    responds: bool = False
+    # Optional fields default to None, i.e. no measurement recorded.
+    response_time: Optional[float] = None  # unit not stated here - TODO confirm (seconds vs. milliseconds)
+    has_cors: Optional[bool] = None
+    valid_tls: Optional[bool] = None
+    # default_factory gives every instance its own list (no shared mutable default).
+    errors: List[str] = field(default_factory=list)
+@dataclass
+class TransportSupportBreakdown:
+    """Breakdown for transport protocol support scoring.
+    Only ``score`` is required; the flag defaults to False and the counters to 0.
+    """
+    score: int  # points awarded for this component
+    max_score: int = 30  # ceiling for this component
+    preferred_transport_works: bool = False
+    # Counts of additional interfaces by outcome; the code that fills them is
+    # not part of this module - confirm against the availability scorer.
+    additional_interfaces_working: int = 0
+    additional_interfaces_failed: int = 0
+@dataclass
+class ResponseQualityBreakdown:
+    """Breakdown for response quality scoring.
+    Only ``score`` is required; every flag defaults to False.
+    """
+    score: int  # points awarded for this component
+    max_score: int = 20  # ceiling for this component
+    # One flag per response check; the code that sets them is not part of this
+    # module - confirm exact semantics against the availability scorer.
+    valid_structure: bool = False
+    proper_content_type: bool = False
+    proper_error_handling: bool = False
+@dataclass
+class AvailabilityBreakdown:
+    """Complete availability score breakdown (100 points total).
+    The default ceilings of the three parts add up to 100 (50 + 30 + 20).
+    All three parts are required.
+    """
+    primary_endpoint: PrimaryEndpointBreakdown  # default ceiling 50
+    transport_support: TransportSupportBreakdown  # default ceiling 30
+    response_quality: ResponseQualityBreakdown  # default ceiling 20
+# ============================================================================
+# Core Score Types
+# ============================================================================
+@dataclass
+class ComplianceScore:
+    """Compliance score (0-100): Measures A2A specification adherence.
+    Always calculated consistently regardless of validation flags.
+    """
+    total: int
+    rating: ComplianceRating
+    breakdown: ComplianceBreakdown
+    issues: List[str] = field(default_factory=list)
+    def __post_init__(self) -> None:
+        """Validate score is in range."""
+        assert 0 <= self.total <= 100, f"Invalid compliance score: {self.total}"
+@dataclass
+class TrustScore:
+    """Trust score (0-100): Measures security and authenticity signals.
+    Includes confidence multiplier based on signature presence.
+    """
+    total: int  # After confidence multiplier
+    raw_score: int  # Before multiplier
+    confidence_multiplier: float  # 1.0x, 0.6x, or 0.4x
+    rating: TrustRating
+    breakdown: TrustBreakdown
+    issues: List[str] = field(default_factory=list)
+    partial_validation: bool = False
+    def __post_init__(self) -> None:
+        """Validate score is in range."""
+        assert 0 <= self.total <= 100, f"Invalid trust score: {self.total}"
+        assert 0 <= self.raw_score <= 100, f"Invalid raw trust score: {self.raw_score}"
+        assert self.confidence_multiplier in (0.4, 0.6, 1.0), \
+            f"Invalid confidence multiplier: {self.confidence_multiplier}"
+@dataclass
+class AvailabilityScore:
+    """Availability score (0-100): Measures operational readiness.
+    Only calculated when network tests are enabled (not schema-only mode).
+    """
+    total: Optional[int]  # None if not tested
+    rating: Optional[AvailabilityRating]
+    breakdown: Optional[AvailabilityBreakdown]
+    issues: List[str] = field(default_factory=list)
+    tested: bool = False
+    not_tested_reason: Optional[str] = None
+    def __post_init__(self) -> None:
+        """Validate score is in range if present."""
+        if self.total is not None:
+            assert 0 <= self.total <= 100, f"Invalid availability score: {self.total}"
+# ============================================================================
+# Context & Helpers
+# ============================================================================
+@dataclass
+class ScoringContext:
+    """Context about what validation was performed.
+    All flags default to False, so ``ScoringContext()`` can be built without
+    arguments.
+    """
+    # Flag meanings follow their names; the code that reads them is not part
+    # of this module - confirm against the scorers.
+    schema_only: bool = False
+    skip_signature_verification: bool = False
+    test_live: bool = False
+    strict_mode: bool = False
+# ============================================================================
+# Rating Helper Functions
+# ============================================================================
+def get_compliance_rating(score: int) -> ComplianceRating:
+    """Get compliance rating based on score.
+    Args:
+        score: Compliance score (0-100)
+    Returns:
+        ComplianceRating enum value
+    """
+    if score == 100:
+        return ComplianceRating.PERFECT
+    if score >= 90:
+        return ComplianceRating.EXCELLENT
+    if score >= 75:
+        return ComplianceRating.GOOD
+    if score >= 60:
+        return ComplianceRating.FAIR
+    return ComplianceRating.POOR
+def get_trust_rating(score: int) -> TrustRating:
+    """Get trust rating based on score.
+    Args:
+        score: Trust score (0-100, after confidence multiplier)
+    Returns:
+        TrustRating enum value
+    """
+    if score >= 80:
+        return TrustRating.HIGHLY_TRUSTED
+    if score >= 60:
+        return TrustRating.TRUSTED
+    if score >= 40:
+        return TrustRating.MODERATE_TRUST
+    if score >= 20:
+        return TrustRating.LOW_TRUST
+    return TrustRating.UNTRUSTED
+def get_availability_rating(score: int) -> AvailabilityRating:
+    """Get availability rating based on score.
+    Args:
+        score: Availability score (0-100)
+    Returns:
+        AvailabilityRating enum value
+    """
+    if score >= 95:
+        return AvailabilityRating.FULLY_AVAILABLE
+    if score >= 80:
+        return AvailabilityRating.AVAILABLE
+    if score >= 60:
+        return AvailabilityRating.DEGRADED
+    if score >= 40:
+        return AvailabilityRating.UNSTABLE
+    return AvailabilityRating.UNAVAILABLE
+def get_trust_confidence_multiplier(
+    has_valid_signature: bool,
+    has_invalid_signature: bool
+) -> float:
+    """Get trust confidence multiplier based on signature state.
+    Args:
+        has_valid_signature: Whether a valid signature exists
+        has_invalid_signature: Whether an invalid signature exists
+    Returns:
+        Confidence multiplier: 1.0x (valid), 0.6x (none), or 0.4x (invalid)
+    """
+    if has_invalid_signature:
+        return 0.4  # Active distrust
+    if has_valid_signature:
+        return 1.0  # Full confidence
+    return 0.6  # Unverified claims