PyPI - cloudwright-ai - Versions diffs - 0.1.0__py3-none-any.whl - Mend

cloudwright-ai 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (81) hide show

cloudwright/__init__.py +100 -0
cloudwright/adapters/__init__.py +79 -0
cloudwright/adapters/aws.py +314 -0
cloudwright/adapters/azure.py +274 -0
cloudwright/adapters/gcp.py +305 -0
cloudwright/analyzer.py +180 -0
cloudwright/architect.py +603 -0
cloudwright/catalog/__init__.py +26 -0
cloudwright/catalog/formula.py +257 -0
cloudwright/catalog/refresh.py +248 -0
cloudwright/catalog/store.py +672 -0
cloudwright/cost.py +281 -0
cloudwright/data/catalog.db +0 -0
cloudwright/data/registry/analytics.yaml +32 -0
cloudwright/data/registry/cache.yaml +64 -0
cloudwright/data/registry/compute.yaml +78 -0
cloudwright/data/registry/containers.yaml +116 -0
cloudwright/data/registry/database_nosql.yaml +33 -0
cloudwright/data/registry/database_relational.yaml +96 -0
cloudwright/data/registry/messaging.yaml +47 -0
cloudwright/data/registry/ml.yaml +32 -0
cloudwright/data/registry/networking_api.yaml +31 -0
cloudwright/data/registry/networking_cdn.yaml +29 -0
cloudwright/data/registry/networking_dns.yaml +31 -0
cloudwright/data/registry/networking_lb.yaml +77 -0
cloudwright/data/registry/orchestration.yaml +32 -0
cloudwright/data/registry/security_auth.yaml +29 -0
cloudwright/data/registry/security_waf.yaml +31 -0
cloudwright/data/registry/serverless.yaml +74 -0
cloudwright/data/registry/storage_block.yaml +31 -0
cloudwright/data/registry/storage_object.yaml +71 -0
cloudwright/data/registry/streaming.yaml +32 -0
cloudwright/data/templates/_index.yaml +99 -0
cloudwright/data/templates/azure-microservices.yaml +81 -0
cloudwright/data/templates/azure-serverless-api.yaml +49 -0
cloudwright/data/templates/azure-three-tier-web.yaml +59 -0
cloudwright/data/templates/batch-processing.yaml +103 -0
cloudwright/data/templates/data-lake.yaml +91 -0
cloudwright/data/templates/event-driven.yaml +89 -0
cloudwright/data/templates/gcp-microservices.yaml +90 -0
cloudwright/data/templates/gcp-serverless-api.yaml +48 -0
cloudwright/data/templates/gcp-three-tier-web.yaml +59 -0
cloudwright/data/templates/microservices.yaml +131 -0
cloudwright/data/templates/ml_pipeline.yaml +60 -0
cloudwright/data/templates/serverless_api.yaml +60 -0
cloudwright/data/templates/static-site.yaml +92 -0
cloudwright/data/templates/three_tier_web.yaml +59 -0
cloudwright/differ.py +237 -0
cloudwright/drift.py +90 -0
cloudwright/evolution.py +63 -0
cloudwright/exporter/__init__.py +105 -0
cloudwright/exporter/aibom.py +104 -0
cloudwright/exporter/cloudformation.py +218 -0
cloudwright/exporter/compliance_report.py +161 -0
cloudwright/exporter/d2.py +82 -0
cloudwright/exporter/mermaid.py +69 -0
cloudwright/exporter/sbom.py +68 -0
cloudwright/exporter/terraform.py +1003 -0
cloudwright/importer/__init__.py +78 -0
cloudwright/importer/cloudformation.py +368 -0
cloudwright/importer/terraform_state.py +320 -0
cloudwright/importer/utils.py +45 -0
cloudwright/linter.py +255 -0
cloudwright/llm/__init__.py +45 -0
cloudwright/llm/anthropic.py +42 -0
cloudwright/llm/base.py +14 -0
cloudwright/llm/openai.py +42 -0
cloudwright/plugins.py +73 -0
cloudwright/policy.py +204 -0
cloudwright/providers/__init__.py +59 -0
cloudwright/providers/aws.py +172 -0
cloudwright/providers/azure.py +151 -0
cloudwright/providers/gcp.py +151 -0
cloudwright/py.typed +0 -0
cloudwright/registry.py +223 -0
cloudwright/scorer.py +369 -0
cloudwright/spec.py +185 -0
cloudwright/validator.py +841 -0
cloudwright_ai-0.1.0.dist-info/METADATA +541 -0
cloudwright_ai-0.1.0.dist-info/RECORD +81 -0
cloudwright_ai-0.1.0.dist-info/WHEEL +4 -0

cloudwright/__init__.py ADDED Viewed

@@ -0,0 +1,100 @@
+"""Cloudwright — Architecture intelligence for cloud engineers."""
+from cloudwright.spec import (
+    Alternative,
+    ArchSpec,
+    ArchVersion,
+    Component,
+    ComponentChange,
+    ComponentCost,
+    Connection,
+    ConnectionChange,
+    Constraints,
+    CostEstimate,
+    DiffResult,
+    ValidationCheck,
+    ValidationResult,
+)
+__version__ = "0.1.0"
+# Public API of the package.  The names imported from cloudwright.spec above
+# are bound eagerly at import time; every other entry is resolved on first
+# access by the module-level __getattr__ defined below, so the module that
+# provides it is only imported when the name is actually requested.
+__all__ = [
+    "Alternative",
+    "ArchSpec",
+    "ArchVersion",
+    "Architect",
+    "Catalog",
+    "ConversationSession",
+    "Component",
+    "ComponentChange",
+    "ComponentCost",
+    "Connection",
+    "ConnectionChange",
+    "Constraints",
+    "CostEstimate",
+    "create_version",
+    "detect_drift",
+    "diff_versions",
+    "Differ",
+    "DiffResult",
+    "DriftReport",
+    "get_timeline",
+    "LintWarning",
+    "lint",
+    "ValidationCheck",
+    "ValidationResult",
+    "Validator",
+]
+def __getattr__(name: str):
+    # Lazy imports for heavy modules that need LLM/DB
+    if name == "Architect":
+        from cloudwright.architect import Architect
+        return Architect
+    if name == "ConversationSession":
+        from cloudwright.architect import ConversationSession
+        return ConversationSession
+    if name == "Catalog":
+        from cloudwright.catalog import Catalog
+        return Catalog
+    if name == "Differ":
+        from cloudwright.differ import Differ
+        return Differ
+    if name == "Validator":
+        from cloudwright.validator import Validator
+        return Validator
+    if name == "lint":
+        from cloudwright.linter import lint
+        return lint
+    if name == "LintWarning":
+        from cloudwright.linter import LintWarning
+        return LintWarning
+    if name == "detect_drift":
+        from cloudwright.drift import detect_drift
+        return detect_drift
+    if name == "DriftReport":
+        from cloudwright.drift import DriftReport
+        return DriftReport
+    if name == "create_version":
+        from cloudwright.evolution import create_version
+        return create_version
+    if name == "get_timeline":
+        from cloudwright.evolution import get_timeline
+        return get_timeline
+    if name == "diff_versions":
+        from cloudwright.evolution import diff_versions
+        return diff_versions
+    raise AttributeError(f"module 'cloudwright' has no attribute {name!r}")

cloudwright/adapters/__init__.py ADDED Viewed

@@ -0,0 +1,79 @@
+"""Cloud pricing adapters — fetch live pricing data from provider APIs."""
+from __future__ import annotations
+import ssl
+import urllib.request
+from abc import ABC, abstractmethod
+from dataclasses import dataclass
+from typing import Iterator
+def _ssl_context() -> ssl.SSLContext:
+    """Create an SSL context using certifi CA bundle (macOS workaround)."""
+    try:
+        import certifi
+        return ssl.create_default_context(cafile=certifi.where())
+    except ImportError:
+        return ssl.create_default_context()
+def urlopen_safe(req: urllib.request.Request, timeout: int = 30) -> bytes:
+    """urlopen with certifi SSL — use this instead of raw urllib.request.urlopen."""
+    ctx = _ssl_context()
+    with urllib.request.urlopen(req, timeout=timeout, context=ctx) as resp:
+        return resp.read()
+@dataclass
+class InstancePrice:
+    """Pricing record for a compute instance type.
+    Produced by PricingAdapter.fetch_instance_pricing; the last four fields
+    have defaults so an adapter only has to supply them when it knows better.
+    """
+    instance_type: str
+    region: str
+    vcpus: int
+    # The AWS adapter fills this from a value parsed as GiB.
+    memory_gb: float
+    # NOTE(review): currency is not recorded here; presumably USD - confirm.
+    price_per_hour: float
+    price_type: str = "on_demand"  # on_demand | reserved_1yr | reserved_3yr | spot
+    os: str = "linux"
+    # Free-form descriptive text; empty string when the adapter has none.
+    storage_desc: str = ""
+    network_bandwidth: str = ""
+@dataclass
+class ManagedServicePrice:
+    """Pricing record for a managed service tier.
+    NOTE(review): the unit behind ``price_per_month`` is not uniform.  The AWS
+    adapter stores a per-million-requests figure for Lambda and DynamoDB
+    request tiers and a per-GB-month figure for S3 storage, so the value has
+    to be interpreted together with ``tier_name``.
+    """
+    service: str
+    tier_name: str
+    # The AWS adapter sets this to 0.0 for tiers that are not billed hourly.
+    price_per_hour: float
+    price_per_month: float
+    description: str = ""
+    # Sizing fields default to zero; the AWS adapter only fills them for RDS.
+    vcpus: int = 0
+    memory_gb: float = 0.0
+class PricingAdapter(ABC):
+    """Abstract base for cloud pricing data adapters.
+    Subclasses fetch live pricing from provider-specific APIs and return
+    normalized InstancePrice / ManagedServicePrice records for catalog ingestion.
+    All three methods are abstract, so a subclass must implement each of them
+    before it can be instantiated.
+    """
+    # Annotation only - no value is assigned here; concrete adapters set it.
+    provider: str  # "aws" | "gcp" | "azure"
+    @abstractmethod
+    def fetch_instance_pricing(self, region: str) -> Iterator[InstancePrice]:
+        """Yield compute instance prices for the given region."""
+    @abstractmethod
+    def fetch_managed_service_pricing(self, service: str, region: str) -> list[ManagedServicePrice]:
+        """Return pricing tiers for a managed service in the given region.
+        *service* is one of the keys reported by supported_managed_services().
+        """
+    @abstractmethod
+    def supported_managed_services(self) -> list[str]:
+        """List of managed service keys this adapter can fetch pricing for."""
+__all__ = ["InstancePrice", "ManagedServicePrice", "PricingAdapter"]

cloudwright/adapters/aws.py ADDED Viewed

@@ -0,0 +1,314 @@
+"""AWS Pricing API adapter.
+Streams EC2 instance pricing from the AWS Bulk Pricing CSV (region-scoped)
+and parses managed service pricing from the AWS JSON Pricing API for
+Lambda, S3, RDS, and DynamoDB.
+"""
+from __future__ import annotations
+import csv
+import io
+import json
+import re
+import urllib.error
+import urllib.request
+from typing import Any, Iterator
+from cloudwright.adapters import InstancePrice, ManagedServicePrice, PricingAdapter, urlopen_safe
+# Base URL of the bulk pricing endpoint; offer files are requested below it
+# as /offers/v1.0/aws/<offer code>/current/... by the adapter.
+_PRICING_BASE = "https://pricing.us-east-1.amazonaws.com"
+# Default HTTP timeout used by AWSPricingAdapter when none is passed in.
+_TIMEOUT = 30  # seconds
+# AWS region code -> location name used in the pricing API.
+# Regions missing from this map are not rejected: lookups use
+# .get(region, region), so the raw region code is compared instead.
+_REGION_TO_LOCATION: dict[str, str] = {
+    "us-east-1": "US East (N. Virginia)",
+    "us-east-2": "US East (Ohio)",
+    "us-west-1": "US West (N. California)",
+    "us-west-2": "US West (Oregon)",
+    "eu-west-1": "EU (Ireland)",
+    "eu-west-2": "EU (London)",
+    "eu-central-1": "EU (Frankfurt)",
+    "ap-southeast-1": "Asia Pacific (Singapore)",
+    "ap-southeast-2": "Asia Pacific (Sydney)",
+    "ap-northeast-1": "Asia Pacific (Tokyo)",
+    "ap-south-1": "Asia Pacific (Mumbai)",
+    "ca-central-1": "Canada (Central)",
+    "sa-east-1": "South America (Sao Paulo)",
+}
+def _parse_memory_gib(mem_str: str) -> float:
+    """Parse '16 GiB' or '16,384 MiB' -> float GiB."""
+    m = re.match(r"([\d,]+(?:\.\d+)?)\s*(GiB|MiB)", mem_str.strip())
+    if not m:
+        return 0.0
+    value = float(m.group(1).replace(",", ""))
+    return value / 1024 if m.group(2) == "MiB" else value
+def _safe_int(val: str) -> int:
+    try:
+        return int(val)
+    except (ValueError, TypeError):
+        return 0
+def _safe_float(val: str | float) -> float:
+    try:
+        return float(val)
+    except (ValueError, TypeError):
+        return 0.0
+def _first_price(terms: dict) -> float:
+    """Extract the first USD price from a terms dict."""
+    for term in terms.values():
+        for dim in term.get("priceDimensions", {}).values():
+            p = _safe_float(dim.get("pricePerUnit", {}).get("USD", "0"))
+            if p > 0:
+                return p
+    return 0.0
+class AWSPricingAdapter(PricingAdapter):
+    """Fetches AWS pricing from the bulk pricing API.
+    EC2 pricing is streamed from the CSV index (large file; streamed to avoid
+    loading the full ~1 GB decompressed CSV into memory at once).
+    Managed service pricing uses the JSON API.
+    """
+    provider = "aws"
+    def __init__(self, timeout: int = _TIMEOUT):
+        self._timeout = timeout
+    # Public interface
+    def fetch_instance_pricing(self, region: str = "us-east-1") -> Iterator[InstancePrice]:
+        """Stream on-demand Linux EC2 instance prices for the given region."""
+        url = f"{_PRICING_BASE}/offers/v1.0/aws/AmazonEC2/current/{region}/index.csv"
+        data = self._get(url)
+        yield from self._parse_ec2_csv(data, region)
+    def fetch_managed_service_pricing(self, service: str, region: str = "us-east-1") -> list[ManagedServicePrice]:
+        """Return pricing tiers for a supported managed service."""
+        parsers = {
+            "lambda": self._parse_lambda,
+            "s3": self._parse_s3,
+            "rds": self._parse_rds,
+            "dynamodb": self._parse_dynamodb,
+        }
+        handler = parsers.get(service)
+        return handler(region) if handler else []
+    def supported_managed_services(self) -> list[str]:
+        return ["lambda", "s3", "rds", "dynamodb"]
+    # EC2 CSV parsing
+    def _parse_ec2_csv(self, data: bytes, region: str) -> Iterator[InstancePrice]:
+        """Parse EC2 pricing CSV.
+        The CSV starts with several metadata lines before the actual header row
+        (the one whose first field is 'SKU'). We scan for it and then parse
+        the remainder as standard CSV.
+        """
+        text = data.decode("utf-8", errors="replace")
+        lines = text.splitlines()
+        # Find the header row — first line where field 0 is 'SKU' (quoted or bare)
+        header_idx = 0
+        for i, line in enumerate(lines):
+            stripped = line.strip().strip('"')
+            if stripped.startswith("SKU"):
+                header_idx = i
+                break
+        reader = csv.DictReader(io.StringIO("\n".join(lines[header_idx:])))
+        for row in reader:
+            if (
+                row.get("TermType") == "OnDemand"
+                and row.get("Operating System", "Linux") in ("Linux", "")
+                and row.get("Tenancy", "Shared") == "Shared"
+                and row.get("CapacityStatus", "Used") == "Used"
+                and row.get("Pre Installed S/W", "NA") in ("NA", "")
+                and row.get("productFamily", "Compute Instance") == "Compute Instance"
+            ):
+                price = _safe_float(row.get("PricePerUnit", "0"))
+                if price <= 0:
+                    continue
+                yield InstancePrice(
+                    instance_type=row.get("Instance Type", ""),
+                    region=region,
+                    vcpus=_safe_int(row.get("vCPU", "0")),
+                    memory_gb=_parse_memory_gib(row.get("Memory", "0 GiB")),
+                    price_per_hour=price,
+                    price_type="on_demand",
+                    os="linux",
+                    storage_desc=row.get("Storage", ""),
+                    network_bandwidth=row.get("Network Performance", ""),
+                )
+    # JSON API parsing
+    def _fetch_json(self, offer_code: str, region: str) -> dict[str, Any]:
+        url = f"{_PRICING_BASE}/offers/v1.0/aws/{offer_code}/current/{region}/index.json"
+        return json.loads(self._get(url))
+    def _parse_lambda(self, region: str) -> list[ManagedServicePrice]:
+        data = self._fetch_json("AWSLambda", region)
+        location = _REGION_TO_LOCATION.get(region, region)
+        on_demand = data.get("terms", {}).get("OnDemand", {})
+        prices: list[ManagedServicePrice] = []
+        for sku, product in data.get("products", {}).items():
+            attrs = product.get("attributes", {})
+            if attrs.get("location") not in (location, region):
+                continue
+            sku_terms = on_demand.get(sku, {})
+            for term in sku_terms.values():
+                for dim in term.get("priceDimensions", {}).values():
+                    unit = dim.get("unit", "")
+                    desc = dim.get("description", "")
+                    price = _safe_float(dim.get("pricePerUnit", {}).get("USD", "0"))
+                    if "request" in unit.lower() or "request" in desc.lower():
+                        prices.append(
+                            ManagedServicePrice(
+                                service="lambda",
+                                tier_name="per_request",
+                                price_per_hour=0.0,
+                                # price is per-request; store per-million
+                                price_per_month=round(price * 1_000_000, 4),
+                                description=desc,
+                            )
+                        )
+                    elif "second" in unit.lower() or "gb-second" in unit.lower():
+                        prices.append(
+                            ManagedServicePrice(
+                                service="lambda",
+                                tier_name="per_gb_second",
+                                price_per_hour=round(price * 3600, 6),
+                                price_per_month=0.0,
+                                description=desc,
+                            )
+                        )
+        return prices
+    def _parse_s3(self, region: str) -> list[ManagedServicePrice]:
+        # S3 uses a global index (no region path component)
+        url = f"{_PRICING_BASE}/offers/v1.0/aws/AmazonS3/current/index.json"
+        data = json.loads(self._get(url))
+        location = _REGION_TO_LOCATION.get(region, region)
+        on_demand = data.get("terms", {}).get("OnDemand", {})
+        prices: list[ManagedServicePrice] = []
+        for sku, product in data.get("products", {}).items():
+            attrs = product.get("attributes", {})
+            if attrs.get("location") != location:
+                continue
+            if attrs.get("storageClass") != "General Purpose":
+                continue
+            if attrs.get("volumeType") != "Standard":
+                continue
+            sku_terms = on_demand.get(sku, {})
+            for term in sku_terms.values():
+                for dim in term.get("priceDimensions", {}).values():
+                    price = _safe_float(dim.get("pricePerUnit", {}).get("USD", "0"))
+                    if price > 0:
+                        prices.append(
+                            ManagedServicePrice(
+                                service="s3",
+                                tier_name="standard_storage_gb",
+                                price_per_hour=0.0,
+                                price_per_month=price,  # per GB/month
+                                description=dim.get("description", ""),
+                            )
+                        )
+        return prices
+    def _parse_rds(self, region: str) -> list[ManagedServicePrice]:
+        data = self._fetch_json("AmazonRDS", region)
+        location = _REGION_TO_LOCATION.get(region, region)
+        on_demand = data.get("terms", {}).get("OnDemand", {})
+        prices: list[ManagedServicePrice] = []
+        for sku, product in data.get("products", {}).items():
+            attrs = product.get("attributes", {})
+            if attrs.get("location") not in (location, region):
+                continue
+            if attrs.get("databaseEngine") not in ("PostgreSQL", "MySQL"):
+                continue
+            if attrs.get("deploymentOption") != "Single-AZ":
+                continue
+            db_class = attrs.get("instanceType", "")
+            if not db_class:
+                continue
+            sku_terms = on_demand.get(sku, {})
+            price = _first_price(sku_terms)
+            if price > 0:
+                prices.append(
+                    ManagedServicePrice(
+                        service="rds",
+                        tier_name=db_class,
+                        price_per_hour=price,
+                        price_per_month=round(price * 730, 2),
+                        description=f"{attrs.get('databaseEngine')} {db_class} Single-AZ",
+                        vcpus=_safe_int(attrs.get("vcpu", "0")),
+                        memory_gb=_parse_memory_gib(attrs.get("memory", "0 GiB")),
+                    )
+                )
+        return prices
+    def _parse_dynamodb(self, region: str) -> list[ManagedServicePrice]:
+        data = self._fetch_json("AmazonDynamoDB", region)
+        location = _REGION_TO_LOCATION.get(region, region)
+        on_demand = data.get("terms", {}).get("OnDemand", {})
+        prices: list[ManagedServicePrice] = []
+        for sku, product in data.get("products", {}).items():
+            attrs = product.get("attributes", {})
+            if attrs.get("location") not in (location, region):
+                continue
+            group = attrs.get("group", "")
+            sku_terms = on_demand.get(sku, {})
+            for term in sku_terms.values():
+                for dim in term.get("priceDimensions", {}).values():
+                    price = _safe_float(dim.get("pricePerUnit", {}).get("USD", "0"))
+                    dim_desc = dim.get("description", "")
+                    if not price:
+                        continue
+                    if "write" in group.lower() or "write" in dim_desc.lower():
+                        prices.append(
+                            ManagedServicePrice(
+                                service="dynamodb",
+                                tier_name="write_request_unit",
+                                price_per_hour=0.0,
+                                price_per_month=round(price * 1_000_000, 4),
+                                description=dim_desc,
+                            )
+                        )
+                    elif "read" in group.lower() or "read" in dim_desc.lower():
+                        prices.append(
+                            ManagedServicePrice(
+                                service="dynamodb",
+                                tier_name="read_request_unit",
+                                price_per_hour=0.0,
+                                price_per_month=round(price * 1_000_000, 4),
+                                description=dim_desc,
+                            )
+                        )
+        return prices
+    # HTTP
+    def _get(self, url: str) -> bytes:
+        req = urllib.request.Request(url, headers={"Accept": "*/*"})
+        return urlopen_safe(req, timeout=self._timeout)