zae-limiter 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,130 @@
+ """
+ zae-limiter: Rate limiting library backed by DynamoDB.
+
+ This library provides a token bucket rate limiter with:
+ - Multiple limits per entity/resource
+ - Two-level hierarchy (parent/child entities)
+ - Cascade mode (consume from entity + parent)
+ - Stored limit configs
+ - Usage analytics via Lambda aggregator
+
+ Example:
+     from zae_limiter import RateLimiter, Limit, FailureMode
+
+     limiter = RateLimiter(
+         table_name="rate_limits",
+         region="us-east-1",
+         create_table=True,
+     )
+
+     async with limiter.acquire(
+         entity_id="key-abc",
+         resource="gpt-4",
+         limits=[
+             Limit.per_minute("rpm", 100),
+             Limit.per_minute("tpm", 10_000),
+         ],
+         consume={"rpm": 1, "tpm": 500},
+     ) as lease:
+         response = await llm_call()
+         await lease.adjust(tpm=response.usage.total_tokens - 500)
+ """
+
+ from .exceptions import (
+     EntityExistsError,
+     EntityNotFoundError,
+     IncompatibleSchemaError,
+     InfrastructureNotFoundError,
+     RateLimitError,
+     RateLimiterUnavailable,
+     RateLimitExceeded,
+     StackAlreadyExistsError,
+     StackCreationError,
+     VersionError,
+     VersionMismatchError,
+ )
+ from .lease import Lease, SyncLease
+ from .models import (
+     BucketState,
+     Entity,
+     EntityCapacity,
+     Limit,
+     LimitName,
+     LimitStatus,
+     ResourceCapacity,
+     UsageSnapshot,
+ )
+
+ # RateLimiter, SyncRateLimiter, FailureMode, and StackManager are imported
+ # lazily via __getattr__ to avoid loading aioboto3 for Lambda functions
+ # that only need boto3
+
+ try:
+     from ._version import __version__  # type: ignore[import-untyped]
+ except ImportError:
+     __version__ = "0.0.0+unknown"
+
+ __all__ = [
+     # Version
+     "__version__",
+     # Main classes
+     "RateLimiter",
+     "SyncRateLimiter",
+     "Lease",
+     "SyncLease",
+     "StackManager",
+     # Models
+     "Limit",
+     "LimitName",
+     "Entity",
+     "LimitStatus",
+     "BucketState",
+     "UsageSnapshot",
+     "ResourceCapacity",
+     "EntityCapacity",
+     # Enums
+     "FailureMode",
+     # Exceptions
+     "RateLimitError",
+     "RateLimitExceeded",
+     "RateLimiterUnavailable",
+     "EntityNotFoundError",
+     "EntityExistsError",
+     "StackCreationError",
+     "StackAlreadyExistsError",
+     "VersionError",
+     "VersionMismatchError",
+     "IncompatibleSchemaError",
+     "InfrastructureNotFoundError",
+ ]
+
+
+ def __getattr__(name: str) -> type:
+     """
+     Lazy import for modules with heavy dependencies.
+
+     This allows the package to be imported without loading aioboto3,
+     which is critical for Lambda functions that only need boto3.
+
+     The aggregator Lambda function imports the handler, which would otherwise
+     trigger loading of the entire package. By making RateLimiter and
+     StackManager lazy imports, we avoid loading aioboto3 (not available in
+     the Lambda runtime) while maintaining backward compatibility for regular usage.
+     """
+     if name == "RateLimiter":
+         from .limiter import RateLimiter
+
+         return RateLimiter
+     if name == "SyncRateLimiter":
+         from .limiter import SyncRateLimiter
+
+         return SyncRateLimiter
+     if name == "FailureMode":
+         from .limiter import FailureMode
+
+         return FailureMode
+     if name == "StackManager":
+         from .infra.stack_manager import StackManager
+
+         return StackManager
+     raise AttributeError(f"module {__name__!r} has no attribute {name!r}")
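
A note on the hunk above (the package __init__): the module-level __getattr__ is a PEP 562 lazy-import hook. The sketch below shows the intended effect; it assumes the package is installed and that zae_limiter.limiter is the module that imports aioboto3 at import time, which the comments imply but the diff itself does not show.

    import sys

    import zae_limiter

    # The eager imports (.exceptions, .lease, .models) do not pull in the async stack.
    print("aioboto3" in sys.modules)  # expected: False

    # Attribute access falls through to __getattr__, which imports .limiter on demand.
    RateLimiter = zae_limiter.RateLimiter
    print("aioboto3" in sys.modules)  # expected: True, once .limiter has been loaded
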
@@ -0,0 +1,11 @@
+ """Lambda aggregator for usage snapshots."""
+
+ from .handler import handler
+ from .processor import ConsumptionDelta, ProcessResult, process_stream_records
+
+ __all__ = [
+     "handler",
+     "process_stream_records",
+     "ProcessResult",
+     "ConsumptionDelta",
+ ]
@@ -0,0 +1,54 @@
+ """Lambda handler for DynamoDB Stream events."""
+
+ import os
+ from typing import Any
+
+ from .processor import process_stream_records
+
+ # Configuration from environment
+ TABLE_NAME = os.environ.get("TABLE_NAME", "rate_limits")
+ SNAPSHOT_WINDOWS = os.environ.get("SNAPSHOT_WINDOWS", "hourly,daily").split(",")
+ SNAPSHOT_TTL_DAYS = int(os.environ.get("SNAPSHOT_TTL_DAYS", "90"))
+
+
+ def handler(event: dict[str, Any], context: Any) -> dict[str, Any]:
+     """
+     Lambda handler for DynamoDB Stream events.
+
+     Processes bucket changes and updates usage snapshots.
+
+     Environment variables:
+         TABLE_NAME: DynamoDB table name (default: rate_limits)
+         SNAPSHOT_WINDOWS: Comma-separated windows (default: hourly,daily)
+         SNAPSHOT_TTL_DAYS: TTL for snapshots in days (default: 90)
+
+     Args:
+         event: DynamoDB Stream event
+         context: Lambda context
+
+     Returns:
+         Processing result summary
+     """
+     records = event.get("Records", [])
+
+     if not records:
+         return {
+             "statusCode": 200,
+             "body": {"processed": 0, "snapshots_updated": 0, "errors": []},
+         }
+
+     result = process_stream_records(
+         records=records,
+         table_name=TABLE_NAME,
+         windows=SNAPSHOT_WINDOWS,
+         ttl_days=SNAPSHOT_TTL_DAYS,
+     )
+
+     return {
+         "statusCode": 200,
+         "body": {
+             "processed": result.processed_count,
+             "snapshots_updated": result.snapshots_updated,
+             "errors": result.errors,
+         },
+     }
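
The handler above short-circuits when the event carries no records, which makes it easy to smoke-test locally without AWS credentials. A minimal sketch, assuming the package (plus boto3, which the processor module imports) is installed and the aggregator subpackage is importable as zae_limiter.aggregator:

    from zae_limiter.aggregator import handler

    # An empty DynamoDB Streams event: the handler returns immediately and
    # never creates a boto3 resource or touches the table.
    result = handler({"Records": []}, context=None)
    print(result)
    # {'statusCode': 200, 'body': {'processed': 0, 'snapshots_updated': 0, 'errors': []}}
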
@@ -0,0 +1,270 @@
+ """DynamoDB Stream processor for usage aggregation."""
+
+ import logging
+ from dataclasses import dataclass
+ from datetime import UTC, datetime, timedelta
+ from typing import Any
+
+ import boto3  # type: ignore[import-untyped]
+
+ from ..schema import SK_BUCKET, gsi2_pk_resource, gsi2_sk_usage, pk_entity, sk_usage
+
+ logger = logging.getLogger(__name__)
+
+
+ @dataclass
+ class ProcessResult:
+     """Result of processing stream records."""
+
+     processed_count: int
+     snapshots_updated: int
+     errors: list[str]
+
+
+ @dataclass
+ class ConsumptionDelta:
+     """Consumption delta extracted from stream record."""
+
+     entity_id: str
+     resource: str
+     limit_name: str
+     tokens_delta: int  # positive = consumed, negative = refilled/returned
+     timestamp_ms: int
+
+
+ def process_stream_records(
+     records: list[dict[str, Any]],
+     table_name: str,
+     windows: list[str],
+     ttl_days: int = 90,
+ ) -> ProcessResult:
+     """
+     Process DynamoDB stream records and update usage snapshots.
+
+     1. Filter for BUCKET records (MODIFY events)
+     2. Extract consumption deltas from old/new images
+     3. Aggregate into hourly/daily snapshot records
+     4. Write updates using atomic ADD operations
+
+     Args:
+         records: DynamoDB stream records
+         table_name: Target table name
+         windows: List of window types ("hourly", "daily")
+         ttl_days: TTL for snapshot records
+
+     Returns:
+         ProcessResult with counts and errors
+     """
+     dynamodb = boto3.resource("dynamodb")
+     table = dynamodb.Table(table_name)
+
+     deltas: list[ConsumptionDelta] = []
+     errors: list[str] = []
+
+     # Extract deltas from records
+     for record in records:
+         if record.get("eventName") != "MODIFY":
+             continue
+
+         try:
+             delta = extract_delta(record)
+             if delta:
+                 deltas.append(delta)
+         except Exception as e:
+             error_msg = f"Error processing record: {e}"
+             logger.warning(error_msg)
+             errors.append(error_msg)
+
+     if not deltas:
+         return ProcessResult(len(records), 0, errors)
+
+     # Update snapshots
+     snapshots_updated = 0
+     for delta in deltas:
+         for window in windows:
+             try:
+                 update_snapshot(table, delta, window, ttl_days)
+                 snapshots_updated += 1
+             except Exception as e:
+                 error_msg = f"Error updating snapshot: {e}"
+                 logger.warning(error_msg)
+                 errors.append(error_msg)
+
+     return ProcessResult(len(records), snapshots_updated, errors)
+
+
+ def extract_delta(record: dict[str, Any]) -> ConsumptionDelta | None:
+     """
+     Extract consumption delta from a stream record.
+
+     Only processes BUCKET records whose token count changed (consumption
+     or refund); records with no net token change are skipped.
+
+     Args:
+         record: DynamoDB stream record
+
+     Returns:
+         ConsumptionDelta if the token count changed, None otherwise
+     """
+     dynamodb_data = record.get("dynamodb", {})
+     new_image = dynamodb_data.get("NewImage", {})
+     old_image = dynamodb_data.get("OldImage", {})
+
+     # Only process bucket records
+     sk = new_image.get("SK", {}).get("S", "")
+     if not sk.startswith(SK_BUCKET):
+         return None
+
+     # Parse key: #BUCKET#{resource}#{limit_name}
+     parts = sk[len(SK_BUCKET) :].split("#", 1)
+     if len(parts) != 2:
+         return None
+
+     resource, limit_name = parts
+     entity_id = new_image.get("entity_id", {}).get("S", "")
+
+     if not entity_id:
+         return None
+
+     # Extract token values from data map
+     new_data = new_image.get("data", {}).get("M", {})
+     old_data = old_image.get("data", {}).get("M", {})
+
+     new_tokens = int(new_data.get("tokens_milli", {}).get("N", "0"))
+     old_tokens = int(old_data.get("tokens_milli", {}).get("N", "0"))
+     new_refill_ms = int(new_data.get("last_refill_ms", {}).get("N", "0"))
+
+     # Calculate delta: old - new = amount consumed
+     # (tokens decrease when consumed)
+     tokens_delta = old_tokens - new_tokens
+
+     # We track all changes (consumption and refunds) but skip updates
+     # with no net token change (e.g. refill bookkeeping only)
+     if tokens_delta == 0:
+         return None
+
+     return ConsumptionDelta(
+         entity_id=entity_id,
+         resource=resource,
+         limit_name=limit_name,
+         tokens_delta=tokens_delta,  # positive = consumed, negative = returned
+         timestamp_ms=new_refill_ms,
+     )
+
+
+ def get_window_key(timestamp_ms: int, window: str) -> str:
+     """
+     Get the window key (ISO timestamp) for a given timestamp.
+
+     Args:
+         timestamp_ms: Epoch milliseconds
+         window: Window type ("hourly", "daily", "monthly")
+
+     Returns:
+         ISO timestamp string for the window start
+     """
+     dt = datetime.fromtimestamp(timestamp_ms / 1000, tz=UTC)
+
+     if window == "hourly":
+         return dt.strftime("%Y-%m-%dT%H:00:00Z")
+     elif window == "daily":
+         return dt.strftime("%Y-%m-%dT00:00:00Z")
+     elif window == "monthly":
+         return dt.strftime("%Y-%m-01T00:00:00Z")
+     else:
+         raise ValueError(f"Unknown window type: {window}")
+
+
+ def get_window_end(window_key: str, window: str) -> str:
+     """
+     Get the window end timestamp.
+
+     Args:
+         window_key: Window start (ISO timestamp)
+         window: Window type
+
+     Returns:
+         ISO timestamp string for the window end
+     """
+     dt = datetime.fromisoformat(window_key.replace("Z", "+00:00"))
+
+     if window == "hourly":
+         end_dt = dt.replace(minute=59, second=59)
+     elif window == "daily":
+         end_dt = dt.replace(hour=23, minute=59, second=59)
+     elif window == "monthly":
+         # Last day of month
+         if dt.month == 12:
+             end_dt = dt.replace(year=dt.year + 1, month=1, day=1) - timedelta(seconds=1)
+         else:
+             end_dt = dt.replace(month=dt.month + 1, day=1) - timedelta(seconds=1)
+     else:
+         end_dt = dt
+
+     return end_dt.strftime("%Y-%m-%dT%H:%M:%SZ")
+
+
+ def calculate_snapshot_ttl(ttl_days: int) -> int:
+     """Calculate TTL epoch seconds."""
+     return int(datetime.now(UTC).timestamp()) + (ttl_days * 86400)
+
+
+ def update_snapshot(
+     table: Any,
+     delta: ConsumptionDelta,
+     window: str,
+     ttl_days: int,
+ ) -> None:
+     """
+     Update a usage snapshot record atomically.
+
+     Uses DynamoDB ADD operation to increment counters, creating
+     the record if it doesn't exist.
+
+     Args:
+         table: boto3 Table resource
+         delta: Consumption delta to record
+         window: Window type
+         ttl_days: TTL in days
+     """
+     window_key = get_window_key(delta.timestamp_ms, window)
+
+     # Convert millitokens to tokens for storage
+     tokens_delta = delta.tokens_delta // 1000
+
+     # Build update expression
+     # We use ADD for atomic increments and SET for metadata
+     table.update_item(
+         Key={
+             "PK": pk_entity(delta.entity_id),
+             "SK": sk_usage(delta.resource, window_key),
+         },
+         UpdateExpression="""
+             SET entity_id = :entity_id,
+                 #data.#resource = :resource,
+                 #data.#window = :window,
+                 #data.window_start = :window_start,
+                 GSI2PK = :gsi2pk,
+                 GSI2SK = :gsi2sk,
+                 #ttl = :ttl
+             ADD #data.#limit_name :delta,
+                 #data.total_events :one
+         """,
+         ExpressionAttributeNames={
+             "#data": "data",
+             "#resource": "resource",
+             "#window": "window",
+             "#limit_name": delta.limit_name,
+             "#ttl": "ttl",
+         },
+         ExpressionAttributeValues={
+             ":entity_id": delta.entity_id,
+             ":resource": delta.resource,
+             ":window": window,
+             ":window_start": window_key,
+             ":gsi2pk": gsi2_pk_resource(delta.resource),
+             ":gsi2sk": gsi2_sk_usage(window_key, delta.entity_id),
+             ":ttl": calculate_snapshot_ttl(ttl_days),
+             ":delta": tokens_delta,
+             ":one": 1,
+         },
+     )
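
To make the record-to-snapshot flow concrete, the sketch below drives extract_delta and get_window_key with a hand-built MODIFY record in DynamoDB Streams wire format. It assumes the module is importable as zae_limiter.aggregator.processor and that SK_BUCKET is the "#BUCKET#" prefix mentioned in the parsing comment; both are inferred from the diff rather than confirmed.

    from zae_limiter.aggregator.processor import extract_delta, get_window_key

    # Bucket for entity "key-abc" / resource "gpt-4" / limit "tpm" drops from
    # 10_000_000 to 9_500_000 millitokens, i.e. 500 tokens consumed.
    record = {
        "eventName": "MODIFY",
        "dynamodb": {
            "OldImage": {
                "SK": {"S": "#BUCKET#gpt-4#tpm"},
                "entity_id": {"S": "key-abc"},
                "data": {"M": {
                    "tokens_milli": {"N": "10000000"},
                    "last_refill_ms": {"N": "1700000000000"},
                }},
            },
            "NewImage": {
                "SK": {"S": "#BUCKET#gpt-4#tpm"},
                "entity_id": {"S": "key-abc"},
                "data": {"M": {
                    "tokens_milli": {"N": "9500000"},
                    "last_refill_ms": {"N": "1700000000000"},
                }},
            },
        },
    }

    delta = extract_delta(record)
    print(delta.tokens_delta)  # 500000 millitokens; update_snapshot stores 500 tokens
    print(get_window_key(delta.timestamp_ms, "hourly"))  # "2023-11-14T22:00:00Z"

update_snapshot would then write this delta once per configured window with a single ADD, so concurrent Lambda invocations increment the same counters without clobbering each other.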