ccproxy_api-0.1.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (148)
  1. ccproxy/__init__.py +4 -0
  2. ccproxy/__main__.py +7 -0
  3. ccproxy/_version.py +21 -0
  4. ccproxy/adapters/__init__.py +11 -0
  5. ccproxy/adapters/base.py +80 -0
  6. ccproxy/adapters/openai/__init__.py +43 -0
  7. ccproxy/adapters/openai/adapter.py +915 -0
  8. ccproxy/adapters/openai/models.py +412 -0
  9. ccproxy/adapters/openai/streaming.py +449 -0
  10. ccproxy/api/__init__.py +28 -0
  11. ccproxy/api/app.py +225 -0
  12. ccproxy/api/dependencies.py +140 -0
  13. ccproxy/api/middleware/__init__.py +11 -0
  14. ccproxy/api/middleware/auth.py +0 -0
  15. ccproxy/api/middleware/cors.py +55 -0
  16. ccproxy/api/middleware/errors.py +703 -0
  17. ccproxy/api/middleware/headers.py +51 -0
  18. ccproxy/api/middleware/logging.py +175 -0
  19. ccproxy/api/middleware/request_id.py +69 -0
  20. ccproxy/api/middleware/server_header.py +62 -0
  21. ccproxy/api/responses.py +84 -0
  22. ccproxy/api/routes/__init__.py +16 -0
  23. ccproxy/api/routes/claude.py +181 -0
  24. ccproxy/api/routes/health.py +489 -0
  25. ccproxy/api/routes/metrics.py +1033 -0
  26. ccproxy/api/routes/proxy.py +238 -0
  27. ccproxy/auth/__init__.py +75 -0
  28. ccproxy/auth/bearer.py +68 -0
  29. ccproxy/auth/credentials_adapter.py +93 -0
  30. ccproxy/auth/dependencies.py +229 -0
  31. ccproxy/auth/exceptions.py +79 -0
  32. ccproxy/auth/manager.py +102 -0
  33. ccproxy/auth/models.py +118 -0
  34. ccproxy/auth/oauth/__init__.py +26 -0
  35. ccproxy/auth/oauth/models.py +49 -0
  36. ccproxy/auth/oauth/routes.py +396 -0
  37. ccproxy/auth/oauth/storage.py +0 -0
  38. ccproxy/auth/storage/__init__.py +12 -0
  39. ccproxy/auth/storage/base.py +57 -0
  40. ccproxy/auth/storage/json_file.py +159 -0
  41. ccproxy/auth/storage/keyring.py +192 -0
  42. ccproxy/claude_sdk/__init__.py +20 -0
  43. ccproxy/claude_sdk/client.py +169 -0
  44. ccproxy/claude_sdk/converter.py +331 -0
  45. ccproxy/claude_sdk/options.py +120 -0
  46. ccproxy/cli/__init__.py +14 -0
  47. ccproxy/cli/commands/__init__.py +8 -0
  48. ccproxy/cli/commands/auth.py +553 -0
  49. ccproxy/cli/commands/config/__init__.py +14 -0
  50. ccproxy/cli/commands/config/commands.py +766 -0
  51. ccproxy/cli/commands/config/schema_commands.py +119 -0
  52. ccproxy/cli/commands/serve.py +630 -0
  53. ccproxy/cli/docker/__init__.py +34 -0
  54. ccproxy/cli/docker/adapter_factory.py +157 -0
  55. ccproxy/cli/docker/params.py +278 -0
  56. ccproxy/cli/helpers.py +144 -0
  57. ccproxy/cli/main.py +193 -0
  58. ccproxy/cli/options/__init__.py +14 -0
  59. ccproxy/cli/options/claude_options.py +216 -0
  60. ccproxy/cli/options/core_options.py +40 -0
  61. ccproxy/cli/options/security_options.py +48 -0
  62. ccproxy/cli/options/server_options.py +117 -0
  63. ccproxy/config/__init__.py +40 -0
  64. ccproxy/config/auth.py +154 -0
  65. ccproxy/config/claude.py +124 -0
  66. ccproxy/config/cors.py +79 -0
  67. ccproxy/config/discovery.py +87 -0
  68. ccproxy/config/docker_settings.py +265 -0
  69. ccproxy/config/loader.py +108 -0
  70. ccproxy/config/observability.py +158 -0
  71. ccproxy/config/pricing.py +88 -0
  72. ccproxy/config/reverse_proxy.py +31 -0
  73. ccproxy/config/scheduler.py +89 -0
  74. ccproxy/config/security.py +14 -0
  75. ccproxy/config/server.py +81 -0
  76. ccproxy/config/settings.py +534 -0
  77. ccproxy/config/validators.py +231 -0
  78. ccproxy/core/__init__.py +274 -0
  79. ccproxy/core/async_utils.py +675 -0
  80. ccproxy/core/constants.py +97 -0
  81. ccproxy/core/errors.py +256 -0
  82. ccproxy/core/http.py +328 -0
  83. ccproxy/core/http_transformers.py +428 -0
  84. ccproxy/core/interfaces.py +247 -0
  85. ccproxy/core/logging.py +189 -0
  86. ccproxy/core/middleware.py +114 -0
  87. ccproxy/core/proxy.py +143 -0
  88. ccproxy/core/system.py +38 -0
  89. ccproxy/core/transformers.py +259 -0
  90. ccproxy/core/types.py +129 -0
  91. ccproxy/core/validators.py +288 -0
  92. ccproxy/docker/__init__.py +67 -0
  93. ccproxy/docker/adapter.py +588 -0
  94. ccproxy/docker/docker_path.py +207 -0
  95. ccproxy/docker/middleware.py +103 -0
  96. ccproxy/docker/models.py +228 -0
  97. ccproxy/docker/protocol.py +192 -0
  98. ccproxy/docker/stream_process.py +264 -0
  99. ccproxy/docker/validators.py +173 -0
  100. ccproxy/models/__init__.py +123 -0
  101. ccproxy/models/errors.py +42 -0
  102. ccproxy/models/messages.py +243 -0
  103. ccproxy/models/requests.py +85 -0
  104. ccproxy/models/responses.py +227 -0
  105. ccproxy/models/types.py +102 -0
  106. ccproxy/observability/__init__.py +51 -0
  107. ccproxy/observability/access_logger.py +400 -0
  108. ccproxy/observability/context.py +447 -0
  109. ccproxy/observability/metrics.py +539 -0
  110. ccproxy/observability/pushgateway.py +366 -0
  111. ccproxy/observability/sse_events.py +303 -0
  112. ccproxy/observability/stats_printer.py +755 -0
  113. ccproxy/observability/storage/__init__.py +1 -0
  114. ccproxy/observability/storage/duckdb_simple.py +665 -0
  115. ccproxy/observability/storage/models.py +55 -0
  116. ccproxy/pricing/__init__.py +19 -0
  117. ccproxy/pricing/cache.py +212 -0
  118. ccproxy/pricing/loader.py +267 -0
  119. ccproxy/pricing/models.py +106 -0
  120. ccproxy/pricing/updater.py +309 -0
  121. ccproxy/scheduler/__init__.py +39 -0
  122. ccproxy/scheduler/core.py +335 -0
  123. ccproxy/scheduler/exceptions.py +34 -0
  124. ccproxy/scheduler/manager.py +186 -0
  125. ccproxy/scheduler/registry.py +150 -0
  126. ccproxy/scheduler/tasks.py +484 -0
  127. ccproxy/services/__init__.py +10 -0
  128. ccproxy/services/claude_sdk_service.py +614 -0
  129. ccproxy/services/credentials/__init__.py +55 -0
  130. ccproxy/services/credentials/config.py +105 -0
  131. ccproxy/services/credentials/manager.py +562 -0
  132. ccproxy/services/credentials/oauth_client.py +482 -0
  133. ccproxy/services/proxy_service.py +1536 -0
  134. ccproxy/static/.keep +0 -0
  135. ccproxy/testing/__init__.py +34 -0
  136. ccproxy/testing/config.py +148 -0
  137. ccproxy/testing/content_generation.py +197 -0
  138. ccproxy/testing/mock_responses.py +262 -0
  139. ccproxy/testing/response_handlers.py +161 -0
  140. ccproxy/testing/scenarios.py +241 -0
  141. ccproxy/utils/__init__.py +6 -0
  142. ccproxy/utils/cost_calculator.py +210 -0
  143. ccproxy/utils/streaming_metrics.py +199 -0
  144. ccproxy_api-0.1.0.dist-info/METADATA +253 -0
  145. ccproxy_api-0.1.0.dist-info/RECORD +148 -0
  146. ccproxy_api-0.1.0.dist-info/WHEEL +4 -0
  147. ccproxy_api-0.1.0.dist-info/entry_points.txt +2 -0
  148. ccproxy_api-0.1.0.dist-info/licenses/LICENSE +21 -0
ccproxy/api/routes/metrics.py
@@ -0,0 +1,1033 @@
+ """Metrics endpoints for CCProxy API Server."""
+
+ import time
+ from datetime import datetime as dt
+ from typing import Any, cast
+
+ from fastapi import APIRouter, HTTPException, Query, Request, Response
+ from fastapi.responses import FileResponse, HTMLResponse, StreamingResponse
+ from sqlmodel import Session, col, desc, func, select
+ from typing_extensions import TypedDict
+
+ from ccproxy.api.dependencies import (
+     DuckDBStorageDep,
+     ObservabilityMetricsDep,
+     SettingsDep,
+ )
+ from ccproxy.observability.storage.models import AccessLog
+
+
+ class AnalyticsSummary(TypedDict):
+     """TypedDict for analytics summary data."""
+
+     total_requests: int
+     total_successful_requests: int
+     total_error_requests: int
+     avg_duration_ms: float
+     total_cost_usd: float
+     total_tokens_input: int
+     total_tokens_output: int
+     total_cache_read_tokens: int
+     total_cache_write_tokens: int
+     total_tokens_all: int
+
+
+ class TokenAnalytics(TypedDict):
+     """TypedDict for token analytics data."""
+
+     input_tokens: int
+     output_tokens: int
+     cache_read_tokens: int
+     cache_write_tokens: int
+     total_tokens: int
+
+
+ class RequestAnalytics(TypedDict):
+     """TypedDict for request analytics data."""
+
+     total_requests: int
+     successful_requests: int
+     error_requests: int
+     success_rate: float
+     error_rate: float
+
+
+ class ServiceBreakdown(TypedDict):
+     """TypedDict for service type breakdown data."""
+
+     request_count: int
+     successful_requests: int
+     error_requests: int
+     success_rate: float
+     error_rate: float
+     avg_duration_ms: float
+     total_cost_usd: float
+     total_tokens_input: int
+     total_tokens_output: int
+     total_cache_read_tokens: int
+     total_cache_write_tokens: int
+     total_tokens_all: int
+
+
+ class AnalyticsResult(TypedDict):
+     """TypedDict for complete analytics result."""
+
+     summary: AnalyticsSummary
+     token_analytics: TokenAnalytics
+     request_analytics: RequestAnalytics
+     service_type_breakdown: dict[str, ServiceBreakdown]
+     query_time: float
+     backend: str
+     query_params: dict[str, Any]
+
+
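
For orientation while reading the diff: these TypedDicts describe the JSON shape returned by GET /logs/analytics further down. A minimal sketch of one of them, with made-up values rather than real package output:

from ccproxy.api.routes.metrics import TokenAnalytics

token_analytics: TokenAnalytics = {
    "input_tokens": 1200,
    "output_tokens": 800,
    "cache_read_tokens": 300,
    "cache_write_tokens": 100,
    "total_tokens": 2400,  # input + output + cache read + cache write
}
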
+ # Create separate routers for different concerns
+ prometheus_router = APIRouter(tags=["metrics"])
+ logs_router = APIRouter(prefix="/logs", tags=["logs"])
+ dashboard_router = APIRouter(tags=["dashboard"])
+
+ # Backward compatibility - keep the old router name pointing to logs for now
+ router = logs_router
+
+
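
These routers are wired into the application elsewhere (presumably ccproxy/api/app.py, listed above); the hunk itself never mounts them. A minimal sketch of how they could be included, with mount paths inferred from the prefixes above rather than taken from app.py:

from fastapi import FastAPI

from ccproxy.api.routes.metrics import (
    dashboard_router,
    logs_router,
    prometheus_router,
)

app = FastAPI()
app.include_router(prometheus_router)  # GET /metrics
app.include_router(logs_router)        # /logs/status, /logs/query, /logs/analytics, ...
app.include_router(dashboard_router)   # GET /dashboard
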
+ @logs_router.get("/status")
+ async def logs_status(metrics: ObservabilityMetricsDep) -> dict[str, str]:
+     """Get observability system status."""
+     return {
+         "status": "healthy",
+         "prometheus_enabled": str(metrics.is_enabled()),
+         "observability_system": "hybrid_prometheus_structlog",
+     }
+
+
+ @dashboard_router.get("/dashboard")
+ async def get_metrics_dashboard() -> HTMLResponse:
+     """Serve the metrics dashboard SPA entry point."""
+     from pathlib import Path
+
+     # Get the path to the dashboard folder
+     current_file = Path(__file__)
+     project_root = (
+         current_file.parent.parent.parent.parent
+     )  # ccproxy/api/routes/metrics.py -> project root
+     dashboard_folder = project_root / "ccproxy" / "static" / "dashboard"
+     dashboard_index = dashboard_folder / "index.html"
+
+     # Check if dashboard folder and index.html exist
+     if not dashboard_folder.exists():
+         raise HTTPException(
+             status_code=404,
+             detail="Dashboard not found. Please build the dashboard first using 'cd dashboard && bun run build:prod'",
+         )
+
+     if not dashboard_index.exists():
+         raise HTTPException(
+             status_code=404,
+             detail="Dashboard index.html not found. Please rebuild the dashboard using 'cd dashboard && bun run build:prod'",
+         )
+
+     # Read the HTML content
+     try:
+         with dashboard_index.open(encoding="utf-8") as f:
+             html_content = f.read()
+
+         return HTMLResponse(
+             content=html_content,
+             status_code=200,
+             headers={
+                 "Cache-Control": "no-cache, no-store, must-revalidate",
+                 "Pragma": "no-cache",
+                 "Expires": "0",
+                 "Content-Type": "text/html; charset=utf-8",
+             },
+         )
+     except Exception as e:
+         raise HTTPException(
+             status_code=500, detail=f"Failed to serve dashboard: {str(e)}"
+         ) from e
+
+
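
The four .parent hops above climb routes/ -> api/ -> ccproxy/ -> the directory containing the package, which holds for an installed wheel but breaks silently if the module moves. A packaging-safe alternative sketch (an assumption about how it could be done, not what this release does) resolves the asset via importlib.resources:

from importlib.resources import files

# Locate the bundled dashboard relative to the ccproxy package itself
dashboard_index = files("ccproxy") / "static" / "dashboard" / "index.html"
if dashboard_index.is_file():
    html_content = dashboard_index.read_text(encoding="utf-8")
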
+ @dashboard_router.get("/dashboard/favicon.svg")
+ async def get_dashboard_favicon() -> FileResponse:
+     """Serve the dashboard favicon."""
+     from pathlib import Path
+
+     # Get the path to the favicon
+     current_file = Path(__file__)
+     project_root = (
+         current_file.parent.parent.parent.parent
+     )  # ccproxy/api/routes/metrics.py -> project root
+     favicon_path = project_root / "ccproxy" / "static" / "dashboard" / "favicon.svg"
+
+     if not favicon_path.exists():
+         raise HTTPException(status_code=404, detail="Favicon not found")
+
+     return FileResponse(
+         path=str(favicon_path),
+         media_type="image/svg+xml",
+         headers={"Cache-Control": "public, max-age=3600"},
+     )
+
+
+ @prometheus_router.get("/metrics")
+ async def get_prometheus_metrics(metrics: ObservabilityMetricsDep) -> Response:
+     """Export metrics in Prometheus format using native prometheus_client.
+
+     This endpoint exposes operational metrics collected by the hybrid observability
+     system for Prometheus scraping.
+
+     Args:
+         metrics: Observability metrics dependency
+
+     Returns:
+         Prometheus-formatted metrics text
+     """
+     try:
+         # Check if prometheus_client is available
+         try:
+             from prometheus_client import CONTENT_TYPE_LATEST, generate_latest
+         except ImportError as err:
+             raise HTTPException(
+                 status_code=503,
+                 detail="Prometheus client not available. Install with: pip install prometheus-client",
+             ) from err
+
+         if not metrics.is_enabled():
+             raise HTTPException(
+                 status_code=503,
+                 detail="Prometheus metrics not enabled. Ensure prometheus-client is installed.",
+             )
+
+         # Generate prometheus format using the registry
+         from prometheus_client import REGISTRY
+
+         # Use the global registry if metrics.registry is None (default behavior)
+         registry = metrics.registry if metrics.registry is not None else REGISTRY
+         prometheus_data = generate_latest(registry)
+
+         # Return the metrics data with proper content type
+         return Response(
+             content=prometheus_data,
+             media_type=CONTENT_TYPE_LATEST,
+             headers={
+                 "Cache-Control": "no-cache, no-store, must-revalidate",
+                 "Pragma": "no-cache",
+                 "Expires": "0",
+             },
+         )
+
+     except HTTPException:
+         raise
+     except Exception as e:
+         raise HTTPException(
+             status_code=500, detail=f"Failed to generate Prometheus metrics: {str(e)}"
+         ) from e
+
+
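
A quick way to sanity-check what this endpoint emits is to parse it with the prometheus_client text parser; the base URL below is an assumption for a local run:

import httpx
from prometheus_client.parser import text_string_to_metric_families

resp = httpx.get("http://localhost:8000/metrics")  # host/port are assumptions
resp.raise_for_status()
for family in text_string_to_metric_families(resp.text):
    print(family.name, len(family.samples))
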
+ @logs_router.get("/query")
+ async def query_logs(
+     storage: DuckDBStorageDep,
+     settings: SettingsDep,
+     limit: int = Query(1000, ge=1, le=10000, description="Maximum number of results"),
+     start_time: float | None = Query(None, description="Start timestamp filter"),
+     end_time: float | None = Query(None, description="End timestamp filter"),
+     model: str | None = Query(None, description="Model filter"),
+     service_type: str | None = Query(None, description="Service type filter"),
+ ) -> dict[str, Any]:
+     """
+     Query access logs with filters.
+
+     Returns access log entries with optional filtering by time range, model, and service type.
+     """
+     try:
+         if not settings.observability.logs_collection_enabled:
+             raise HTTPException(
+                 status_code=503,
+                 detail="Logs collection is disabled. Enable with logs_collection_enabled=true",
+             )
+         if not storage:
+             raise HTTPException(
+                 status_code=503,
+                 detail="Storage backend not available. Ensure DuckDB is installed and pipeline is running.",
+             )
+
+         # Use SQLModel for querying
+         if hasattr(storage, "_engine") and storage._engine:
+             try:
+                 with Session(storage._engine) as session:
+                     # Build base query
+                     statement = select(AccessLog)
+
+                     # Add filters - convert Unix timestamps to datetime
+                     start_dt = dt.fromtimestamp(start_time) if start_time else None
+                     end_dt = dt.fromtimestamp(end_time) if end_time else None
+
+                     if start_dt:
+                         statement = statement.where(AccessLog.timestamp >= start_dt)
+                     if end_dt:
+                         statement = statement.where(AccessLog.timestamp <= end_dt)
+                     if model:
+                         statement = statement.where(AccessLog.model == model)
+                     if service_type:
+                         statement = statement.where(
+                             AccessLog.service_type == service_type
+                         )
+
+                     # Apply limit and order
+                     statement = statement.order_by(desc(AccessLog.timestamp)).limit(
+                         limit
+                     )
+
+                     # Execute query
+                     results = session.exec(statement).all()
+
+                     # Convert to dict format (model_dump is the Pydantic v2 API)
+                     entries = [log.model_dump() for log in results]
+
+                     return {
+                         "results": entries,
+                         "count": len(entries),
+                         "limit": limit,
+                         "filters": {
+                             "start_time": start_time,
+                             "end_time": end_time,
+                             "model": model,
+                             "service_type": service_type,
+                         },
+                         "timestamp": time.time(),
+                     }
+
+             except Exception as e:
+                 import structlog
+
+                 logger = structlog.get_logger(__name__)
+                 logger.error("sqlmodel_query_error", error=str(e))
+                 raise HTTPException(
+                     status_code=500, detail=f"Query execution failed: {str(e)}"
+                 ) from e
+         else:
+             raise HTTPException(
+                 status_code=503,
+                 detail="Storage engine not available",
+             )
+
+     except HTTPException:
+         raise
+     except Exception as e:
+         raise HTTPException(
+             status_code=500, detail=f"Query execution failed: {str(e)}"
+         ) from e
+
+
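
A client-side sketch of the /logs/query endpoint above; the base URL and model name are assumptions, not values shipped with the package:

import time

import httpx

params = {
    "limit": 100,
    "start_time": time.time() - 3600,  # last hour
    "model": "claude-3-5-sonnet-20241022",  # hypothetical model filter
}
resp = httpx.get("http://localhost:8000/logs/query", params=params)
resp.raise_for_status()
payload = resp.json()
print(payload["count"], "entries matched", payload["filters"])
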
+ @logs_router.get("/analytics")
+ async def get_logs_analytics(
+     storage: DuckDBStorageDep,
+     settings: SettingsDep,
+     start_time: float | None = Query(None, description="Start timestamp (Unix time)"),
+     end_time: float | None = Query(None, description="End timestamp (Unix time)"),
+     model: str | None = Query(None, description="Filter by model name"),
+     service_type: str | None = Query(
+         None,
+         description="Filter by service type. Supports comma-separated values (e.g., 'proxy_service,sdk_service') and negation with ! prefix (e.g., '!access_log,!sdk_service')",
+     ),
+     hours: int | None = Query(
+         24, ge=1, le=168, description="Hours of data to analyze (default: 24)"
+     ),
+ ) -> AnalyticsResult:
+     """
+     Get comprehensive analytics for metrics data.
+
+     Returns summary statistics, token and request analytics, and a per-service-type breakdown.
+     """
+     try:
+         if not settings.observability.logs_collection_enabled:
+             raise HTTPException(
+                 status_code=503,
+                 detail="Logs collection is disabled. Enable with logs_collection_enabled=true",
+             )
+         if not storage:
+             raise HTTPException(
+                 status_code=503,
+                 detail="Storage backend not available. Ensure DuckDB is installed and pipeline is running.",
+             )
+
+         # Default time range if not provided
+         if start_time is None and end_time is None and hours:
+             end_time = time.time()
+             start_time = end_time - (hours * 3600)
+
+         # Use SQLModel for analytics
+         if hasattr(storage, "_engine") and storage._engine:
+             try:
+                 with Session(storage._engine) as session:
+                     # Build base query
+                     statement = select(AccessLog)
+
+                     # Add filters - convert Unix timestamps to datetime
+                     start_dt = dt.fromtimestamp(start_time) if start_time else None
+                     end_dt = dt.fromtimestamp(end_time) if end_time else None
+
+                     # Helper function to build filter conditions
+                     def build_filter_conditions() -> list[Any]:
+                         conditions: list[Any] = []
+                         if start_dt:
+                             conditions.append(AccessLog.timestamp >= start_dt)
+                         if end_dt:
+                             conditions.append(AccessLog.timestamp <= end_dt)
+                         if model:
+                             conditions.append(AccessLog.model == model)
+
+                         # Apply service type filtering with comma-separated values and negation
+                         if service_type:
+                             service_filters = [
+                                 s.strip() for s in service_type.split(",")
+                             ]
+                             include_filters = [
+                                 f for f in service_filters if not f.startswith("!")
+                             ]
+                             exclude_filters = [
+                                 f[1:] for f in service_filters if f.startswith("!")
+                             ]
+
+                             if include_filters:
+                                 conditions.append(
+                                     col(AccessLog.service_type).in_(include_filters)
+                                 )
+                             if exclude_filters:
+                                 conditions.append(
+                                     ~col(AccessLog.service_type).in_(exclude_filters)
+                                 )
+
+                         return conditions
+
+                     # Get summary statistics using individual queries to avoid overload issues
+                     # Reuse datetime variables defined above
+
+                     filter_conditions = build_filter_conditions()
+
+                     total_requests = session.exec(
+                         select(func.count())
+                         .select_from(AccessLog)
+                         .where(*filter_conditions)
+                     ).first()
+
+                     avg_duration = session.exec(
+                         select(func.avg(AccessLog.duration_ms))
+                         .select_from(AccessLog)
+                         .where(*filter_conditions)
+                     ).first()
+
+                     total_cost = session.exec(
+                         select(func.sum(AccessLog.cost_usd))
+                         .select_from(AccessLog)
+                         .where(*filter_conditions)
+                     ).first()
+
+                     total_tokens_input = session.exec(
+                         select(func.sum(AccessLog.tokens_input))
+                         .select_from(AccessLog)
+                         .where(*filter_conditions)
+                     ).first()
+
+                     total_tokens_output = session.exec(
+                         select(func.sum(AccessLog.tokens_output))
+                         .select_from(AccessLog)
+                         .where(*filter_conditions)
+                     ).first()
+
+                     # Token analytics - all token types
+                     total_cache_read_tokens = session.exec(
+                         select(func.sum(AccessLog.cache_read_tokens))
+                         .select_from(AccessLog)
+                         .where(*filter_conditions)
+                     ).first()
+
+                     total_cache_write_tokens = session.exec(
+                         select(func.sum(AccessLog.cache_write_tokens))
+                         .select_from(AccessLog)
+                         .where(*filter_conditions)
+                     ).first()
+
+                     # Success and error request analytics
+                     success_conditions = filter_conditions + [
+                         AccessLog.status_code >= 200,
+                         AccessLog.status_code < 400,
+                     ]
+                     total_successful_requests = session.exec(
+                         select(func.count())
+                         .select_from(AccessLog)
+                         .where(*success_conditions)
+                     ).first()
+
+                     error_conditions = filter_conditions + [
+                         AccessLog.status_code >= 400,
+                     ]
+                     total_error_requests = session.exec(
+                         select(func.count())
+                         .select_from(AccessLog)
+                         .where(*error_conditions)
+                     ).first()
+
+                     # Summary results are already computed individually above
+
+                     # Get service type breakdown - simplified approach
+                     service_breakdown = {}
+                     # Get unique service types first
+                     unique_services = session.exec(
+                         select(AccessLog.service_type)
+                         .distinct()
+                         .where(*filter_conditions)
+                     ).all()
+
+                     # For each service type, get its statistics
+                     for service in unique_services:
+                         if service:  # Skip None values
+                             # Build service-specific filter conditions
+                             service_conditions = []
+                             if start_dt:
+                                 service_conditions.append(
+                                     AccessLog.timestamp >= start_dt
+                                 )
+                             if end_dt:
+                                 service_conditions.append(AccessLog.timestamp <= end_dt)
+                             if model:
+                                 service_conditions.append(AccessLog.model == model)
+                             service_conditions.append(AccessLog.service_type == service)
+
+                             service_count = session.exec(
+                                 select(func.count())
+                                 .select_from(AccessLog)
+                                 .where(*service_conditions)
+                             ).first()
+
+                             service_avg_duration = session.exec(
+                                 select(func.avg(AccessLog.duration_ms))
+                                 .select_from(AccessLog)
+                                 .where(*service_conditions)
+                             ).first()
+
+                             service_total_cost = session.exec(
+                                 select(func.sum(AccessLog.cost_usd))
+                                 .select_from(AccessLog)
+                                 .where(*service_conditions)
+                             ).first()
+
+                             service_total_tokens_input = session.exec(
+                                 select(func.sum(AccessLog.tokens_input))
+                                 .select_from(AccessLog)
+                                 .where(*service_conditions)
+                             ).first()
+
+                             service_total_tokens_output = session.exec(
+                                 select(func.sum(AccessLog.tokens_output))
+                                 .select_from(AccessLog)
+                                 .where(*service_conditions)
+                             ).first()
+
+                             service_cache_read_tokens = session.exec(
+                                 select(func.sum(AccessLog.cache_read_tokens))
+                                 .select_from(AccessLog)
+                                 .where(*service_conditions)
+                             ).first()
+
+                             service_cache_write_tokens = session.exec(
+                                 select(func.sum(AccessLog.cache_write_tokens))
+                                 .select_from(AccessLog)
+                                 .where(*service_conditions)
+                             ).first()
+
+                             service_success_conditions = service_conditions + [
+                                 AccessLog.status_code >= 200,
+                                 AccessLog.status_code < 400,
+                             ]
+                             service_success_count = session.exec(
+                                 select(func.count())
+                                 .select_from(AccessLog)
+                                 .where(*service_success_conditions)
+                             ).first()
+
+                             service_error_conditions = service_conditions + [
+                                 AccessLog.status_code >= 400,
+                             ]
+                             service_error_count = session.exec(
+                                 select(func.count())
+                                 .select_from(AccessLog)
+                                 .where(*service_error_conditions)
+                             ).first()
+
+                             service_breakdown[service] = {
+                                 "request_count": service_count or 0,
+                                 "successful_requests": service_success_count or 0,
+                                 "error_requests": service_error_count or 0,
+                                 "success_rate": (service_success_count or 0)
+                                 / (service_count or 1)
+                                 * 100
+                                 if service_count
+                                 else 0,
+                                 "error_rate": (service_error_count or 0)
+                                 / (service_count or 1)
+                                 * 100
+                                 if service_count
+                                 else 0,
+                                 "avg_duration_ms": service_avg_duration or 0,
+                                 "total_cost_usd": service_total_cost or 0,
+                                 "total_tokens_input": service_total_tokens_input or 0,
+                                 "total_tokens_output": service_total_tokens_output or 0,
+                                 "total_cache_read_tokens": service_cache_read_tokens
+                                 or 0,
+                                 "total_cache_write_tokens": service_cache_write_tokens
+                                 or 0,
+                                 "total_tokens_all": (service_total_tokens_input or 0)
+                                 + (service_total_tokens_output or 0)
+                                 + (service_cache_read_tokens or 0)
+                                 + (service_cache_write_tokens or 0),
+                             }
+
+                     analytics = {
+                         "summary": {
+                             "total_requests": total_requests or 0,
+                             "total_successful_requests": total_successful_requests or 0,
+                             "total_error_requests": total_error_requests or 0,
+                             "avg_duration_ms": avg_duration or 0,
+                             "total_cost_usd": total_cost or 0,
+                             "total_tokens_input": total_tokens_input or 0,
+                             "total_tokens_output": total_tokens_output or 0,
+                             "total_cache_read_tokens": total_cache_read_tokens or 0,
+                             "total_cache_write_tokens": total_cache_write_tokens or 0,
+                             "total_tokens_all": (total_tokens_input or 0)
+                             + (total_tokens_output or 0)
+                             + (total_cache_read_tokens or 0)
+                             + (total_cache_write_tokens or 0),
+                         },
+                         "token_analytics": {
+                             "input_tokens": total_tokens_input or 0,
+                             "output_tokens": total_tokens_output or 0,
+                             "cache_read_tokens": total_cache_read_tokens or 0,
+                             "cache_write_tokens": total_cache_write_tokens or 0,
+                             "total_tokens": (total_tokens_input or 0)
+                             + (total_tokens_output or 0)
+                             + (total_cache_read_tokens or 0)
+                             + (total_cache_write_tokens or 0),
+                         },
+                         "request_analytics": {
+                             "total_requests": total_requests or 0,
+                             "successful_requests": total_successful_requests or 0,
+                             "error_requests": total_error_requests or 0,
+                             "success_rate": (total_successful_requests or 0)
+                             / (total_requests or 1)
+                             * 100
+                             if total_requests
+                             else 0,
+                             "error_rate": (total_error_requests or 0)
+                             / (total_requests or 1)
+                             * 100
+                             if total_requests
+                             else 0,
+                         },
+                         "service_type_breakdown": service_breakdown,
+                         "query_time": time.time(),
+                         "backend": "sqlmodel",
+                     }
+
+                     # Add metadata
+                     analytics["query_params"] = {
+                         "start_time": start_time,
+                         "end_time": end_time,
+                         "model": model,
+                         "service_type": service_type,
+                         "hours": hours,
+                     }
+
+                     return cast(AnalyticsResult, analytics)
+
+             except Exception as e:
+                 import structlog
+
+                 logger = structlog.get_logger(__name__)
+                 logger.error("sqlmodel_analytics_error", error=str(e))
+                 raise HTTPException(
+                     status_code=500, detail=f"Analytics query failed: {str(e)}"
+                 ) from e
+         else:
+             raise HTTPException(
+                 status_code=503,
+                 detail="Storage engine not available",
+             )
+
+     except HTTPException:
+         raise
+     except Exception as e:
+         raise HTTPException(
+             status_code=500, detail=f"Analytics generation failed: {str(e)}"
+         ) from e
+
+
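
The service_type mini-grammar (comma-separated values, ! prefix for negation) recurs throughout this file; a standalone restatement of the parsing rule, mirroring the inline code rather than importing anything from the package:

def parse_service_type_filter(raw: str) -> tuple[list[str], list[str]]:
    """Split 'a,b,!c' into (include, exclude) lists, as the endpoints do."""
    parts = [s.strip() for s in raw.split(",")]
    include = [p for p in parts if not p.startswith("!")]
    exclude = [p[1:] for p in parts if p.startswith("!")]
    return include, exclude


assert parse_service_type_filter("proxy_service,!sdk_service") == (
    ["proxy_service"],
    ["sdk_service"],
)
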
+ @logs_router.get("/stream")
+ async def stream_logs(
+     request: Request,
+     model: str | None = Query(None, description="Filter by model name"),
+     service_type: str | None = Query(
+         None,
+         description="Filter by service type. Supports comma-separated values (e.g., 'proxy_service,sdk_service') and negation with ! prefix (e.g., '!access_log,!sdk_service')",
+     ),
+     min_duration_ms: float | None = Query(
+         None, description="Filter by minimum duration in milliseconds"
+     ),
+     max_duration_ms: float | None = Query(
+         None, description="Filter by maximum duration in milliseconds"
+     ),
+     status_code_min: int | None = Query(
+         None, description="Filter by minimum status code"
+     ),
+     status_code_max: int | None = Query(
+         None, description="Filter by maximum status code"
+     ),
+ ) -> StreamingResponse:
+     """
+     Stream real-time metrics and request logs via Server-Sent Events.
+
+     Returns a continuous stream of request events using event-driven SSE
+     instead of polling. Events are emitted in real-time when requests
+     start, complete, or error. Supports the same filtering as the analytics
+     and entries endpoints.
+     """
+     import asyncio
+     import uuid
+     from collections.abc import AsyncIterator
+
+     # Get request ID from request state
+     request_id = getattr(request.state, "request_id", None)
+
+     if request and hasattr(request, "state") and hasattr(request.state, "context"):
+         # Use existing context from middleware
+         ctx = request.state.context
+         # Set streaming flag for access log
+         ctx.add_metadata(streaming=True)
+         ctx.add_metadata(event_type="streaming_complete")
+
+     # Build filter criteria for event filtering
+     filter_criteria = {
+         "model": model,
+         "service_type": service_type,
+         "min_duration_ms": min_duration_ms,
+         "max_duration_ms": max_duration_ms,
+         "status_code_min": status_code_min,
+         "status_code_max": status_code_max,
+     }
+     # Remove None values
+     filter_criteria = {k: v for k, v in filter_criteria.items() if v is not None}
+
+     def should_include_event(event_data: dict[str, Any]) -> bool:
+         """Check if event matches filter criteria."""
+         if not filter_criteria:
+             return True
+
+         data = event_data.get("data", {})
+
+         # Model filter
+         if "model" in filter_criteria and data.get("model") != filter_criteria["model"]:
+             return False
+
+         # Service type filter with comma-separated and negation support
+         if "service_type" in filter_criteria:
+             service_type_filter = filter_criteria["service_type"]
+             if isinstance(service_type_filter, str):
+                 service_filters = [s.strip() for s in service_type_filter.split(",")]
+             else:
+                 # Handle non-string types by converting to string
+                 service_filters = [str(service_type_filter).strip()]
+             include_filters = [f for f in service_filters if not f.startswith("!")]
+             exclude_filters = [f[1:] for f in service_filters if f.startswith("!")]
+
+             data_service_type = data.get("service_type")
+             if include_filters and data_service_type not in include_filters:
+                 return False
+             if exclude_filters and data_service_type in exclude_filters:
+                 return False
+
+         # Duration filters
+         duration_ms = data.get("duration_ms")
+         if duration_ms is not None:
+             if (
+                 "min_duration_ms" in filter_criteria
+                 and duration_ms < filter_criteria["min_duration_ms"]
+             ):
+                 return False
+             if (
+                 "max_duration_ms" in filter_criteria
+                 and duration_ms > filter_criteria["max_duration_ms"]
+             ):
+                 return False
+
+         # Status code filters
+         status_code = data.get("status_code")
+         if status_code is not None:
+             if (
+                 "status_code_min" in filter_criteria
+                 and status_code < filter_criteria["status_code_min"]
+             ):
+                 return False
+             if (
+                 "status_code_max" in filter_criteria
+                 and status_code > filter_criteria["status_code_max"]
+             ):
+                 return False
+
+         return True
+
+     async def event_stream() -> AsyncIterator[str]:
+         """Generate Server-Sent Events for real-time metrics."""
+         from ccproxy.observability.sse_events import get_sse_manager
+
+         # Get SSE manager
+         sse_manager = get_sse_manager()
+
+         # Create unique connection ID
+         connection_id = str(uuid.uuid4())
+
+         try:
+             # Use SSE manager for event-driven streaming
+             async for event_data in sse_manager.add_connection(
+                 connection_id, request_id
+             ):
+                 # Parse event data to check for filtering
+                 if event_data.startswith("data: "):
+                     try:
+                         import json
+
+                         json_str = event_data[6:].strip()
+                         if json_str:
+                             event_obj = json.loads(json_str)
+
+                             # Apply filters for data events (not connection/system events)
+                             if (
+                                 event_obj.get("type")
+                                 in ["request_complete", "request_start"]
+                                 and filter_criteria
+                             ) and not should_include_event(event_obj):
+                                 continue  # Skip this event
+
+                     except (json.JSONDecodeError, KeyError):
+                         # If we can't parse, pass through (system events)
+                         pass
+
+                 yield event_data
+
+         except asyncio.CancelledError:
+             # Connection was cancelled, cleanup handled by SSE manager
+             pass
+         except Exception as e:
+             # Send error event
+             import json
+
+             error_event = {
+                 "type": "error",
+                 "message": str(e),
+                 "timestamp": time.time(),
+             }
+             yield f"data: {json.dumps(error_event)}\n\n"
+
+     return StreamingResponse(
+         event_stream(),
+         media_type="text/event-stream",
+         headers={
+             "Cache-Control": "no-cache",
+             "Connection": "keep-alive",
+             "Access-Control-Allow-Origin": "*",
+             "Access-Control-Allow-Headers": "Cache-Control",
+         },
+     )
+
+
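
Consuming the stream is a matter of reading 'data: ' lines off the response; a minimal client sketch, base URL assumed for a local run:

import httpx

url = "http://localhost:8000/logs/stream"
params = {"min_duration_ms": 1000}  # only requests slower than one second
with httpx.stream("GET", url, params=params, timeout=None) as resp:
    for line in resp.iter_lines():
        if line.startswith("data: "):
            print(line[6:])  # raw JSON event payload
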
+ @logs_router.get("/entries")
+ async def get_logs_entries(
+     storage: DuckDBStorageDep,
+     settings: SettingsDep,
+     limit: int = Query(
+         50, ge=1, le=1000, description="Maximum number of entries to return"
+     ),
+     offset: int = Query(0, ge=0, description="Number of entries to skip"),
+     order_by: str = Query(
+         "timestamp",
+         description="Column to order by (timestamp, duration_ms, cost_usd, model, service_type, status_code)",
+     ),
+     order_desc: bool = Query(False, description="Order in descending order"),
+     service_type: str | None = Query(
+         None,
+         description="Filter by service type. Supports comma-separated values (e.g., 'proxy_service,sdk_service') and negation with ! prefix (e.g., '!access_log,!sdk_service')",
+     ),
+ ) -> dict[str, Any]:
+     """
+     Get the most recent database entries from the access logs.
+
+     Returns individual request entries with full details for analysis.
+     """
+     try:
+         if not settings.observability.logs_collection_enabled:
+             raise HTTPException(
+                 status_code=503,
+                 detail="Logs collection is disabled. Enable with logs_collection_enabled=true",
+             )
+         if not storage:
+             raise HTTPException(
+                 status_code=503,
+                 detail="Storage backend not available. Ensure DuckDB is installed and pipeline is running.",
+             )
+
+         # Use SQLModel for entries
+         if hasattr(storage, "_engine") and storage._engine:
+             try:
+                 with Session(storage._engine) as session:
+                     # Validate order_by parameter using SQLModel
+                     valid_columns = list(AccessLog.model_fields.keys())
+                     if order_by not in valid_columns:
+                         order_by = "timestamp"
+
+                     # Build SQLModel query
+                     order_attr = getattr(AccessLog, order_by)
+                     order_clause = order_attr.desc() if order_desc else order_attr.asc()
+
+                     statement = select(AccessLog)
+
+                     # Apply service type filtering with comma-separated values and negation
+                     if service_type:
+                         service_filters = [s.strip() for s in service_type.split(",")]
+                         include_filters = [
+                             f for f in service_filters if not f.startswith("!")
+                         ]
+                         exclude_filters = [
+                             f[1:] for f in service_filters if f.startswith("!")
+                         ]
+
+                         if include_filters:
+                             statement = statement.where(
+                                 col(AccessLog.service_type).in_(include_filters)
+                             )
+                         if exclude_filters:
+                             statement = statement.where(
+                                 ~col(AccessLog.service_type).in_(exclude_filters)
+                             )
+
+                     statement = (
+                         statement.order_by(order_clause).offset(offset).limit(limit)
+                     )
+                     results = session.exec(statement).all()
+
+                     # Get total count with same filters
+                     count_statement = select(func.count()).select_from(AccessLog)
+
+                     # Apply same service type filtering to count
+                     if service_type:
+                         service_filters = [s.strip() for s in service_type.split(",")]
+                         include_filters = [
+                             f for f in service_filters if not f.startswith("!")
+                         ]
+                         exclude_filters = [
+                             f[1:] for f in service_filters if f.startswith("!")
+                         ]
+
+                         if include_filters:
+                             count_statement = count_statement.where(
+                                 col(AccessLog.service_type).in_(include_filters)
+                             )
+                         if exclude_filters:
+                             count_statement = count_statement.where(
+                                 ~col(AccessLog.service_type).in_(exclude_filters)
+                             )
+
+                     total_count = session.exec(count_statement).first()
+
+                     # Convert to dict format (model_dump is the Pydantic v2 API)
+                     entries = [log.model_dump() for log in results]
+
+                     return {
+                         "entries": entries,
+                         "total_count": total_count,
+                         "limit": limit,
+                         "offset": offset,
+                         "order_by": order_by,
+                         "order_desc": order_desc,
+                         "service_type": service_type,
+                         "page": (offset // limit) + 1,
+                         "total_pages": ((total_count or 0) + limit - 1) // limit,
+                         "backend": "sqlmodel",
+                     }
+
+             except Exception as e:
+                 import structlog
+
+                 logger = structlog.get_logger(__name__)
+                 logger.error("sqlmodel_entries_error", error=str(e))
+                 raise HTTPException(
+                     status_code=500, detail=f"Failed to retrieve entries: {str(e)}"
+                 ) from e
+         else:
+             raise HTTPException(
+                 status_code=503,
+                 detail="Storage engine not available",
+             )
+
+     except HTTPException:
+         raise
+     except Exception as e:
+         raise HTTPException(
+             status_code=500, detail=f"Failed to retrieve database entries: {str(e)}"
+         ) from e
+
+
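
The limit/offset/total_count trio supports plain pagination; a sketch that walks every page (base URL assumed):

import httpx

base = "http://localhost:8000/logs/entries"
offset = 0
while True:
    page = httpx.get(base, params={"limit": 100, "offset": offset}).json()
    for entry in page["entries"]:
        print(entry["timestamp"], entry.get("model"))
    offset += page["limit"]
    if offset >= (page["total_count"] or 0):
        break
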
+ @logs_router.post("/reset")
+ async def reset_logs_data(
+     storage: DuckDBStorageDep, settings: SettingsDep
+ ) -> dict[str, Any]:
+     """
+     Reset all data in the logs storage.
+
+     This endpoint clears all access logs from the database.
+     Use with caution - this action cannot be undone.
+
+     Returns:
+         Dictionary with reset status and timestamp
+     """
+     try:
+         if not settings.observability.logs_collection_enabled:
+             raise HTTPException(
+                 status_code=503,
+                 detail="Logs collection is disabled. Enable with logs_collection_enabled=true",
+             )
+         if not storage:
+             raise HTTPException(
+                 status_code=503,
+                 detail="Storage backend not available. Ensure DuckDB is installed.",
+             )
+
+         # Check if storage has reset_data method
+         if not hasattr(storage, "reset_data"):
+             raise HTTPException(
+                 status_code=501,
+                 detail="Reset operation not supported by current storage backend",
+             )
+
+         # Perform the reset
+         success = await storage.reset_data()
+
+         if success:
+             return {
+                 "status": "success",
+                 "message": "All logs data has been reset",
+                 "timestamp": time.time(),
+                 "backend": "duckdb",
+             }
+         else:
+             raise HTTPException(
+                 status_code=500,
+                 detail="Reset operation failed",
+             )
+
+     except HTTPException:
+         raise
+     except Exception as e:
+         raise HTTPException(
+             status_code=500, detail=f"Reset operation failed: {str(e)}"
+         ) from e
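
Nothing in this file guards POST /logs/reset; any protection would have to come from the middleware stack (note that ccproxy/api/middleware/auth.py ships empty in this release, per the file list above). Invoking it deliberately, base URL assumed:

import httpx

# Destructive: clears every access-log row; this cannot be undone.
resp = httpx.post("http://localhost:8000/logs/reset")
resp.raise_for_status()
print(resp.json())  # {"status": "success", ...} on success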