isa-model 0.3.91__py3-none-any.whl → 0.4.3__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- isa_model/client.py +1166 -584
- isa_model/core/cache/redis_cache.py +410 -0
- isa_model/core/config/config_manager.py +282 -12
- isa_model/core/config.py +91 -1
- isa_model/core/database/__init__.py +1 -0
- isa_model/core/database/direct_db_client.py +114 -0
- isa_model/core/database/migration_manager.py +563 -0
- isa_model/core/database/migrations.py +297 -0
- isa_model/core/database/supabase_client.py +258 -0
- isa_model/core/dependencies.py +316 -0
- isa_model/core/discovery/__init__.py +19 -0
- isa_model/core/discovery/consul_discovery.py +190 -0
- isa_model/core/logging/__init__.py +54 -0
- isa_model/core/logging/influx_logger.py +523 -0
- isa_model/core/logging/loki_logger.py +160 -0
- isa_model/core/models/__init__.py +46 -0
- isa_model/core/models/config_models.py +625 -0
- isa_model/core/models/deployment_billing_tracker.py +430 -0
- isa_model/core/models/model_billing_tracker.py +60 -88
- isa_model/core/models/model_manager.py +66 -25
- isa_model/core/models/model_metadata.py +690 -0
- isa_model/core/models/model_repo.py +217 -55
- isa_model/core/models/model_statistics_tracker.py +234 -0
- isa_model/core/models/model_storage.py +0 -1
- isa_model/core/models/model_version_manager.py +959 -0
- isa_model/core/models/system_models.py +857 -0
- isa_model/core/pricing_manager.py +2 -249
- isa_model/core/repositories/__init__.py +9 -0
- isa_model/core/repositories/config_repository.py +912 -0
- isa_model/core/resilience/circuit_breaker.py +366 -0
- isa_model/core/security/secrets.py +358 -0
- isa_model/core/services/__init__.py +2 -4
- isa_model/core/services/intelligent_model_selector.py +479 -370
- isa_model/core/storage/hf_storage.py +2 -2
- isa_model/core/types.py +8 -0
- isa_model/deployment/__init__.py +5 -48
- isa_model/deployment/core/__init__.py +2 -31
- isa_model/deployment/core/deployment_manager.py +1278 -368
- isa_model/deployment/local/__init__.py +31 -0
- isa_model/deployment/local/config.py +248 -0
- isa_model/deployment/local/gpu_gateway.py +607 -0
- isa_model/deployment/local/health_checker.py +428 -0
- isa_model/deployment/local/provider.py +586 -0
- isa_model/deployment/local/tensorrt_service.py +621 -0
- isa_model/deployment/local/transformers_service.py +644 -0
- isa_model/deployment/local/vllm_service.py +527 -0
- isa_model/deployment/modal/__init__.py +8 -0
- isa_model/deployment/modal/config.py +136 -0
- isa_model/deployment/modal/deployer.py +894 -0
- isa_model/deployment/modal/services/__init__.py +3 -0
- isa_model/deployment/modal/services/audio/__init__.py +1 -0
- isa_model/deployment/modal/services/audio/isa_audio_chatTTS_service.py +520 -0
- isa_model/deployment/modal/services/audio/isa_audio_openvoice_service.py +758 -0
- isa_model/deployment/modal/services/audio/isa_audio_service_v2.py +1044 -0
- isa_model/deployment/modal/services/embedding/__init__.py +1 -0
- isa_model/deployment/modal/services/embedding/isa_embed_rerank_service.py +296 -0
- isa_model/deployment/modal/services/llm/__init__.py +1 -0
- isa_model/deployment/modal/services/llm/isa_llm_service.py +424 -0
- isa_model/deployment/modal/services/video/__init__.py +1 -0
- isa_model/deployment/modal/services/video/isa_video_hunyuan_service.py +423 -0
- isa_model/deployment/modal/services/vision/__init__.py +1 -0
- isa_model/deployment/modal/services/vision/isa_vision_ocr_service.py +519 -0
- isa_model/deployment/modal/services/vision/isa_vision_qwen25_service.py +709 -0
- isa_model/deployment/modal/services/vision/isa_vision_table_service.py +676 -0
- isa_model/deployment/modal/services/vision/isa_vision_ui_service.py +833 -0
- isa_model/deployment/modal/services/vision/isa_vision_ui_service_optimized.py +660 -0
- isa_model/deployment/models/org-org-acme-corp-tenant-a-service-llm-20250825-225822/tenant-a-service_modal_service.py +48 -0
- isa_model/deployment/models/org-test-org-123-prefix-test-service-llm-20250825-225822/prefix-test-service_modal_service.py +48 -0
- isa_model/deployment/models/test-llm-service-llm-20250825-204442/test-llm-service_modal_service.py +48 -0
- isa_model/deployment/models/test-monitoring-gpt2-llm-20250825-212906/test-monitoring-gpt2_modal_service.py +48 -0
- isa_model/deployment/models/test-monitoring-gpt2-llm-20250825-213009/test-monitoring-gpt2_modal_service.py +48 -0
- isa_model/deployment/storage/__init__.py +5 -0
- isa_model/deployment/storage/deployment_repository.py +824 -0
- isa_model/deployment/triton/__init__.py +10 -0
- isa_model/deployment/triton/config.py +196 -0
- isa_model/deployment/triton/configs/__init__.py +1 -0
- isa_model/deployment/triton/provider.py +512 -0
- isa_model/deployment/triton/scripts/__init__.py +1 -0
- isa_model/deployment/triton/templates/__init__.py +1 -0
- isa_model/inference/__init__.py +47 -1
- isa_model/inference/ai_factory.py +179 -16
- isa_model/inference/legacy_services/__init__.py +21 -0
- isa_model/inference/legacy_services/model_evaluation.py +637 -0
- isa_model/inference/legacy_services/model_service.py +573 -0
- isa_model/inference/legacy_services/model_serving.py +717 -0
- isa_model/inference/legacy_services/model_training.py +561 -0
- isa_model/inference/models/__init__.py +21 -0
- isa_model/inference/models/inference_config.py +551 -0
- isa_model/inference/models/inference_record.py +675 -0
- isa_model/inference/models/performance_models.py +714 -0
- isa_model/inference/repositories/__init__.py +9 -0
- isa_model/inference/repositories/inference_repository.py +828 -0
- isa_model/inference/services/audio/__init__.py +21 -0
- isa_model/inference/services/audio/base_realtime_service.py +225 -0
- isa_model/inference/services/audio/base_stt_service.py +184 -11
- isa_model/inference/services/audio/isa_tts_service.py +0 -0
- isa_model/inference/services/audio/openai_realtime_service.py +320 -124
- isa_model/inference/services/audio/openai_stt_service.py +53 -11
- isa_model/inference/services/base_service.py +17 -1
- isa_model/inference/services/custom_model_manager.py +277 -0
- isa_model/inference/services/embedding/__init__.py +13 -0
- isa_model/inference/services/embedding/base_embed_service.py +111 -8
- isa_model/inference/services/embedding/isa_embed_service.py +305 -0
- isa_model/inference/services/embedding/ollama_embed_service.py +15 -3
- isa_model/inference/services/embedding/openai_embed_service.py +2 -4
- isa_model/inference/services/embedding/resilient_embed_service.py +285 -0
- isa_model/inference/services/embedding/tests/test_embedding.py +222 -0
- isa_model/inference/services/img/__init__.py +2 -2
- isa_model/inference/services/img/base_image_gen_service.py +24 -7
- isa_model/inference/services/img/replicate_image_gen_service.py +84 -422
- isa_model/inference/services/img/services/replicate_face_swap.py +193 -0
- isa_model/inference/services/img/services/replicate_flux.py +226 -0
- isa_model/inference/services/img/services/replicate_flux_kontext.py +219 -0
- isa_model/inference/services/img/services/replicate_sticker_maker.py +249 -0
- isa_model/inference/services/img/tests/test_img_client.py +297 -0
- isa_model/inference/services/llm/__init__.py +10 -2
- isa_model/inference/services/llm/base_llm_service.py +361 -26
- isa_model/inference/services/llm/cerebras_llm_service.py +628 -0
- isa_model/inference/services/llm/helpers/llm_adapter.py +71 -12
- isa_model/inference/services/llm/helpers/llm_prompts.py +342 -0
- isa_model/inference/services/llm/helpers/llm_utils.py +321 -23
- isa_model/inference/services/llm/huggingface_llm_service.py +581 -0
- isa_model/inference/services/llm/local_llm_service.py +747 -0
- isa_model/inference/services/llm/ollama_llm_service.py +11 -3
- isa_model/inference/services/llm/openai_llm_service.py +670 -56
- isa_model/inference/services/llm/yyds_llm_service.py +10 -3
- isa_model/inference/services/vision/__init__.py +27 -6
- isa_model/inference/services/vision/base_vision_service.py +118 -185
- isa_model/inference/services/vision/blip_vision_service.py +359 -0
- isa_model/inference/services/vision/helpers/image_utils.py +19 -10
- isa_model/inference/services/vision/isa_vision_service.py +634 -0
- isa_model/inference/services/vision/openai_vision_service.py +19 -10
- isa_model/inference/services/vision/tests/test_ocr_client.py +284 -0
- isa_model/inference/services/vision/vgg16_vision_service.py +257 -0
- isa_model/serving/api/cache_manager.py +245 -0
- isa_model/serving/api/dependencies/__init__.py +1 -0
- isa_model/serving/api/dependencies/auth.py +194 -0
- isa_model/serving/api/dependencies/database.py +139 -0
- isa_model/serving/api/error_handlers.py +284 -0
- isa_model/serving/api/fastapi_server.py +240 -18
- isa_model/serving/api/middleware/auth.py +317 -0
- isa_model/serving/api/middleware/security.py +268 -0
- isa_model/serving/api/middleware/tenant_context.py +414 -0
- isa_model/serving/api/routes/analytics.py +489 -0
- isa_model/serving/api/routes/config.py +645 -0
- isa_model/serving/api/routes/deployment_billing.py +315 -0
- isa_model/serving/api/routes/deployments.py +475 -0
- isa_model/serving/api/routes/gpu_gateway.py +440 -0
- isa_model/serving/api/routes/health.py +32 -12
- isa_model/serving/api/routes/inference_monitoring.py +486 -0
- isa_model/serving/api/routes/local_deployments.py +448 -0
- isa_model/serving/api/routes/logs.py +430 -0
- isa_model/serving/api/routes/settings.py +582 -0
- isa_model/serving/api/routes/tenants.py +575 -0
- isa_model/serving/api/routes/unified.py +992 -171
- isa_model/serving/api/routes/webhooks.py +479 -0
- isa_model/serving/api/startup.py +318 -0
- isa_model/serving/modal_proxy_server.py +249 -0
- isa_model/utils/gpu_utils.py +311 -0
- {isa_model-0.3.91.dist-info → isa_model-0.4.3.dist-info}/METADATA +76 -22
- isa_model-0.4.3.dist-info/RECORD +193 -0
- isa_model/deployment/cloud/__init__.py +0 -9
- isa_model/deployment/cloud/modal/__init__.py +0 -10
- isa_model/deployment/cloud/modal/isa_vision_doc_service.py +0 -766
- isa_model/deployment/cloud/modal/isa_vision_table_service.py +0 -532
- isa_model/deployment/cloud/modal/isa_vision_ui_service.py +0 -406
- isa_model/deployment/cloud/modal/register_models.py +0 -321
- isa_model/deployment/core/deployment_config.py +0 -356
- isa_model/deployment/core/isa_deployment_service.py +0 -401
- isa_model/deployment/gpu_int8_ds8/app/server.py +0 -66
- isa_model/deployment/gpu_int8_ds8/scripts/test_client.py +0 -43
- isa_model/deployment/gpu_int8_ds8/scripts/test_client_os.py +0 -35
- isa_model/deployment/runtime/deployed_service.py +0 -338
- isa_model/deployment/services/__init__.py +0 -9
- isa_model/deployment/services/auto_deploy_vision_service.py +0 -538
- isa_model/deployment/services/model_service.py +0 -332
- isa_model/deployment/services/service_monitor.py +0 -356
- isa_model/deployment/services/service_registry.py +0 -527
- isa_model/eval/__init__.py +0 -92
- isa_model/eval/benchmarks.py +0 -469
- isa_model/eval/config/__init__.py +0 -10
- isa_model/eval/config/evaluation_config.py +0 -108
- isa_model/eval/evaluators/__init__.py +0 -18
- isa_model/eval/evaluators/base_evaluator.py +0 -503
- isa_model/eval/evaluators/llm_evaluator.py +0 -472
- isa_model/eval/factory.py +0 -531
- isa_model/eval/infrastructure/__init__.py +0 -24
- isa_model/eval/infrastructure/experiment_tracker.py +0 -466
- isa_model/eval/metrics.py +0 -798
- isa_model/inference/adapter/unified_api.py +0 -248
- isa_model/inference/services/helpers/stacked_config.py +0 -148
- isa_model/inference/services/img/flux_professional_service.py +0 -603
- isa_model/inference/services/img/helpers/base_stacked_service.py +0 -274
- isa_model/inference/services/others/table_transformer_service.py +0 -61
- isa_model/inference/services/vision/doc_analysis_service.py +0 -640
- isa_model/inference/services/vision/helpers/base_stacked_service.py +0 -274
- isa_model/inference/services/vision/ui_analysis_service.py +0 -823
- isa_model/scripts/inference_tracker.py +0 -283
- isa_model/scripts/mlflow_manager.py +0 -379
- isa_model/scripts/model_registry.py +0 -465
- isa_model/scripts/register_models.py +0 -370
- isa_model/scripts/register_models_with_embeddings.py +0 -510
- isa_model/scripts/start_mlflow.py +0 -95
- isa_model/scripts/training_tracker.py +0 -257
- isa_model/training/__init__.py +0 -74
- isa_model/training/annotation/annotation_schema.py +0 -47
- isa_model/training/annotation/processors/annotation_processor.py +0 -126
- isa_model/training/annotation/storage/dataset_manager.py +0 -131
- isa_model/training/annotation/storage/dataset_schema.py +0 -44
- isa_model/training/annotation/tests/test_annotation_flow.py +0 -109
- isa_model/training/annotation/tests/test_minio copy.py +0 -113
- isa_model/training/annotation/tests/test_minio_upload.py +0 -43
- isa_model/training/annotation/views/annotation_controller.py +0 -158
- isa_model/training/cloud/__init__.py +0 -22
- isa_model/training/cloud/job_orchestrator.py +0 -402
- isa_model/training/cloud/runpod_trainer.py +0 -454
- isa_model/training/cloud/storage_manager.py +0 -482
- isa_model/training/core/__init__.py +0 -23
- isa_model/training/core/config.py +0 -181
- isa_model/training/core/dataset.py +0 -222
- isa_model/training/core/trainer.py +0 -720
- isa_model/training/core/utils.py +0 -213
- isa_model/training/factory.py +0 -424
- isa_model-0.3.91.dist-info/RECORD +0 -138
- /isa_model/{core/storage/minio_storage.py → deployment/modal/services/audio/isa_audio_fish_service.py} +0 -0
- /isa_model/deployment/{services → modal/services/vision}/simple_auto_deploy_vision_service.py +0 -0
- {isa_model-0.3.91.dist-info → isa_model-0.4.3.dist-info}/WHEEL +0 -0
- {isa_model-0.3.91.dist-info → isa_model-0.4.3.dist-info}/top_level.txt +0 -0
isa_model/inference/repositories/inference_repository.py (new file, 828 lines)
@@ -0,0 +1,828 @@
"""
Inference Repository - Data persistence layer for inference operations

Provides standardized data access for inference requests, usage statistics, and history
following the ISA Model architecture pattern.
"""

import logging
import json
import uuid
from datetime import datetime, timezone, timedelta
from typing import Dict, List, Optional, Any, Union
from pathlib import Path
from dataclasses import dataclass, asdict
from enum import Enum

try:
    # Try to import Supabase for centralized data storage
    from ...core.database.supabase_client import get_supabase_client
    SUPABASE_AVAILABLE = True
except ImportError:
    SUPABASE_AVAILABLE = False

logger = logging.getLogger(__name__)

class InferenceStatus(str, Enum):
    """Inference status enumeration"""
    PENDING = "pending"
    PROCESSING = "processing"
    COMPLETED = "completed"
    FAILED = "failed"
    TIMEOUT = "timeout"
    CANCELLED = "cancelled"

class ServiceType(str, Enum):
    """Service type enumeration"""
    LLM = "llm"
    VISION = "vision"
    EMBEDDING = "embedding"
    TTS = "tts"
    STT = "stt"
    IMAGE_GEN = "image_gen"
    AUDIO = "audio"
    RERANK = "rerank"
    OCR = "ocr"

@dataclass
class InferenceRequest:
    """Inference request record"""
    request_id: str
    service_type: str
    model_id: str
    provider: str
    endpoint: str
    request_data: Dict[str, Any]
    status: str = InferenceStatus.PENDING
    created_at: datetime = None
    started_at: Optional[datetime] = None
    completed_at: Optional[datetime] = None
    user_id: Optional[str] = None
    session_id: Optional[str] = None
    ip_address: Optional[str] = None
    user_agent: Optional[str] = None
    response_data: Optional[Dict[str, Any]] = None
    error_message: Optional[str] = None
    execution_time_ms: Optional[int] = None
    tokens_used: Optional[int] = None
    cost_usd: Optional[float] = None
    metadata: Optional[Dict[str, Any]] = None

    def __post_init__(self):
        if self.created_at is None:
            self.created_at = datetime.now(timezone.utc)

@dataclass
class UsageStatistics:
    """Usage statistics record"""
    stat_id: str
    period_start: datetime
    period_end: datetime
    service_type: str
    model_id: Optional[str] = None
    provider: Optional[str] = None
    user_id: Optional[str] = None
    total_requests: int = 0
    successful_requests: int = 0
    failed_requests: int = 0
    total_tokens: int = 0
    total_cost_usd: float = 0.0
    avg_response_time_ms: float = 0.0
    p95_response_time_ms: float = 0.0
    requests_per_hour: float = 0.0
    error_rate: float = 0.0
    created_at: datetime = None

    def __post_init__(self):
        if self.created_at is None:
            self.created_at = datetime.now(timezone.utc)

@dataclass
class ModelUsageSnapshot:
    """Model usage snapshot for quick analytics"""
    snapshot_id: str
    model_id: str
    provider: str
    snapshot_time: datetime
    hourly_requests: int = 0
    daily_requests: int = 0
    weekly_requests: int = 0
    monthly_requests: int = 0
    total_tokens_today: int = 0
    total_cost_today: float = 0.0
    avg_response_time_today: float = 0.0
    success_rate_today: float = 100.0
    last_used: Optional[datetime] = None

    def __post_init__(self):
        if self.snapshot_time is None:
            self.snapshot_time = datetime.now(timezone.utc)

class InferenceRepository:
    """
    Repository for inference data persistence

    Supports multiple backend storage options:
    1. Supabase (preferred for centralized storage)
    2. Local file system (fallback for development)
    3. In-memory storage (for testing)
    """

    def __init__(self, storage_backend: str = "auto", **kwargs):
        """
        Initialize inference repository

        Args:
            storage_backend: "supabase", "file", "memory", or "auto"
            **kwargs: Backend-specific configuration
        """
        self.storage_backend = self._determine_backend(storage_backend)
        self.config = kwargs

        # Initialize storage backend
        if self.storage_backend == "supabase":
            self._init_supabase()
        elif self.storage_backend == "memory":
            self._init_memory()
        else:  # file system fallback
            self._init_file_system()

        logger.info(f"Inference repository initialized with {self.storage_backend} backend")

    def _determine_backend(self, preference: str) -> str:
        """Determine the best available storage backend"""
        if preference == "supabase" and SUPABASE_AVAILABLE:
            return "supabase"
        elif preference in ["supabase", "file", "memory"]:
            return preference

        # Auto-select best available backend
        if SUPABASE_AVAILABLE:
            return "supabase"
        else:
            return "file"

    def _init_supabase(self):
        """Initialize Supabase backend"""
        try:
            self.supabase_client = get_supabase_client()
            self._ensure_supabase_tables()
            logger.info("Supabase backend initialized for inference")
        except Exception as e:
            logger.error(f"Failed to initialize Supabase backend: {e}")
            self.storage_backend = "file"
            self._init_file_system()

    def _init_file_system(self):
        """Initialize file system backend"""
        self.data_dir = Path(self.config.get("data_dir", "./inference_data"))
        self.data_dir.mkdir(parents=True, exist_ok=True)

        # Create subdirectories
        (self.data_dir / "requests").mkdir(exist_ok=True)
        (self.data_dir / "statistics").mkdir(exist_ok=True)
        (self.data_dir / "snapshots").mkdir(exist_ok=True)

        logger.info(f"File system backend initialized: {self.data_dir}")

    def _init_memory(self):
        """Initialize in-memory backend for testing"""
        self.requests = {}
        self.statistics = {}
        self.snapshots = {}
        logger.info("In-memory backend initialized for inference")

    def _ensure_supabase_tables(self):
        """Ensure required Supabase tables exist"""
        try:
            self.supabase_client.table("inference_requests").select("request_id").limit(1).execute()
            self.supabase_client.table("usage_statistics").select("stat_id").limit(1).execute()
            self.supabase_client.table("model_usage_snapshots").select("snapshot_id").limit(1).execute()
        except Exception as e:
            logger.warning(f"Some inference tables may not exist in Supabase: {e}")

    # Request Management Methods

    def create_inference_request(
        self,
        service_type: str,
        model_id: str,
        provider: str,
        endpoint: str,
        request_data: Dict[str, Any],
        user_id: Optional[str] = None,
        session_id: Optional[str] = None,
        ip_address: Optional[str] = None,
        user_agent: Optional[str] = None,
        metadata: Optional[Dict[str, Any]] = None
    ) -> str:
        """Create a new inference request record"""
        request_id = f"inf_{datetime.now().strftime('%Y%m%d_%H%M%S')}_{uuid.uuid4().hex[:8]}"

        request = InferenceRequest(
            request_id=request_id,
            service_type=service_type,
            model_id=model_id,
            provider=provider,
            endpoint=endpoint,
            request_data=request_data,
            user_id=user_id,
            session_id=session_id,
            ip_address=ip_address,
            user_agent=user_agent,
            metadata=metadata
        )

        if self.storage_backend == "supabase":
            return self._create_request_supabase(request)
        elif self.storage_backend == "memory":
            return self._create_request_memory(request)
        else:
            return self._create_request_file(request)

    def update_inference_status(
        self,
        request_id: str,
        status: str,
        response_data: Optional[Dict[str, Any]] = None,
        error_message: Optional[str] = None,
        execution_time_ms: Optional[int] = None,
        tokens_used: Optional[int] = None,
        cost_usd: Optional[float] = None,
        additional_updates: Optional[Dict[str, Any]] = None
    ) -> bool:
        """Update inference request status and results"""
        updates = {"status": status}

        if status == InferenceStatus.PROCESSING:
            updates["started_at"] = datetime.now(timezone.utc).isoformat()
        elif status in [InferenceStatus.COMPLETED, InferenceStatus.FAILED, InferenceStatus.TIMEOUT]:
            updates["completed_at"] = datetime.now(timezone.utc).isoformat()

        if response_data:
            updates["response_data"] = response_data
        if error_message:
            updates["error_message"] = error_message
        if execution_time_ms:
            updates["execution_time_ms"] = execution_time_ms
        if tokens_used:
            updates["tokens_used"] = tokens_used
        if cost_usd:
            updates["cost_usd"] = cost_usd

        if additional_updates:
            updates.update(additional_updates)

        if self.storage_backend == "supabase":
            return self._update_request_supabase(request_id, updates)
        elif self.storage_backend == "memory":
            return self._update_request_memory(request_id, updates)
        else:
            return self._update_request_file(request_id, updates)

    def get_inference_request(self, request_id: str) -> Optional[InferenceRequest]:
        """Get inference request by ID"""
        if self.storage_backend == "supabase":
            return self._get_request_supabase(request_id)
        elif self.storage_backend == "memory":
            return self._get_request_memory(request_id)
        else:
            return self._get_request_file(request_id)

    def list_recent_requests(
        self,
        service_type: Optional[str] = None,
        model_id: Optional[str] = None,
        user_id: Optional[str] = None,
        status: Optional[str] = None,
        hours: int = 24,
        limit: int = 100
    ) -> List[InferenceRequest]:
        """List recent inference requests with optional filtering"""
        if self.storage_backend == "supabase":
            return self._list_requests_supabase(service_type, model_id, user_id, status, hours, limit)
        elif self.storage_backend == "memory":
            return self._list_requests_memory(service_type, model_id, user_id, status, hours, limit)
        else:
            return self._list_requests_file(service_type, model_id, user_id, status, hours, limit)

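    # --- Reviewer's illustration (not part of the diff): the intended request
    # lifecycle, stitched together from the three methods above. Model and
    # provider names are made up.
    #
    #   repo = InferenceRepository(storage_backend="memory")
    #   req_id = repo.create_inference_request(
    #       service_type=ServiceType.LLM,
    #       model_id="example-model",        # hypothetical
    #       provider="example-provider",     # hypothetical
    #       endpoint="/v1/chat",
    #       request_data={"prompt": "ping"},
    #   )
    #   repo.update_inference_status(req_id, InferenceStatus.PROCESSING)
    #   repo.update_inference_status(
    #       req_id, InferenceStatus.COMPLETED,
    #       execution_time_ms=350, tokens_used=8, cost_usd=0.0002,
    #   )
    #
    # Note that update_inference_status() guards each optional field with a
    # truthiness check, so zero values for execution_time_ms, tokens_used,
    # and cost_usd are silently dropped from the update.
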
    # Usage Statistics Methods

    def record_usage_statistics(
        self,
        period_start: datetime,
        period_end: datetime,
        service_type: str,
        model_id: Optional[str] = None,
        provider: Optional[str] = None,
        user_id: Optional[str] = None,
        total_requests: int = 0,
        successful_requests: int = 0,
        failed_requests: int = 0,
        total_tokens: int = 0,
        total_cost_usd: float = 0.0,
        avg_response_time_ms: float = 0.0,
        p95_response_time_ms: float = 0.0,
        requests_per_hour: float = 0.0,
        error_rate: float = 0.0
    ) -> str:
        """Record usage statistics for a time period"""
        stat_id = f"stat_{period_start.strftime('%Y%m%d_%H')}_{uuid.uuid4().hex[:6]}"

        stats = UsageStatistics(
            stat_id=stat_id,
            period_start=period_start,
            period_end=period_end,
            service_type=service_type,
            model_id=model_id,
            provider=provider,
            user_id=user_id,
            total_requests=total_requests,
            successful_requests=successful_requests,
            failed_requests=failed_requests,
            total_tokens=total_tokens,
            total_cost_usd=total_cost_usd,
            avg_response_time_ms=avg_response_time_ms,
            p95_response_time_ms=p95_response_time_ms,
            requests_per_hour=requests_per_hour,
            error_rate=error_rate
        )

        if self.storage_backend == "supabase":
            return self._record_stats_supabase(stats)
        elif self.storage_backend == "memory":
            return self._record_stats_memory(stats)
        else:
            return self._record_stats_file(stats)

    def get_usage_statistics(
        self,
        service_type: Optional[str] = None,
        model_id: Optional[str] = None,
        user_id: Optional[str] = None,
        days: int = 7,
        limit: int = 100
    ) -> List[UsageStatistics]:
        """Get usage statistics for specified period"""
        if self.storage_backend == "supabase":
            return self._get_stats_supabase(service_type, model_id, user_id, days, limit)
        elif self.storage_backend == "memory":
            return self._get_stats_memory(service_type, model_id, user_id, days, limit)
        else:
            return self._get_stats_file(service_type, model_id, user_id, days, limit)

    def get_aggregated_usage(
        self,
        service_type: Optional[str] = None,
        model_id: Optional[str] = None,
        user_id: Optional[str] = None,
        days: int = 30
    ) -> Dict[str, Any]:
        """Get aggregated usage statistics"""
        stats = self.get_usage_statistics(service_type, model_id, user_id, days, 1000)

        if not stats:
            return {
                "total_requests": 0,
                "total_cost_usd": 0.0,
                "total_tokens": 0,
                "avg_response_time_ms": 0.0,
                "success_rate": 100.0,
                "period_days": days
            }

        total_requests = sum(s.total_requests for s in stats)
        total_successful = sum(s.successful_requests for s in stats)
        total_cost = sum(s.total_cost_usd for s in stats)
        total_tokens = sum(s.total_tokens for s in stats)

        # Weighted average for response time
        weighted_response_times = [s.avg_response_time_ms * s.total_requests for s in stats if s.total_requests > 0]
        avg_response_time = sum(weighted_response_times) / total_requests if total_requests > 0 else 0.0

        success_rate = (total_successful / total_requests * 100) if total_requests > 0 else 100.0

        return {
            "total_requests": total_requests,
            "successful_requests": total_successful,
            "total_cost_usd": round(total_cost, 4),
            "total_tokens": total_tokens,
            "avg_response_time_ms": round(avg_response_time, 2),
            "success_rate": round(success_rate, 2),
            "period_days": days,
            "stats_count": len(stats)
        }

    # Model Usage Snapshots Methods

    def update_model_snapshot(
        self,
        model_id: str,
        provider: str,
        hourly_requests: int = 0,
        daily_requests: int = 0,
        weekly_requests: int = 0,
        monthly_requests: int = 0,
        total_tokens_today: int = 0,
        total_cost_today: float = 0.0,
        avg_response_time_today: float = 0.0,
        success_rate_today: float = 100.0
    ) -> str:
        """Update or create model usage snapshot"""
        snapshot_id = f"snap_{model_id}_{provider}_{datetime.now().strftime('%Y%m%d')}"

        snapshot = ModelUsageSnapshot(
            snapshot_id=snapshot_id,
            model_id=model_id,
            provider=provider,
            snapshot_time=datetime.now(timezone.utc),
            hourly_requests=hourly_requests,
            daily_requests=daily_requests,
            weekly_requests=weekly_requests,
            monthly_requests=monthly_requests,
            total_tokens_today=total_tokens_today,
            total_cost_today=total_cost_today,
            avg_response_time_today=avg_response_time_today,
            success_rate_today=success_rate_today,
            last_used=datetime.now(timezone.utc)
        )

        if self.storage_backend == "supabase":
            return self._update_snapshot_supabase(snapshot)
        elif self.storage_backend == "memory":
            return self._update_snapshot_memory(snapshot)
        else:
            return self._update_snapshot_file(snapshot)

    def get_model_snapshots(
        self,
        model_id: Optional[str] = None,
        provider: Optional[str] = None,
        days: int = 7
    ) -> List[ModelUsageSnapshot]:
        """Get model usage snapshots"""
        if self.storage_backend == "supabase":
            return self._get_snapshots_supabase(model_id, provider, days)
        elif self.storage_backend == "memory":
            return self._get_snapshots_memory(model_id, provider, days)
        else:
            return self._get_snapshots_file(model_id, provider, days)

    def get_top_models(self, metric: str = "daily_requests", limit: int = 10) -> List[Dict[str, Any]]:
        """Get top models by specified metric"""
        snapshots = self.get_model_snapshots(days=1)  # Get latest snapshots

        if not snapshots:
            return []

        # Sort by the specified metric
        valid_metrics = ["hourly_requests", "daily_requests", "weekly_requests", "monthly_requests",
                         "total_tokens_today", "total_cost_today"]

        if metric not in valid_metrics:
            metric = "daily_requests"

        sorted_snapshots = sorted(
            snapshots,
            key=lambda x: getattr(x, metric, 0),
            reverse=True
        )[:limit]

        return [
            {
                "model_id": s.model_id,
                "provider": s.provider,
                "metric_value": getattr(s, metric, 0),
                "daily_requests": s.daily_requests,
                "total_cost_today": s.total_cost_today,
                "success_rate_today": s.success_rate_today,
                "last_used": s.last_used.isoformat() if s.last_used else None
            }
            for s in sorted_snapshots
        ]

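    # --- Reviewer's illustration (not part of the diff): ranking models ---
    #
    #   leaders = repo.get_top_models(metric="total_cost_today", limit=5)
    #   # -> [{"model_id": ..., "provider": ..., "metric_value": ..., ...}, ...]
    #
    # An unrecognized metric silently falls back to "daily_requests" rather
    # than raising, and only the current day's snapshots (days=1) are ranked.
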
    # Cleanup and Maintenance Methods

    def cleanup_old_requests(self, days: int = 30) -> int:
        """Clean up old inference requests"""
        cutoff_date = datetime.now(timezone.utc) - timedelta(days=days)

        if self.storage_backend == "supabase":
            return self._cleanup_requests_supabase(cutoff_date)
        elif self.storage_backend == "memory":
            return self._cleanup_requests_memory(cutoff_date)
        else:
            return self._cleanup_requests_file(cutoff_date)

    def cleanup_old_statistics(self, days: int = 90) -> int:
        """Clean up old usage statistics"""
        cutoff_date = datetime.now(timezone.utc) - timedelta(days=days)

        if self.storage_backend == "supabase":
            return self._cleanup_stats_supabase(cutoff_date)
        elif self.storage_backend == "memory":
            return self._cleanup_stats_memory(cutoff_date)
        else:
            return self._cleanup_stats_file(cutoff_date)

    # Backend-specific implementations

    def _create_request_file(self, request: InferenceRequest) -> str:
        """Create request in file system"""
        try:
            request_file = self.data_dir / "requests" / f"{request.request_id}.json"
            request_data = asdict(request)

            # Convert datetime objects to ISO strings
            for key in ['created_at', 'started_at', 'completed_at']:
                if request_data[key] and isinstance(request_data[key], datetime):
                    request_data[key] = request_data[key].isoformat()

            with open(request_file, 'w') as f:
                json.dump(request_data, f, indent=2, ensure_ascii=False)

            return request.request_id
        except Exception as e:
            logger.error(f"Failed to create request in file system: {e}")
            raise

    def _create_request_memory(self, request: InferenceRequest) -> str:
        """Create request in memory"""
        self.requests[request.request_id] = request
        return request.request_id

    def _update_request_file(self, request_id: str, updates: Dict[str, Any]) -> bool:
        """Update request in file system"""
        try:
            request_file = self.data_dir / "requests" / f"{request_id}.json"
            if not request_file.exists():
                return False

            with open(request_file, 'r') as f:
                request_data = json.load(f)

            request_data.update(updates)

            with open(request_file, 'w') as f:
                json.dump(request_data, f, indent=2, ensure_ascii=False)

            return True
        except Exception as e:
            logger.error(f"Failed to update request in file system: {e}")
            return False

    def _update_request_memory(self, request_id: str, updates: Dict[str, Any]) -> bool:
        """Update request in memory"""
        if request_id not in self.requests:
            return False

        request_dict = asdict(self.requests[request_id])
        request_dict.update(updates)

        # Convert datetime strings back to datetime objects if needed
        for key in ['created_at', 'started_at', 'completed_at']:
            if key in request_dict and isinstance(request_dict[key], str):
                request_dict[key] = datetime.fromisoformat(request_dict[key])

        self.requests[request_id] = InferenceRequest(**request_dict)
        return True

    def _get_request_file(self, request_id: str) -> Optional[InferenceRequest]:
        """Get request from file system"""
        try:
            request_file = self.data_dir / "requests" / f"{request_id}.json"
            if not request_file.exists():
                return None

            with open(request_file, 'r') as f:
                request_data = json.load(f)

            # Convert ISO strings back to datetime objects
            for key in ['created_at', 'started_at', 'completed_at']:
                if request_data[key]:
                    request_data[key] = datetime.fromisoformat(request_data[key])

            return InferenceRequest(**request_data)
        except Exception as e:
            logger.error(f"Failed to get request from file system: {e}")
            return None

    def _get_request_memory(self, request_id: str) -> Optional[InferenceRequest]:
        """Get request from memory"""
        return self.requests.get(request_id)

    def _list_requests_file(
        self, service_type: Optional[str], model_id: Optional[str],
        user_id: Optional[str], status: Optional[str], hours: int, limit: int
    ) -> List[InferenceRequest]:
        """List requests from file system"""
        try:
            requests = []
            requests_dir = self.data_dir / "requests"
            cutoff_time = datetime.now(timezone.utc) - timedelta(hours=hours)

            for request_file in requests_dir.glob("*.json"):
                with open(request_file, 'r') as f:
                    request_data = json.load(f)

                # Convert datetime fields
                for key in ['created_at', 'started_at', 'completed_at']:
                    if request_data[key]:
                        request_data[key] = datetime.fromisoformat(request_data[key])

                request = InferenceRequest(**request_data)

                # Apply filters
                if request.created_at < cutoff_time:
                    continue
                if service_type and request.service_type != service_type:
                    continue
                if model_id and request.model_id != model_id:
                    continue
                if user_id and request.user_id != user_id:
                    continue
                if status and request.status != status:
                    continue

                requests.append(request)

                if len(requests) >= limit:
                    break

            return sorted(requests, key=lambda x: x.created_at, reverse=True)
        except Exception as e:
            logger.error(f"Failed to list requests from file system: {e}")
            return []

    def _list_requests_memory(
        self, service_type: Optional[str], model_id: Optional[str],
        user_id: Optional[str], status: Optional[str], hours: int, limit: int
    ) -> List[InferenceRequest]:
        """List requests from memory"""
        cutoff_time = datetime.now(timezone.utc) - timedelta(hours=hours)
        requests = []

        for request in self.requests.values():
            # Apply filters
            if request.created_at < cutoff_time:
                continue
            if service_type and request.service_type != service_type:
                continue
            if model_id and request.model_id != model_id:
                continue
            if user_id and request.user_id != user_id:
                continue
            if status and request.status != status:
                continue

            requests.append(request)

            if len(requests) >= limit:
                break

        return sorted(requests, key=lambda x: x.created_at, reverse=True)

    # Simplified placeholder implementations for statistics and snapshots
    def _record_stats_file(self, stats: UsageStatistics) -> str:
        """Record statistics in file system"""
        try:
            stats_file = self.data_dir / "statistics" / f"{stats.stat_id}.json"
            stats_data = asdict(stats)

            # Convert datetime objects to ISO strings
            for key in ['period_start', 'period_end', 'created_at']:
                if stats_data[key] and isinstance(stats_data[key], datetime):
                    stats_data[key] = stats_data[key].isoformat()

            with open(stats_file, 'w') as f:
                json.dump(stats_data, f, indent=2, ensure_ascii=False)

            return stats.stat_id
        except Exception as e:
            logger.error(f"Failed to record statistics in file system: {e}")
            raise

    def _record_stats_memory(self, stats: UsageStatistics) -> str:
        """Record statistics in memory"""
        self.statistics[stats.stat_id] = stats
        return stats.stat_id

    def _update_snapshot_file(self, snapshot: ModelUsageSnapshot) -> str:
        """Update snapshot in file system"""
        try:
            snapshot_file = self.data_dir / "snapshots" / f"{snapshot.snapshot_id}.json"
            snapshot_data = asdict(snapshot)

            # Convert datetime objects to ISO strings
            for key in ['snapshot_time', 'last_used']:
                if snapshot_data[key] and isinstance(snapshot_data[key], datetime):
                    snapshot_data[key] = snapshot_data[key].isoformat()

            with open(snapshot_file, 'w') as f:
                json.dump(snapshot_data, f, indent=2, ensure_ascii=False)

            return snapshot.snapshot_id
        except Exception as e:
            logger.error(f"Failed to update snapshot in file system: {e}")
            raise

    def _update_snapshot_memory(self, snapshot: ModelUsageSnapshot) -> str:
        """Update snapshot in memory"""
        self.snapshots[snapshot.snapshot_id] = snapshot
        return snapshot.snapshot_id

    # Cleanup implementations
    def _cleanup_requests_file(self, cutoff_date: datetime) -> int:
        """Cleanup old requests from file system"""
        count = 0
        try:
            requests_dir = self.data_dir / "requests"
            for request_file in requests_dir.glob("*.json"):
                if request_file.stat().st_mtime < cutoff_date.timestamp():
                    request_file.unlink()
                    count += 1
        except Exception as e:
            logger.error(f"Failed to cleanup requests from file system: {e}")
        return count

    def _cleanup_requests_memory(self, cutoff_date: datetime) -> int:
        """Cleanup old requests from memory"""
        count = 0
        to_remove = []
        for request_id, request in self.requests.items():
            if request.created_at < cutoff_date:
                to_remove.append(request_id)

        for request_id in to_remove:
            del self.requests[request_id]
            count += 1

        return count

    # Placeholder implementations for Supabase backend
    def _create_request_supabase(self, request: InferenceRequest) -> str:
        return request.request_id  # Implementation needed

    def _update_request_supabase(self, request_id: str, updates: Dict[str, Any]) -> bool:
        return False  # Implementation needed

    def _get_request_supabase(self, request_id: str) -> Optional[InferenceRequest]:
        return None  # Implementation needed

    def _list_requests_supabase(self, service_type, model_id, user_id, status, hours, limit) -> List[InferenceRequest]:
        return []  # Implementation needed

    def _record_stats_supabase(self, stats: UsageStatistics) -> str:
        return stats.stat_id  # Implementation needed

    def _get_stats_supabase(self, service_type, model_id, user_id, days, limit) -> List[UsageStatistics]:
        return []  # Implementation needed

    def _get_stats_memory(self, service_type, model_id, user_id, days, limit) -> List[UsageStatistics]:
        return list(self.statistics.values())[:limit]

    def _get_stats_file(self, service_type, model_id, user_id, days, limit) -> List[UsageStatistics]:
        return []  # Implementation needed

    def _update_snapshot_supabase(self, snapshot: ModelUsageSnapshot) -> str:
        return snapshot.snapshot_id  # Implementation needed

    def _get_snapshots_supabase(self, model_id, provider, days) -> List[ModelUsageSnapshot]:
        return []  # Implementation needed

    def _get_snapshots_memory(self, model_id, provider, days) -> List[ModelUsageSnapshot]:
        return list(self.snapshots.values())

    def _get_snapshots_file(self, model_id, provider, days) -> List[ModelUsageSnapshot]:
        return []  # Implementation needed

    def _cleanup_requests_supabase(self, cutoff_date: datetime) -> int:
        return 0  # Implementation needed

    def _cleanup_stats_supabase(self, cutoff_date: datetime) -> int:
        return 0  # Implementation needed

    def _cleanup_stats_memory(self, cutoff_date: datetime) -> int:
        count = 0
        to_remove = []
        for stat_id, stat in self.statistics.items():
            if stat.created_at < cutoff_date:
                to_remove.append(stat_id)

        for stat_id in to_remove:
            del self.statistics[stat_id]
            count += 1

        return count

    def _cleanup_stats_file(self, cutoff_date: datetime) -> int:
        count = 0
        try:
            stats_dir = self.data_dir / "statistics"
            for stats_file in stats_dir.glob("*.json"):
                if stats_file.stat().st_mtime < cutoff_date.timestamp():
                    stats_file.unlink()
                    count += 1
        except Exception as e:
            logger.error(f"Failed to cleanup statistics from file system: {e}")
        return count
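A minimal end-to-end sketch of the new repository (reviewer's illustration, not shipped in the wheel): the import path follows the file's location in this diff, the in-memory backend and method signatures come from the code above, and the model and provider names are made up.

    from datetime import datetime, timedelta, timezone

    from isa_model.inference.repositories.inference_repository import (
        InferenceRepository, InferenceStatus, ServiceType,
    )

    # In-memory backend keeps everything in plain dicts -- handy for tests.
    repo = InferenceRepository(storage_backend="memory")

    # 1. Record a request and walk it through its lifecycle.
    req_id = repo.create_inference_request(
        service_type=ServiceType.LLM,
        model_id="example-model",         # hypothetical
        provider="example-provider",      # hypothetical
        endpoint="/v1/chat",
        request_data={"prompt": "ping"},
    )
    repo.update_inference_status(req_id, InferenceStatus.PROCESSING)
    repo.update_inference_status(
        req_id, InferenceStatus.COMPLETED,
        response_data={"text": "pong"},
        execution_time_ms=350, tokens_used=8, cost_usd=0.0002,
    )

    # 2. Roll the hour up into a statistics row, then aggregate it.
    now = datetime.now(timezone.utc)
    repo.record_usage_statistics(
        period_start=now - timedelta(hours=1), period_end=now,
        service_type=ServiceType.LLM,
        model_id="example-model", provider="example-provider",
        total_requests=1, successful_requests=1,
        total_tokens=8, total_cost_usd=0.0002, avg_response_time_ms=350.0,
    )
    print(repo.get_aggregated_usage(days=1))

Note that the Supabase code paths are still stubs in this release ("Implementation needed"), so only the file and memory backends round-trip data end to end.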