isa-model 0.4.0__py3-none-any.whl → 0.4.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (199)
  1. isa_model/client.py +466 -43
  2. isa_model/core/cache/redis_cache.py +12 -3
  3. isa_model/core/config/config_manager.py +230 -3
  4. isa_model/core/config.py +90 -0
  5. isa_model/core/database/direct_db_client.py +114 -0
  6. isa_model/core/database/migration_manager.py +563 -0
  7. isa_model/core/database/migrations.py +21 -1
  8. isa_model/core/database/supabase_client.py +154 -19
  9. isa_model/core/dependencies.py +316 -0
  10. isa_model/core/discovery/__init__.py +19 -0
  11. isa_model/core/discovery/consul_discovery.py +190 -0
  12. isa_model/core/logging/__init__.py +54 -0
  13. isa_model/core/logging/influx_logger.py +523 -0
  14. isa_model/core/logging/loki_logger.py +160 -0
  15. isa_model/core/models/__init__.py +27 -18
  16. isa_model/core/models/config_models.py +625 -0
  17. isa_model/core/models/deployment_billing_tracker.py +430 -0
  18. isa_model/core/models/model_manager.py +40 -17
  19. isa_model/core/models/model_metadata.py +690 -0
  20. isa_model/core/models/model_repo.py +174 -18
  21. isa_model/core/models/system_models.py +857 -0
  22. isa_model/core/repositories/__init__.py +9 -0
  23. isa_model/core/repositories/config_repository.py +912 -0
  24. isa_model/core/services/intelligent_model_selector.py +399 -21
  25. isa_model/core/storage/hf_storage.py +1 -1
  26. isa_model/core/types.py +1 -0
  27. isa_model/deployment/__init__.py +5 -48
  28. isa_model/deployment/core/__init__.py +2 -31
  29. isa_model/deployment/core/deployment_manager.py +1278 -370
  30. isa_model/deployment/local/__init__.py +31 -0
  31. isa_model/deployment/local/config.py +248 -0
  32. isa_model/deployment/local/gpu_gateway.py +607 -0
  33. isa_model/deployment/local/health_checker.py +428 -0
  34. isa_model/deployment/local/provider.py +586 -0
  35. isa_model/deployment/local/tensorrt_service.py +621 -0
  36. isa_model/deployment/local/transformers_service.py +644 -0
  37. isa_model/deployment/local/vllm_service.py +527 -0
  38. isa_model/deployment/modal/__init__.py +8 -0
  39. isa_model/deployment/modal/config.py +136 -0
  40. isa_model/deployment/{services/auto_hf_modal_deployer.py → modal/deployer.py} +1 -1
  41. isa_model/deployment/modal/services/__init__.py +3 -0
  42. isa_model/deployment/modal/services/audio/__init__.py +1 -0
  43. isa_model/deployment/modal/services/embedding/__init__.py +1 -0
  44. isa_model/deployment/modal/services/llm/__init__.py +1 -0
  45. isa_model/deployment/modal/services/llm/isa_llm_service.py +424 -0
  46. isa_model/deployment/modal/services/video/__init__.py +1 -0
  47. isa_model/deployment/modal/services/vision/__init__.py +1 -0
  48. isa_model/deployment/models/org-org-acme-corp-tenant-a-service-llm-20250825-225822/tenant-a-service_modal_service.py +48 -0
  49. isa_model/deployment/models/org-test-org-123-prefix-test-service-llm-20250825-225822/prefix-test-service_modal_service.py +48 -0
  50. isa_model/deployment/models/test-llm-service-llm-20250825-204442/test-llm-service_modal_service.py +48 -0
  51. isa_model/deployment/models/test-monitoring-gpt2-llm-20250825-212906/test-monitoring-gpt2_modal_service.py +48 -0
  52. isa_model/deployment/models/test-monitoring-gpt2-llm-20250825-213009/test-monitoring-gpt2_modal_service.py +48 -0
  53. isa_model/deployment/storage/__init__.py +5 -0
  54. isa_model/deployment/storage/deployment_repository.py +824 -0
  55. isa_model/deployment/triton/__init__.py +10 -0
  56. isa_model/deployment/triton/config.py +196 -0
  57. isa_model/deployment/triton/configs/__init__.py +1 -0
  58. isa_model/deployment/triton/provider.py +512 -0
  59. isa_model/deployment/triton/scripts/__init__.py +1 -0
  60. isa_model/deployment/triton/templates/__init__.py +1 -0
  61. isa_model/inference/__init__.py +47 -1
  62. isa_model/inference/ai_factory.py +137 -10
  63. isa_model/inference/legacy_services/__init__.py +21 -0
  64. isa_model/inference/legacy_services/model_evaluation.py +637 -0
  65. isa_model/inference/legacy_services/model_service.py +573 -0
  66. isa_model/inference/legacy_services/model_serving.py +717 -0
  67. isa_model/inference/legacy_services/model_training.py +561 -0
  68. isa_model/inference/models/__init__.py +21 -0
  69. isa_model/inference/models/inference_config.py +551 -0
  70. isa_model/inference/models/inference_record.py +675 -0
  71. isa_model/inference/models/performance_models.py +714 -0
  72. isa_model/inference/repositories/__init__.py +9 -0
  73. isa_model/inference/repositories/inference_repository.py +828 -0
  74. isa_model/inference/services/audio/base_stt_service.py +184 -11
  75. isa_model/inference/services/audio/openai_stt_service.py +22 -6
  76. isa_model/inference/services/custom_model_manager.py +277 -0
  77. isa_model/inference/services/embedding/ollama_embed_service.py +15 -3
  78. isa_model/inference/services/embedding/resilient_embed_service.py +285 -0
  79. isa_model/inference/services/llm/__init__.py +10 -2
  80. isa_model/inference/services/llm/base_llm_service.py +335 -24
  81. isa_model/inference/services/llm/cerebras_llm_service.py +628 -0
  82. isa_model/inference/services/llm/helpers/llm_adapter.py +9 -4
  83. isa_model/inference/services/llm/helpers/llm_prompts.py +342 -0
  84. isa_model/inference/services/llm/helpers/llm_utils.py +321 -23
  85. isa_model/inference/services/llm/huggingface_llm_service.py +581 -0
  86. isa_model/inference/services/llm/local_llm_service.py +747 -0
  87. isa_model/inference/services/llm/ollama_llm_service.py +9 -2
  88. isa_model/inference/services/llm/openai_llm_service.py +33 -16
  89. isa_model/inference/services/llm/yyds_llm_service.py +8 -2
  90. isa_model/inference/services/vision/__init__.py +22 -1
  91. isa_model/inference/services/vision/blip_vision_service.py +359 -0
  92. isa_model/inference/services/vision/helpers/image_utils.py +8 -5
  93. isa_model/inference/services/vision/isa_vision_service.py +65 -4
  94. isa_model/inference/services/vision/openai_vision_service.py +19 -10
  95. isa_model/inference/services/vision/vgg16_vision_service.py +257 -0
  96. isa_model/serving/api/cache_manager.py +245 -0
  97. isa_model/serving/api/dependencies/__init__.py +1 -0
  98. isa_model/serving/api/dependencies/auth.py +194 -0
  99. isa_model/serving/api/dependencies/database.py +139 -0
  100. isa_model/serving/api/error_handlers.py +284 -0
  101. isa_model/serving/api/fastapi_server.py +172 -22
  102. isa_model/serving/api/middleware/auth.py +8 -2
  103. isa_model/serving/api/middleware/security.py +23 -33
  104. isa_model/serving/api/middleware/tenant_context.py +414 -0
  105. isa_model/serving/api/routes/analytics.py +4 -1
  106. isa_model/serving/api/routes/config.py +645 -0
  107. isa_model/serving/api/routes/deployment_billing.py +315 -0
  108. isa_model/serving/api/routes/deployments.py +138 -2
  109. isa_model/serving/api/routes/gpu_gateway.py +440 -0
  110. isa_model/serving/api/routes/health.py +32 -12
  111. isa_model/serving/api/routes/inference_monitoring.py +486 -0
  112. isa_model/serving/api/routes/local_deployments.py +448 -0
  113. isa_model/serving/api/routes/tenants.py +575 -0
  114. isa_model/serving/api/routes/unified.py +680 -18
  115. isa_model/serving/api/routes/webhooks.py +479 -0
  116. isa_model/serving/api/startup.py +68 -54
  117. isa_model/utils/gpu_utils.py +311 -0
  118. {isa_model-0.4.0.dist-info → isa_model-0.4.3.dist-info}/METADATA +66 -24
  119. isa_model-0.4.3.dist-info/RECORD +193 -0
  120. isa_model/core/storage/minio_storage.py +0 -0
  121. isa_model/deployment/cloud/__init__.py +0 -9
  122. isa_model/deployment/cloud/modal/__init__.py +0 -10
  123. isa_model/deployment/core/deployment_config.py +0 -356
  124. isa_model/deployment/core/isa_deployment_service.py +0 -401
  125. isa_model/deployment/gpu_int8_ds8/app/server.py +0 -66
  126. isa_model/deployment/gpu_int8_ds8/scripts/test_client.py +0 -43
  127. isa_model/deployment/gpu_int8_ds8/scripts/test_client_os.py +0 -35
  128. isa_model/deployment/runtime/deployed_service.py +0 -338
  129. isa_model/deployment/services/__init__.py +0 -9
  130. isa_model/deployment/services/auto_deploy_vision_service.py +0 -538
  131. isa_model/deployment/services/model_service.py +0 -332
  132. isa_model/deployment/services/service_monitor.py +0 -356
  133. isa_model/deployment/services/service_registry.py +0 -527
  134. isa_model/eval/__init__.py +0 -92
  135. isa_model/eval/benchmarks/__init__.py +0 -27
  136. isa_model/eval/benchmarks/multimodal_datasets.py +0 -460
  137. isa_model/eval/benchmarks.py +0 -701
  138. isa_model/eval/config/__init__.py +0 -10
  139. isa_model/eval/config/evaluation_config.py +0 -108
  140. isa_model/eval/evaluators/__init__.py +0 -24
  141. isa_model/eval/evaluators/audio_evaluator.py +0 -727
  142. isa_model/eval/evaluators/base_evaluator.py +0 -503
  143. isa_model/eval/evaluators/embedding_evaluator.py +0 -742
  144. isa_model/eval/evaluators/llm_evaluator.py +0 -472
  145. isa_model/eval/evaluators/vision_evaluator.py +0 -564
  146. isa_model/eval/example_evaluation.py +0 -395
  147. isa_model/eval/factory.py +0 -798
  148. isa_model/eval/infrastructure/__init__.py +0 -24
  149. isa_model/eval/infrastructure/experiment_tracker.py +0 -466
  150. isa_model/eval/isa_benchmarks.py +0 -700
  151. isa_model/eval/isa_integration.py +0 -582
  152. isa_model/eval/metrics.py +0 -951
  153. isa_model/eval/tests/unit/test_basic.py +0 -396
  154. isa_model/serving/api/routes/evaluations.py +0 -579
  155. isa_model/training/__init__.py +0 -168
  156. isa_model/training/annotation/annotation_schema.py +0 -47
  157. isa_model/training/annotation/processors/annotation_processor.py +0 -126
  158. isa_model/training/annotation/storage/dataset_manager.py +0 -131
  159. isa_model/training/annotation/storage/dataset_schema.py +0 -44
  160. isa_model/training/annotation/tests/test_annotation_flow.py +0 -109
  161. isa_model/training/annotation/tests/test_minio copy.py +0 -113
  162. isa_model/training/annotation/tests/test_minio_upload.py +0 -43
  163. isa_model/training/annotation/views/annotation_controller.py +0 -158
  164. isa_model/training/cloud/__init__.py +0 -22
  165. isa_model/training/cloud/job_orchestrator.py +0 -402
  166. isa_model/training/cloud/runpod_trainer.py +0 -454
  167. isa_model/training/cloud/storage_manager.py +0 -482
  168. isa_model/training/core/__init__.py +0 -26
  169. isa_model/training/core/config.py +0 -181
  170. isa_model/training/core/dataset.py +0 -222
  171. isa_model/training/core/trainer.py +0 -720
  172. isa_model/training/core/utils.py +0 -213
  173. isa_model/training/examples/intelligent_training_example.py +0 -281
  174. isa_model/training/factory.py +0 -424
  175. isa_model/training/intelligent/__init__.py +0 -25
  176. isa_model/training/intelligent/decision_engine.py +0 -643
  177. isa_model/training/intelligent/intelligent_factory.py +0 -888
  178. isa_model/training/intelligent/knowledge_base.py +0 -751
  179. isa_model/training/intelligent/resource_optimizer.py +0 -839
  180. isa_model/training/intelligent/task_classifier.py +0 -576
  181. isa_model/training/storage/__init__.py +0 -24
  182. isa_model/training/storage/core_integration.py +0 -439
  183. isa_model/training/storage/training_repository.py +0 -552
  184. isa_model/training/storage/training_storage.py +0 -628
  185. isa_model-0.4.0.dist-info/RECORD +0 -182
  186. /isa_model/deployment/{cloud/modal → modal/services/audio}/isa_audio_chatTTS_service.py +0 -0
  187. /isa_model/deployment/{cloud/modal → modal/services/audio}/isa_audio_fish_service.py +0 -0
  188. /isa_model/deployment/{cloud/modal → modal/services/audio}/isa_audio_openvoice_service.py +0 -0
  189. /isa_model/deployment/{cloud/modal → modal/services/audio}/isa_audio_service_v2.py +0 -0
  190. /isa_model/deployment/{cloud/modal → modal/services/embedding}/isa_embed_rerank_service.py +0 -0
  191. /isa_model/deployment/{cloud/modal → modal/services/video}/isa_video_hunyuan_service.py +0 -0
  192. /isa_model/deployment/{cloud/modal → modal/services/vision}/isa_vision_ocr_service.py +0 -0
  193. /isa_model/deployment/{cloud/modal → modal/services/vision}/isa_vision_qwen25_service.py +0 -0
  194. /isa_model/deployment/{cloud/modal → modal/services/vision}/isa_vision_table_service.py +0 -0
  195. /isa_model/deployment/{cloud/modal → modal/services/vision}/isa_vision_ui_service.py +0 -0
  196. /isa_model/deployment/{cloud/modal → modal/services/vision}/isa_vision_ui_service_optimized.py +0 -0
  197. /isa_model/deployment/{services → modal/services/vision}/simple_auto_deploy_vision_service.py +0 -0
  198. {isa_model-0.4.0.dist-info → isa_model-0.4.3.dist-info}/WHEEL +0 -0
  199. {isa_model-0.4.0.dist-info → isa_model-0.4.3.dist-info}/top_level.txt +0 -0

isa_model/inference/services/vision/isa_vision_service.py
@@ -9,6 +9,7 @@ import logging
 import base64
 import io
 import time
+import asyncio
 from typing import Dict, Any, List, Union, Optional, BinaryIO
 from PIL import Image
 
@@ -36,7 +37,7 @@ class ISAVisionService(BaseVisionService):
     def __init__(self,
                  modal_app_id: str = "ap-VlHUQoiPUdy9cgrHSfG7Fk",
                  modal_app_name: str = "isa-vision-ui-optimized",
-                 timeout: int = 30):
+                 timeout: int = 60):
         """
         Initialize the ISA Vision service
 
@@ -77,6 +78,31 @@ class ISAVisionService(BaseVisionService):
         self.request_count = 0
         self.total_cost = 0.0
 
+        # Performance optimization - warm up the connection (lazy initialization)
+        self._connection_warmed = False
+
+        # Simple caching mechanism (optional)
+        self._result_cache = {}
+        self._cache_max_size = 100
+
+    async def _warm_connection(self):
+        """Warm up the Modal connection to reduce first-call latency"""
+        if self._connection_warmed or not self.modal_app:
+            return
+
+        try:
+            logger.info("Warming up Modal connection...")
+            # Fetch the service status to warm up the connection
+            if hasattr(self.modal_app, 'list_functions'):
+                await asyncio.wait_for(
+                    asyncio.to_thread(self.modal_app.list_functions),
+                    timeout=10
+                )
+            self._connection_warmed = True
+            logger.info("✅ Modal connection warmed up")
+        except Exception as e:
+            logger.warning(f"Failed to warm up connection: {e}")
+
     async def analyze_image(
         self,
         image: Union[str, BinaryIO],
@@ -154,6 +180,9 @@ class ISAVisionService(BaseVisionService):
                 'error': 'Modal app or service not available'
             }
 
+        # Warm up the connection to reduce latency
+        await self._warm_connection()
+
         # Prepare the image data
         image_b64 = await self._prepare_image_base64(image)
 
@@ -208,11 +237,22 @@ class ISAVisionService(BaseVisionService):
 
             # Create an instance and call the optimized method (fast mode, no captions)
             instance = OptimizedUIDetectionService()
-            result = instance.detect_ui_elements_fast.remote(image_b64, enable_captions=False)
+            # Bound the Modal call with a timeout
+            result = await asyncio.wait_for(
+                instance.detect_ui_elements_fast.remote(image_b64, enable_captions=False),
+                timeout=self.timeout
+            )
 
             logger.info("✅ Modal SDK call successful")
             return result
 
+        except asyncio.TimeoutError:
+            logger.error(f"Modal SDK call timed out after {self.timeout} seconds")
+            return {
+                'success': False,
+                'error': f'Modal service timeout after {self.timeout} seconds',
+                'timeout': True
+            }
         except Exception as e:
             logger.error(f"Modal SDK call failed: {e}")
             return {
@@ -316,11 +356,22 @@ class ISAVisionService(BaseVisionService):
 
             # Create an instance and call the method
             instance = SuryaOCRService()
-            result = instance.extract_text.remote(image_b64, languages)
+            # Bound the OCR call with a timeout
+            result = await asyncio.wait_for(
+                instance.extract_text.remote(image_b64, languages),
+                timeout=self.timeout
+            )
 
             logger.info("✅ OCR service call successful")
             return result
 
+        except asyncio.TimeoutError:
+            logger.error(f"OCR service call timed out after {self.timeout} seconds")
+            return {
+                'success': False,
+                'error': f'OCR service timeout after {self.timeout} seconds',
+                'timeout': True
+            }
         except Exception as e:
             logger.error(f"OCR service call failed: {e}")
             return {
@@ -499,7 +550,7 @@
         """Prepare a base64-encoded image"""
         if isinstance(image, str):
             # Check if it's already base64 encoded
-            if image.startswith('data:image') or len(image) > 1000:
+            if image.startswith('data:image') or (not image.startswith('http') and len(image) > 1000):
                 # Likely already base64
                 if image.startswith('data:image'):
                     # Extract base64 part
@@ -507,6 +558,16 @@
                 else:
                     # Assume it's pure base64
                     return image
+            elif image.startswith('http://') or image.startswith('https://'):
+                # URL - download the image
+                import aiohttp
+                async with aiohttp.ClientSession() as session:
+                    async with session.get(image) as response:
+                        if response.status == 200:
+                            image_data = await response.read()
+                            return base64.b64encode(image_data).decode('utf-8')
+                        else:
+                            raise ValueError(f"Failed to download image from URL: {response.status}")
             else:
                 # File path
                 with open(image, 'rb') as f:
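
The hunks above raise the default Modal timeout from 30s to 60s, add lazy connection warm-up, wrap remote calls in asyncio.wait_for, and teach _prepare_image_base64 to download http(s) URLs via aiohttp. The sketch below is not part of the diff; it is a hypothetical usage example assuming the import path from entry 93 of the file listing and that analyze_image can be called with only an image argument.

# Hypothetical usage sketch (editor illustration, not from the package diff).
import asyncio
from isa_model.inference.services.vision.isa_vision_service import ISAVisionService

async def main():
    # 0.4.3 defaults to timeout=60 (0.4.0 used 30); the first call also warms the
    # Modal connection via _warm_connection() before preparing the image.
    service = ISAVisionService(timeout=60)
    # HTTP(S) URLs are now downloaded with aiohttp inside _prepare_image_base64.
    result = await service.analyze_image("https://example.com/screenshot.png")
    print(result)

asyncio.run(main())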

isa_model/inference/services/vision/openai_vision_service.py
@@ -92,12 +92,21 @@ class OpenAIVisionService(BaseVisionService, VisionPromptMixin):
                 }
             ]
 
-            response = await self._client.chat.completions.create(  # type: ignore
-                model=self.model_name,
-                messages=messages,  # type: ignore
-                max_tokens=max_tokens,
-                temperature=self.temperature
-            )
+            # Use max_completion_tokens for newer models like gpt-4o-mini
+            completion_params = {
+                "model": self.model_name,
+                "messages": messages,  # type: ignore
+                "temperature": self.temperature
+            }
+
+            # Check whether the model uses the new parameter name
+            # All newer models (gpt-4o, gpt-4.1, o1, etc.) use max_completion_tokens
+            if any(prefix in self.model_name for prefix in ["gpt-4o", "gpt-4.1", "o1"]):
+                completion_params["max_completion_tokens"] = max_tokens
+            else:
+                completion_params["max_tokens"] = max_tokens
+
+            response = await self._client.chat.completions.create(**completion_params)  # type: ignore
 
             # Track usage for billing
             if response.usage:
@@ -162,7 +171,7 @@ class OpenAIVisionService(BaseVisionService, VisionPromptMixin):
        Image description - uses a dedicated task prompt
         """
         prompt = self.get_task_prompt("describe", detail_level=detail_level)
-        return await self.analyze_image(image, prompt)
+        return await self.analyze_image(image, prompt, max_tokens=1000)
 
     async def extract_text(self, image: Union[str, BinaryIO]) -> Dict[str, Any]:
         """
@@ -170,7 +179,7 @@ class OpenAIVisionService(BaseVisionService, VisionPromptMixin):
         """
         prompt = self.get_task_prompt("extract_text")
 
-        return await self.analyze_image(image, prompt)
+        return await self.analyze_image(image, prompt, max_tokens=1000)
 
     async def detect_objects(
         self,
@@ -182,7 +191,7 @@ class OpenAIVisionService(BaseVisionService, VisionPromptMixin):
         """
         prompt = self.get_task_prompt("detect_objects", confidence_threshold=confidence_threshold)
 
-        return await self.analyze_image(image, prompt)
+        return await self.analyze_image(image, prompt, max_tokens=1000)
 
     async def detect_ui_elements(
         self,
@@ -195,7 +204,7 @@ class OpenAIVisionService(BaseVisionService, VisionPromptMixin):
         """
         prompt = self.get_task_prompt("detect_ui_elements", element_types=element_types, confidence_threshold=confidence_threshold)
 
-        return await self.analyze_image(image, prompt)
+        return await self.analyze_image(image, prompt, max_tokens=1000)
 
     async def detect_document_elements(
         self,
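
The OpenAIVisionService hunks above route max_tokens to max_completion_tokens for newer model families and cap the task helpers at 1000 tokens. The helper below is an editor illustration of the same selection rule, not code from the package; build_completion_params is an invented name.

# Invented helper mirroring the parameter-selection rule in the hunk above.
from typing import Any, Dict

def build_completion_params(model_name: str, max_tokens: int) -> Dict[str, Any]:
    params: Dict[str, Any] = {"model": model_name}
    # Newer OpenAI models (gpt-4o, gpt-4.1, o1 families) expect max_completion_tokens.
    if any(prefix in model_name for prefix in ["gpt-4o", "gpt-4.1", "o1"]):
        params["max_completion_tokens"] = max_tokens
    else:
        params["max_tokens"] = max_tokens
    return params

print(build_completion_params("gpt-4o-mini", 1000))
# {'model': 'gpt-4o-mini', 'max_completion_tokens': 1000}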

isa_model/inference/services/vision/vgg16_vision_service.py (new file)
@@ -0,0 +1,257 @@
+#!/usr/bin/env python3
+"""
+VGG16 Vision Service
+Computer vision service using VGG16 for image classification
+Based on the aircraft damage detection notebook implementation
+"""
+
+import os
+import numpy as np
+from typing import Dict, List, Any, Optional, Union, BinaryIO
+import logging
+from PIL import Image
+import io
+
+from .base_vision_service import BaseVisionService
+
+logger = logging.getLogger(__name__)
+
+def _lazy_import_vgg16_deps():
+    """Lazy import VGG16 dependencies"""
+    try:
+        import tensorflow as tf
+        from tensorflow.keras.applications import VGG16
+        from tensorflow.keras.layers import Dense, Dropout, Flatten
+        from tensorflow.keras.models import Sequential, Model
+        from tensorflow.keras.optimizers import Adam
+        from tensorflow.keras.preprocessing.image import ImageDataGenerator
+
+        return {
+            'tf': tf,
+            'VGG16': VGG16,
+            'Dense': Dense,
+            'Dropout': Dropout,
+            'Flatten': Flatten,
+            'Sequential': Sequential,
+            'Model': Model,
+            'Adam': Adam,
+            'ImageDataGenerator': ImageDataGenerator,
+            'available': True
+        }
+    except ImportError as e:
+        logger.warning(f"VGG16 dependencies not available: {e}")
+        return {'available': False}
+
+class VGG16VisionService(BaseVisionService):
+    """
+    VGG16-based vision service for image classification
+    Provides an alternative implementation to VLM-based classification
+    """
+
+    def __init__(self, model_path: Optional[str] = None, class_names: Optional[List[str]] = None):
+        """
+        Initialize VGG16 vision service
+
+        Args:
+            model_path: Path to trained VGG16 model
+            class_names: List of class names for classification
+        """
+        super().__init__()
+
+        self.model_path = model_path
+        self.class_names = class_names or ["class_0", "class_1"]
+        self.model = None
+        self.input_shape = (224, 224, 3)
+
+        # Lazy load dependencies
+        self.vgg16_components = _lazy_import_vgg16_deps()
+
+        if not self.vgg16_components['available']:
+            raise ImportError("TensorFlow and VGG16 dependencies are required")
+
+        # Load model if path provided
+        if model_path and os.path.exists(model_path):
+            self._load_model(model_path)
+
+    def _load_model(self, model_path: str):
+        """Load trained VGG16 model"""
+        try:
+            tf = self.vgg16_components['tf']
+            self.model = tf.keras.models.load_model(model_path)
+            logger.info(f"VGG16 model loaded from {model_path}")
+        except Exception as e:
+            logger.error(f"Error loading VGG16 model: {e}")
+            raise
+
+    def _preprocess_image(self, image: Union[str, BinaryIO]) -> np.ndarray:
+        """
+        Preprocess image for VGG16 input
+
+        Args:
+            image: Image path or binary data
+
+        Returns:
+            Preprocessed image array
+        """
+        try:
+            # Handle different image input types
+            if isinstance(image, str):
+                # File path
+                pil_image = Image.open(image).convert('RGB')
+            elif hasattr(image, 'read'):
+                # Binary IO
+                image_data = image.read()
+                pil_image = Image.open(io.BytesIO(image_data)).convert('RGB')
+            else:
+                raise ValueError("Unsupported image format")
+
+            # Resize to VGG16 input size
+            pil_image = pil_image.resize((self.input_shape[0], self.input_shape[1]))
+
+            # Convert to array and normalize
+            image_array = np.array(pil_image) / 255.0
+
+            # Add batch dimension
+            image_batch = np.expand_dims(image_array, axis=0)
+
+            return image_batch, image_array
+
+        except Exception as e:
+            logger.error(f"Error preprocessing image: {e}")
+            raise
+
+    async def classify_image(self,
+                             image: Union[str, BinaryIO],
+                             categories: Optional[List[str]] = None) -> Dict[str, Any]:
+        """
+        Classify image using trained VGG16 model
+
+        Args:
+            image: Image path or binary data
+            categories: Optional list of categories (uses model's classes if None)
+
+        Returns:
+            Classification results
+        """
+        try:
+            if self.model is None:
+                return {
+                    "error": "No trained model available. Please load a model first.",
+                    "service": "VGG16VisionService"
+                }
+
+            # Preprocess image
+            image_batch, image_array = self._preprocess_image(image)
+
+            # Make prediction
+            predictions = self.model.predict(image_batch, verbose=0)
+
+            # Use provided categories or default class names
+            class_names = categories or self.class_names
+
+            # Process predictions based on model output
+            if len(predictions[0]) == 1:  # Binary classification
+                predicted_class_idx = int(predictions[0] > 0.5)
+                confidence = float(predictions[0][0]) if predicted_class_idx == 1 else float(1 - predictions[0][0])
+
+                # Create probability distribution
+                probabilities = {
+                    class_names[0]: float(1 - predictions[0][0]),
+                    class_names[1]: float(predictions[0][0])
+                }
+            else:  # Multiclass classification
+                predicted_class_idx = np.argmax(predictions[0])
+                confidence = float(predictions[0][predicted_class_idx])
+
+                # Create probability distribution
+                probabilities = {
+                    class_names[i]: float(predictions[0][i])
+                    for i in range(min(len(class_names), len(predictions[0])))
+                }
+
+            predicted_class = class_names[predicted_class_idx] if predicted_class_idx < len(class_names) else f"class_{predicted_class_idx}"
+
+            return {
+                "task": "classify",
+                "service": "VGG16VisionService",
+                "predicted_class": predicted_class,
+                "confidence": confidence,
+                "probabilities": probabilities,
+                "model_type": "VGG16",
+                "success": True
+            }
+
+        except Exception as e:
+            logger.error(f"Error classifying image: {e}")
+            return {
+                "error": str(e),
+                "service": "VGG16VisionService",
+                "success": False
+            }
+
+    async def analyze_image(self,
+                            image: Union[str, BinaryIO],
+                            prompt: Optional[str] = None,
+                            max_tokens: int = 1000) -> Dict[str, Any]:
+        """
+        Analyze image using VGG16 classification
+
+        Args:
+            image: Image path or binary data
+            prompt: Optional prompt (used to guide interpretation)
+            max_tokens: Not used for classification
+
+        Returns:
+            Analysis results
+        """
+        # For VGG16, analysis is essentially classification
+        classification_result = await self.classify_image(image)
+
+        if classification_result.get("success"):
+            # Create analysis text based on classification
+            predicted_class = classification_result["predicted_class"]
+            confidence = classification_result["confidence"]
+
+            analysis_text = f"The image has been classified as '{predicted_class}' with {confidence:.2%} confidence."
+
+            if prompt:
+                analysis_text += f" Analysis context: {prompt}"
+
+            return {
+                "task": "analyze",
+                "service": "VGG16VisionService",
+                "text": analysis_text,
+                "confidence": confidence,
+                "classification": classification_result,
+                "success": True
+            }
+        else:
+            return classification_result
+
+    def set_class_names(self, class_names: List[str]):
+        """Set class names for classification"""
+        self.class_names = class_names
+
+    def load_trained_model(self, model_path: str, class_names: Optional[List[str]] = None):
+        """
+        Load a trained VGG16 model
+
+        Args:
+            model_path: Path to the trained model
+            class_names: Optional class names
+        """
+        self._load_model(model_path)
+        if class_names:
+            self.set_class_names(class_names)
+
+    def get_service_info(self) -> Dict[str, Any]:
+        """Get service information"""
+        return {
+            "service_name": "VGG16VisionService",
+            "model_type": "VGG16",
+            "capabilities": ["classify", "analyze"],
+            "model_loaded": self.model is not None,
+            "input_shape": self.input_shape,
+            "class_names": self.class_names,
+            "dependencies_available": self.vgg16_components['available']
+        }
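
A hypothetical usage sketch for the new VGG16VisionService follows (editor illustration, not part of the diff). The import path follows entry 95 of the file listing; the model file and class labels are placeholders, and TensorFlow must be installed or the constructor raises ImportError.

# Hypothetical usage sketch; the model path and class names are assumed placeholders.
import asyncio
from isa_model.inference.services.vision.vgg16_vision_service import VGG16VisionService

async def main():
    service = VGG16VisionService(
        model_path="models/aircraft_damage_vgg16.h5",  # assumed: a saved Keras model
        class_names=["no_damage", "damage"],           # assumed: binary labels
    )
    result = await service.classify_image("samples/wing.jpg")
    if result.get("success"):
        print(result["predicted_class"], f"{result['confidence']:.2%}")

asyncio.run(main())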

isa_model/serving/api/cache_manager.py (new file)
@@ -0,0 +1,245 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+
+"""
+Simple Cache Manager for ISA Model API
+Provides in-memory caching to improve API performance
+"""
+
+import time
+import logging
+from typing import Dict, Any, Optional, Callable
+from dataclasses import dataclass
+from threading import RLock
+import asyncio
+import hashlib
+import json
+
+logger = logging.getLogger(__name__)
+
+@dataclass
+class CacheEntry:
+    """Cache entry with data and metadata"""
+    data: Any
+    created_at: float
+    ttl: float
+    access_count: int = 0
+    last_accessed: float = None
+
+    def is_expired(self) -> bool:
+        """Check if cache entry is expired"""
+        return time.time() - self.created_at > self.ttl
+
+    def access(self) -> Any:
+        """Mark as accessed and return data"""
+        self.access_count += 1
+        self.last_accessed = time.time()
+        return self.data
+
+class APICache:
+    """
+    Simple in-memory cache for API responses
+    Thread-safe with automatic expiration
+    """
+
+    def __init__(self, default_ttl: float = 300.0, max_size: int = 1000):
+        self.default_ttl = default_ttl  # 5 minutes default
+        self.max_size = max_size
+        self._cache: Dict[str, CacheEntry] = {}
+        self._lock = RLock()
+        self._stats = {
+            "hits": 0,
+            "misses": 0,
+            "evictions": 0,
+            "total_requests": 0
+        }
+
+    def _generate_key(self, *args, **kwargs) -> str:
+        """Generate cache key from arguments"""
+        # Create a stable key from arguments
+        key_data = {
+            "args": args,
+            "kwargs": sorted(kwargs.items()) if kwargs else {}
+        }
+        key_string = json.dumps(key_data, sort_keys=True, default=str)
+        return hashlib.md5(key_string.encode()).hexdigest()
+
+    def _cleanup_expired(self):
+        """Remove expired entries"""
+        with self._lock:
+            current_time = time.time()
+            expired_keys = [
+                key for key, entry in self._cache.items()
+                if entry.is_expired()
+            ]
+
+            for key in expired_keys:
+                del self._cache[key]
+
+            if expired_keys:
+                logger.debug(f"Cleaned up {len(expired_keys)} expired cache entries")
+
+    def _evict_lru(self):
+        """Evict least recently used entries when cache is full"""
+        with self._lock:
+            if len(self._cache) >= self.max_size:
+                # Sort by last_accessed time (LRU)
+                sorted_entries = sorted(
+                    self._cache.items(),
+                    key=lambda x: x[1].last_accessed or x[1].created_at
+                )
+
+                # Remove oldest 20% of entries
+                num_to_remove = max(1, len(sorted_entries) // 5)
+                for key, _ in sorted_entries[:num_to_remove]:
+                    del self._cache[key]
+                    self._stats["evictions"] += 1
+
+                logger.debug(f"Evicted {num_to_remove} LRU cache entries")
+
+    def get(self, key: str) -> Optional[Any]:
+        """Get cached value by key"""
+        with self._lock:
+            self._stats["total_requests"] += 1
+
+            if key in self._cache:
+                entry = self._cache[key]
+                if not entry.is_expired():
+                    self._stats["hits"] += 1
+                    return entry.access()
+                else:
+                    # Remove expired entry
+                    del self._cache[key]
+
+            self._stats["misses"] += 1
+            return None
+
+    def set(self, key: str, value: Any, ttl: Optional[float] = None) -> None:
+        """Set cached value with optional TTL"""
+        with self._lock:
+            # Cleanup and eviction
+            self._cleanup_expired()
+            self._evict_lru()
+
+            entry = CacheEntry(
+                data=value,
+                created_at=time.time(),
+                ttl=ttl or self.default_ttl,
+                last_accessed=time.time()
+            )
+
+            self._cache[key] = entry
+
+    def delete(self, key: str) -> bool:
+        """Delete cached value"""
+        with self._lock:
+            if key in self._cache:
+                del self._cache[key]
+                return True
+            return False
+
+    def clear(self) -> None:
+        """Clear all cached values"""
+        with self._lock:
+            self._cache.clear()
+            logger.info("Cache cleared")
+
+    def get_stats(self) -> Dict[str, Any]:
+        """Get cache statistics"""
+        with self._lock:
+            hit_rate = (
+                self._stats["hits"] / self._stats["total_requests"]
+                if self._stats["total_requests"] > 0 else 0
+            )
+
+            return {
+                "cache_size": len(self._cache),
+                "max_size": self.max_size,
+                "default_ttl": self.default_ttl,
+                "hit_rate": round(hit_rate * 100, 2),
+                **self._stats
+            }
+
+# Decorator for caching function results
+def cached(ttl: float = 300.0, cache_key_func: Optional[Callable] = None):
+    """
+    Decorator to cache function results
+
+    Args:
+        ttl: Time to live in seconds
+        cache_key_func: Custom function to generate cache key
+    """
+    def decorator(func):
+        async def async_wrapper(*args, **kwargs):
+            # Generate cache key
+            if cache_key_func:
+                cache_key = cache_key_func(*args, **kwargs)
+            else:
+                cache_key = api_cache._generate_key(func.__name__, *args, **kwargs)
+
+            # Try to get from cache
+            cached_result = api_cache.get(cache_key)
+            if cached_result is not None:
+                logger.debug(f"Cache hit for {func.__name__}")
+                return cached_result
+
+            # Execute function and cache result
+            try:
+                result = await func(*args, **kwargs)
+                api_cache.set(cache_key, result, ttl)
+                logger.debug(f"Cached result for {func.__name__}")
+                return result
+            except Exception as e:
+                logger.error(f"Function {func.__name__} failed: {e}")
+                raise
+
+        def sync_wrapper(*args, **kwargs):
+            # Generate cache key
+            if cache_key_func:
+                cache_key = cache_key_func(*args, **kwargs)
+            else:
+                cache_key = api_cache._generate_key(func.__name__, *args, **kwargs)
+
+            # Try to get from cache
+            cached_result = api_cache.get(cache_key)
+            if cached_result is not None:
+                logger.debug(f"Cache hit for {func.__name__}")
+                return cached_result
+
+            # Execute function and cache result
+            try:
+                result = func(*args, **kwargs)
+                api_cache.set(cache_key, result, ttl)
+                logger.debug(f"Cached result for {func.__name__}")
+                return result
+            except Exception as e:
+                logger.error(f"Function {func.__name__} failed: {e}")
+                raise
+
+        # Return appropriate wrapper based on function type
+        if asyncio.iscoroutinefunction(func):
+            return async_wrapper
+        else:
+            return sync_wrapper
+
+    return decorator
+
+# Global cache instance
+api_cache = APICache(default_ttl=300.0, max_size=1000)
+
+def get_api_cache() -> APICache:
+    """Get the global API cache instance"""
+    return api_cache
+
+# Cache key generators for common patterns
+def model_list_cache_key(service_type=None):
+    """Generate cache key for model list API"""
+    return f"models_list_{service_type or 'all'}"
+
+def provider_list_cache_key():
+    """Generate cache key for provider list API"""
+    return "providers_list"
+
+def custom_models_cache_key(model_type=None, provider=None):
+    """Generate cache key for custom models API"""
+    return f"custom_models_{model_type or 'all'}_{provider or 'all'}"