isa-model 0.4.0__py3-none-any.whl → 0.4.3__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- isa_model/client.py +466 -43
- isa_model/core/cache/redis_cache.py +12 -3
- isa_model/core/config/config_manager.py +230 -3
- isa_model/core/config.py +90 -0
- isa_model/core/database/direct_db_client.py +114 -0
- isa_model/core/database/migration_manager.py +563 -0
- isa_model/core/database/migrations.py +21 -1
- isa_model/core/database/supabase_client.py +154 -19
- isa_model/core/dependencies.py +316 -0
- isa_model/core/discovery/__init__.py +19 -0
- isa_model/core/discovery/consul_discovery.py +190 -0
- isa_model/core/logging/__init__.py +54 -0
- isa_model/core/logging/influx_logger.py +523 -0
- isa_model/core/logging/loki_logger.py +160 -0
- isa_model/core/models/__init__.py +27 -18
- isa_model/core/models/config_models.py +625 -0
- isa_model/core/models/deployment_billing_tracker.py +430 -0
- isa_model/core/models/model_manager.py +40 -17
- isa_model/core/models/model_metadata.py +690 -0
- isa_model/core/models/model_repo.py +174 -18
- isa_model/core/models/system_models.py +857 -0
- isa_model/core/repositories/__init__.py +9 -0
- isa_model/core/repositories/config_repository.py +912 -0
- isa_model/core/services/intelligent_model_selector.py +399 -21
- isa_model/core/storage/hf_storage.py +1 -1
- isa_model/core/types.py +1 -0
- isa_model/deployment/__init__.py +5 -48
- isa_model/deployment/core/__init__.py +2 -31
- isa_model/deployment/core/deployment_manager.py +1278 -370
- isa_model/deployment/local/__init__.py +31 -0
- isa_model/deployment/local/config.py +248 -0
- isa_model/deployment/local/gpu_gateway.py +607 -0
- isa_model/deployment/local/health_checker.py +428 -0
- isa_model/deployment/local/provider.py +586 -0
- isa_model/deployment/local/tensorrt_service.py +621 -0
- isa_model/deployment/local/transformers_service.py +644 -0
- isa_model/deployment/local/vllm_service.py +527 -0
- isa_model/deployment/modal/__init__.py +8 -0
- isa_model/deployment/modal/config.py +136 -0
- isa_model/deployment/{services/auto_hf_modal_deployer.py → modal/deployer.py} +1 -1
- isa_model/deployment/modal/services/__init__.py +3 -0
- isa_model/deployment/modal/services/audio/__init__.py +1 -0
- isa_model/deployment/modal/services/embedding/__init__.py +1 -0
- isa_model/deployment/modal/services/llm/__init__.py +1 -0
- isa_model/deployment/modal/services/llm/isa_llm_service.py +424 -0
- isa_model/deployment/modal/services/video/__init__.py +1 -0
- isa_model/deployment/modal/services/vision/__init__.py +1 -0
- isa_model/deployment/models/org-org-acme-corp-tenant-a-service-llm-20250825-225822/tenant-a-service_modal_service.py +48 -0
- isa_model/deployment/models/org-test-org-123-prefix-test-service-llm-20250825-225822/prefix-test-service_modal_service.py +48 -0
- isa_model/deployment/models/test-llm-service-llm-20250825-204442/test-llm-service_modal_service.py +48 -0
- isa_model/deployment/models/test-monitoring-gpt2-llm-20250825-212906/test-monitoring-gpt2_modal_service.py +48 -0
- isa_model/deployment/models/test-monitoring-gpt2-llm-20250825-213009/test-monitoring-gpt2_modal_service.py +48 -0
- isa_model/deployment/storage/__init__.py +5 -0
- isa_model/deployment/storage/deployment_repository.py +824 -0
- isa_model/deployment/triton/__init__.py +10 -0
- isa_model/deployment/triton/config.py +196 -0
- isa_model/deployment/triton/configs/__init__.py +1 -0
- isa_model/deployment/triton/provider.py +512 -0
- isa_model/deployment/triton/scripts/__init__.py +1 -0
- isa_model/deployment/triton/templates/__init__.py +1 -0
- isa_model/inference/__init__.py +47 -1
- isa_model/inference/ai_factory.py +137 -10
- isa_model/inference/legacy_services/__init__.py +21 -0
- isa_model/inference/legacy_services/model_evaluation.py +637 -0
- isa_model/inference/legacy_services/model_service.py +573 -0
- isa_model/inference/legacy_services/model_serving.py +717 -0
- isa_model/inference/legacy_services/model_training.py +561 -0
- isa_model/inference/models/__init__.py +21 -0
- isa_model/inference/models/inference_config.py +551 -0
- isa_model/inference/models/inference_record.py +675 -0
- isa_model/inference/models/performance_models.py +714 -0
- isa_model/inference/repositories/__init__.py +9 -0
- isa_model/inference/repositories/inference_repository.py +828 -0
- isa_model/inference/services/audio/base_stt_service.py +184 -11
- isa_model/inference/services/audio/openai_stt_service.py +22 -6
- isa_model/inference/services/custom_model_manager.py +277 -0
- isa_model/inference/services/embedding/ollama_embed_service.py +15 -3
- isa_model/inference/services/embedding/resilient_embed_service.py +285 -0
- isa_model/inference/services/llm/__init__.py +10 -2
- isa_model/inference/services/llm/base_llm_service.py +335 -24
- isa_model/inference/services/llm/cerebras_llm_service.py +628 -0
- isa_model/inference/services/llm/helpers/llm_adapter.py +9 -4
- isa_model/inference/services/llm/helpers/llm_prompts.py +342 -0
- isa_model/inference/services/llm/helpers/llm_utils.py +321 -23
- isa_model/inference/services/llm/huggingface_llm_service.py +581 -0
- isa_model/inference/services/llm/local_llm_service.py +747 -0
- isa_model/inference/services/llm/ollama_llm_service.py +9 -2
- isa_model/inference/services/llm/openai_llm_service.py +33 -16
- isa_model/inference/services/llm/yyds_llm_service.py +8 -2
- isa_model/inference/services/vision/__init__.py +22 -1
- isa_model/inference/services/vision/blip_vision_service.py +359 -0
- isa_model/inference/services/vision/helpers/image_utils.py +8 -5
- isa_model/inference/services/vision/isa_vision_service.py +65 -4
- isa_model/inference/services/vision/openai_vision_service.py +19 -10
- isa_model/inference/services/vision/vgg16_vision_service.py +257 -0
- isa_model/serving/api/cache_manager.py +245 -0
- isa_model/serving/api/dependencies/__init__.py +1 -0
- isa_model/serving/api/dependencies/auth.py +194 -0
- isa_model/serving/api/dependencies/database.py +139 -0
- isa_model/serving/api/error_handlers.py +284 -0
- isa_model/serving/api/fastapi_server.py +172 -22
- isa_model/serving/api/middleware/auth.py +8 -2
- isa_model/serving/api/middleware/security.py +23 -33
- isa_model/serving/api/middleware/tenant_context.py +414 -0
- isa_model/serving/api/routes/analytics.py +4 -1
- isa_model/serving/api/routes/config.py +645 -0
- isa_model/serving/api/routes/deployment_billing.py +315 -0
- isa_model/serving/api/routes/deployments.py +138 -2
- isa_model/serving/api/routes/gpu_gateway.py +440 -0
- isa_model/serving/api/routes/health.py +32 -12
- isa_model/serving/api/routes/inference_monitoring.py +486 -0
- isa_model/serving/api/routes/local_deployments.py +448 -0
- isa_model/serving/api/routes/tenants.py +575 -0
- isa_model/serving/api/routes/unified.py +680 -18
- isa_model/serving/api/routes/webhooks.py +479 -0
- isa_model/serving/api/startup.py +68 -54
- isa_model/utils/gpu_utils.py +311 -0
- {isa_model-0.4.0.dist-info → isa_model-0.4.3.dist-info}/METADATA +66 -24
- isa_model-0.4.3.dist-info/RECORD +193 -0
- isa_model/core/storage/minio_storage.py +0 -0
- isa_model/deployment/cloud/__init__.py +0 -9
- isa_model/deployment/cloud/modal/__init__.py +0 -10
- isa_model/deployment/core/deployment_config.py +0 -356
- isa_model/deployment/core/isa_deployment_service.py +0 -401
- isa_model/deployment/gpu_int8_ds8/app/server.py +0 -66
- isa_model/deployment/gpu_int8_ds8/scripts/test_client.py +0 -43
- isa_model/deployment/gpu_int8_ds8/scripts/test_client_os.py +0 -35
- isa_model/deployment/runtime/deployed_service.py +0 -338
- isa_model/deployment/services/__init__.py +0 -9
- isa_model/deployment/services/auto_deploy_vision_service.py +0 -538
- isa_model/deployment/services/model_service.py +0 -332
- isa_model/deployment/services/service_monitor.py +0 -356
- isa_model/deployment/services/service_registry.py +0 -527
- isa_model/eval/__init__.py +0 -92
- isa_model/eval/benchmarks/__init__.py +0 -27
- isa_model/eval/benchmarks/multimodal_datasets.py +0 -460
- isa_model/eval/benchmarks.py +0 -701
- isa_model/eval/config/__init__.py +0 -10
- isa_model/eval/config/evaluation_config.py +0 -108
- isa_model/eval/evaluators/__init__.py +0 -24
- isa_model/eval/evaluators/audio_evaluator.py +0 -727
- isa_model/eval/evaluators/base_evaluator.py +0 -503
- isa_model/eval/evaluators/embedding_evaluator.py +0 -742
- isa_model/eval/evaluators/llm_evaluator.py +0 -472
- isa_model/eval/evaluators/vision_evaluator.py +0 -564
- isa_model/eval/example_evaluation.py +0 -395
- isa_model/eval/factory.py +0 -798
- isa_model/eval/infrastructure/__init__.py +0 -24
- isa_model/eval/infrastructure/experiment_tracker.py +0 -466
- isa_model/eval/isa_benchmarks.py +0 -700
- isa_model/eval/isa_integration.py +0 -582
- isa_model/eval/metrics.py +0 -951
- isa_model/eval/tests/unit/test_basic.py +0 -396
- isa_model/serving/api/routes/evaluations.py +0 -579
- isa_model/training/__init__.py +0 -168
- isa_model/training/annotation/annotation_schema.py +0 -47
- isa_model/training/annotation/processors/annotation_processor.py +0 -126
- isa_model/training/annotation/storage/dataset_manager.py +0 -131
- isa_model/training/annotation/storage/dataset_schema.py +0 -44
- isa_model/training/annotation/tests/test_annotation_flow.py +0 -109
- isa_model/training/annotation/tests/test_minio copy.py +0 -113
- isa_model/training/annotation/tests/test_minio_upload.py +0 -43
- isa_model/training/annotation/views/annotation_controller.py +0 -158
- isa_model/training/cloud/__init__.py +0 -22
- isa_model/training/cloud/job_orchestrator.py +0 -402
- isa_model/training/cloud/runpod_trainer.py +0 -454
- isa_model/training/cloud/storage_manager.py +0 -482
- isa_model/training/core/__init__.py +0 -26
- isa_model/training/core/config.py +0 -181
- isa_model/training/core/dataset.py +0 -222
- isa_model/training/core/trainer.py +0 -720
- isa_model/training/core/utils.py +0 -213
- isa_model/training/examples/intelligent_training_example.py +0 -281
- isa_model/training/factory.py +0 -424
- isa_model/training/intelligent/__init__.py +0 -25
- isa_model/training/intelligent/decision_engine.py +0 -643
- isa_model/training/intelligent/intelligent_factory.py +0 -888
- isa_model/training/intelligent/knowledge_base.py +0 -751
- isa_model/training/intelligent/resource_optimizer.py +0 -839
- isa_model/training/intelligent/task_classifier.py +0 -576
- isa_model/training/storage/__init__.py +0 -24
- isa_model/training/storage/core_integration.py +0 -439
- isa_model/training/storage/training_repository.py +0 -552
- isa_model/training/storage/training_storage.py +0 -628
- isa_model-0.4.0.dist-info/RECORD +0 -182
- /isa_model/deployment/{cloud/modal → modal/services/audio}/isa_audio_chatTTS_service.py +0 -0
- /isa_model/deployment/{cloud/modal → modal/services/audio}/isa_audio_fish_service.py +0 -0
- /isa_model/deployment/{cloud/modal → modal/services/audio}/isa_audio_openvoice_service.py +0 -0
- /isa_model/deployment/{cloud/modal → modal/services/audio}/isa_audio_service_v2.py +0 -0
- /isa_model/deployment/{cloud/modal → modal/services/embedding}/isa_embed_rerank_service.py +0 -0
- /isa_model/deployment/{cloud/modal → modal/services/video}/isa_video_hunyuan_service.py +0 -0
- /isa_model/deployment/{cloud/modal → modal/services/vision}/isa_vision_ocr_service.py +0 -0
- /isa_model/deployment/{cloud/modal → modal/services/vision}/isa_vision_qwen25_service.py +0 -0
- /isa_model/deployment/{cloud/modal → modal/services/vision}/isa_vision_table_service.py +0 -0
- /isa_model/deployment/{cloud/modal → modal/services/vision}/isa_vision_ui_service.py +0 -0
- /isa_model/deployment/{cloud/modal → modal/services/vision}/isa_vision_ui_service_optimized.py +0 -0
- /isa_model/deployment/{services → modal/services/vision}/simple_auto_deploy_vision_service.py +0 -0
- {isa_model-0.4.0.dist-info → isa_model-0.4.3.dist-info}/WHEEL +0 -0
- {isa_model-0.4.0.dist-info → isa_model-0.4.3.dist-info}/top_level.txt +0 -0
isa_model/inference/services/llm/ollama_llm_service.py:

@@ -3,6 +3,7 @@ import httpx
 import json
 from typing import Dict, Any, List, Union, AsyncGenerator, Optional, Callable
 from isa_model.inference.services.llm.base_llm_service import BaseLLMService
+from isa_model.core.config.config_manager import ConfigManager
 
 logger = logging.getLogger(__name__)
 
@@ -16,7 +17,10 @@ class OllamaLLMService(BaseLLMService):
         provider_config = self.get_provider_config()
 
         # Create HTTP client for Ollama API
-
+        config_manager = ConfigManager()
+        # Use Consul discovery with fallback
+        default_base_url = config_manager.get_ollama_url()
+        base_url = provider_config.get("base_url", default_base_url)
         timeout = provider_config.get("timeout", 60)
 
         self.client = httpx.AsyncClient(
@@ -34,7 +38,10 @@ class OllamaLLMService(BaseLLMService):
         """Ensure the HTTP client is available and not closed"""
         if not hasattr(self, 'client') or not self.client or self.client.is_closed:
             provider_config = self.get_provider_config()
-
+            config_manager = ConfigManager()
+            # Use Consul discovery with fallback
+            default_base_url = config_manager.get_ollama_url()
+            base_url = provider_config.get("base_url", default_base_url)
             timeout = provider_config.get("timeout", 60)
             self.client = httpx.AsyncClient(base_url=base_url, timeout=timeout)
 
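The effect of the Ollama change is that an explicit `base_url` in the provider config still wins; only when it is absent does the service ask `ConfigManager` for a Consul-discovered URL (with a built-in fallback). A minimal sketch of that resolution order, not part of the diff, using only the names introduced above:

# Sketch only: mirrors the fallback order added in 0.4.3 for the Ollama client.
from isa_model.core.config.config_manager import ConfigManager

provider_config = {}  # no explicit base_url configured
config_manager = ConfigManager()
default_base_url = config_manager.get_ollama_url()            # Consul discovery with fallback
base_url = provider_config.get("base_url", default_base_url)  # explicit config still takes precedence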
isa_model/inference/services/llm/openai_llm_service.py:

@@ -20,6 +20,8 @@ class OpenAILLMService(BaseLLMService):
 
         # Check if this is an O-series reasoning model
         self.is_reasoning_model = model_name.startswith("o4-") or model_name.startswith("o3-")
+        self.uses_completion_tokens = self.is_reasoning_model or model_name.startswith("gpt-5")
+        self.requires_default_temperature = self.is_reasoning_model or model_name.startswith("gpt-5")
         self.supports_deep_research = "deep-search" in model_name or "deep-research" in model_name
 
         # Get configuration from centralized config manager
@@ -36,7 +38,9 @@ class OpenAILLMService(BaseLLMService):
         self.client = AsyncOpenAI(
             api_key=provider_config["api_key"],
             base_url=provider_config.get("api_base_url", "https://api.openai.com/v1"),
-            organization=provider_config.get("organization")
+            organization=provider_config.get("organization"),
+            timeout=10.0,  # 10 second timeout for first token (much faster than 600s default)
+            max_retries=2  # Retry on timeout
         )
 
         logger.info(f"Initialized OpenAILLMService with model {self.model_name} and endpoint {self.client.base_url}")
@@ -70,6 +74,8 @@ class OpenAILLMService(BaseLLMService):
 
         # Copy OpenAI-specific attributes
         bound_service.is_reasoning_model = self.is_reasoning_model
+        bound_service.uses_completion_tokens = self.uses_completion_tokens
+        bound_service.requires_default_temperature = self.requires_default_temperature
         bound_service.supports_deep_research = self.supports_deep_research
 
         # Copy base class attributes
@@ -103,7 +109,7 @@ class OpenAILLMService(BaseLLMService):
 
         return bound_service
 
-    async def astream(self, input_data: Union[str, List[Dict[str, str]], Any], show_reasoning: bool = False) -> AsyncGenerator[Union[str, Dict[str, Any]], None]:
+    async def astream(self, input_data: Union[str, List[Dict[str, str]], Any], show_reasoning: bool = False, **extra_kwargs) -> AsyncGenerator[Union[str, Dict[str, Any]], None]:
         """
         True streaming method - yields tokens one by one as they arrive
 
@@ -121,19 +127,19 @@ class OpenAILLMService(BaseLLMService):
             if use_responses_api:
                 logger.info(f"Using Responses API streaming for {self.model_name}")
                 # Use Responses API streaming
-                async for chunk in self._astream_responses_api(input_data, show_reasoning):
+                async for chunk in self._astream_responses_api(input_data, show_reasoning, **extra_kwargs):
                     yield chunk
             else:
                 logger.debug(f"Using Chat Completions API streaming for {self.model_name}")
                 # Use Chat Completions API streaming
-                async for chunk in self._astream_chat_completions_api(input_data):
+                async for chunk in self._astream_chat_completions_api(input_data, **extra_kwargs):
                     yield chunk
 
         except Exception as e:
             logger.error(f"Error in astream: {e}")
             raise
 
-    async def _astream_responses_api(self, input_data: Union[str, List[Dict[str, str]], Any], show_reasoning: bool = False) -> AsyncGenerator[Union[str, Dict[str, Any]], None]:
+    async def _astream_responses_api(self, input_data: Union[str, List[Dict[str, str]], Any], show_reasoning: bool = False, **extra_kwargs) -> AsyncGenerator[Union[str, Dict[str, Any]], None]:
         """Stream using Responses API for reasoning models and deep research models"""
         try:
             # Use adapter manager to prepare messages
@@ -228,7 +234,7 @@ class OpenAILLMService(BaseLLMService):
             logger.error(f"Error in _astream_responses_api: {e}")
             raise
 
-    async def _astream_chat_completions_api(self, input_data: Union[str, List[Dict[str, str]], Any]) -> AsyncGenerator[Union[str, Dict[str, Any]], None]:
+    async def _astream_chat_completions_api(self, input_data: Union[str, List[Dict[str, str]], Any], **extra_kwargs) -> AsyncGenerator[Union[str, Dict[str, Any]], None]:
         """Stream using Chat Completions API for standard models"""
         try:
             # Use adapter manager to prepare messages
@@ -242,13 +248,13 @@ class OpenAILLMService(BaseLLMService):
                 "stream": True
             }
 
-            # O4 models only support temperature=1 (default)
-            if not self.
+            # O4 and GPT-5 models only support temperature=1 (default)
+            if not self.requires_default_temperature:
                 kwargs["temperature"] = provider_config.get("temperature", 0.7)
 
-            # O4 models use max_completion_tokens instead of max_tokens
+            # O4 and GPT-5 models use max_completion_tokens instead of max_tokens
             max_tokens_value = provider_config.get("max_tokens", 1024)
-            if self.
+            if self.uses_completion_tokens:
                 kwargs["max_completion_tokens"] = max_tokens_value
             else:
                 kwargs["max_tokens"] = max_tokens_value
@@ -259,6 +265,11 @@ class OpenAILLMService(BaseLLMService):
                 kwargs["tools"] = tool_schemas
                 kwargs["tool_choice"] = "auto"
 
+            # Add response_format if specified (for JSON mode)
+            if 'response_format' in extra_kwargs:
+                kwargs['response_format'] = extra_kwargs['response_format']
+                logger.debug(f"Using response_format in streaming: {extra_kwargs['response_format']}")
+
             # Stream tokens and detect tool calls
             content_chunks = []
             tool_calls_accumulator = {}  # Track complete tool calls by ID
@@ -360,13 +371,14 @@ class OpenAILLMService(BaseLLMService):
             logger.error(f"Error in _astream_chat_completions_api: {e}")
             raise
 
-    async def ainvoke(self, input_data: Union[str, List[Dict[str, str]], Any], show_reasoning: bool = False) -> Union[str, Any]:
+    async def ainvoke(self, input_data: Union[str, List[Dict[str, str]], Any], show_reasoning: bool = False, **extra_kwargs) -> Union[str, Any]:
         """
         Unified invoke method for all input types
 
         Args:
             input_data: Input messages or text
             show_reasoning: If True and model supports it, show reasoning process using Responses API
+            **extra_kwargs: Additional parameters to pass to the API (e.g., response_format)
         """
         try:
             # Use adapter manager to prepare messages
@@ -385,13 +397,13 @@ class OpenAILLMService(BaseLLMService):
                 "messages": messages
             }
 
-            # O4 models only support temperature=1 (default)
-            if not self.
+            # O4 and GPT-5 models only support temperature=1 (default)
+            if not self.requires_default_temperature:
                 kwargs["temperature"] = provider_config.get("temperature", 0.7)
 
-            # O4 models use max_completion_tokens instead of max_tokens
+            # O4 and GPT-5 models use max_completion_tokens instead of max_tokens
             max_tokens_value = provider_config.get("max_tokens", 1024)
-            if self.
+            if self.uses_completion_tokens:
                 kwargs["max_completion_tokens"] = max_tokens_value
             else:
                 kwargs["max_tokens"] = max_tokens_value
@@ -403,11 +415,16 @@ class OpenAILLMService(BaseLLMService):
                 if not use_responses_api:  # Responses API handles tool choice differently
                     kwargs["tool_choice"] = "auto"
 
+            # Add response_format if specified (for JSON mode)
+            if 'response_format' in extra_kwargs:
+                kwargs['response_format'] = extra_kwargs['response_format']
+                logger.debug(f"Using response_format: {extra_kwargs['response_format']}")
+
             # Handle streaming vs non-streaming
             if self.streaming:
                 # TRUE STREAMING MODE - collect all chunks from the stream
                 content_chunks = []
-                async for token in self.astream(input_data, show_reasoning=show_reasoning):
+                async for token in self.astream(input_data, show_reasoning=show_reasoning, **extra_kwargs):
                     if isinstance(token, str):
                         content_chunks.append(token)
                     elif isinstance(token, dict) and "result" in token:
isa_model/inference/services/llm/yyds_llm_service.py:

@@ -63,16 +63,19 @@ class YydsLLMService(BaseLLMService):
 
         return bound_service
 
-    async def astream(self, input_data: Union[str, List[Dict[str, str]], Any]) -> AsyncGenerator[str, None]:
+    async def astream(self, input_data: Union[str, List[Dict[str, str]], Any], **kwargs) -> AsyncGenerator[str, None]:
         """
         True streaming method - yields tokens one by one as they arrive
 
         Args:
             input_data: Same as ainvoke
+            **kwargs: Additional parameters (will filter out unsupported ones)
 
         Yields:
             Individual tokens as they arrive from the API
         """
+        # Remove parameters that yyds doesn't support
+        kwargs.pop('show_reasoning', None)  # OpenAI-specific parameter
         try:
             # Use adapter manager to prepare messages
             messages = self._prepare_messages(input_data)
@@ -115,8 +118,11 @@ class YydsLLMService(BaseLLMService):
             logger.error(f"Error in astream: {e}")
             raise
 
-    async def ainvoke(self, input_data: Union[str, List[Dict[str, str]], Any]) -> Union[str, Any]:
+    async def ainvoke(self, input_data: Union[str, List[Dict[str, str]], Any], **kwargs) -> Union[str, Any]:
         """Unified invoke method for all input types"""
+        # Remove parameters that yyds doesn't support
+        kwargs.pop('show_reasoning', None)  # OpenAI-specific parameter
+        kwargs.pop('task', None)  # Handled internally
         try:
             # Use adapter manager to prepare messages
             messages = self._prepare_messages(input_data)
isa_model/inference/services/vision/__init__.py:

@@ -31,6 +31,21 @@ except ImportError:
     OllamaVisionService = None
     OLLAMA_VISION_AVAILABLE = False
 
+# Computer Vision specialized services
+try:
+    from .vgg16_vision_service import VGG16VisionService
+    VGG16_VISION_AVAILABLE = True
+except ImportError:
+    VGG16VisionService = None
+    VGG16_VISION_AVAILABLE = False
+
+try:
+    from .blip_vision_service import BLIPVisionService
+    BLIP_VISION_AVAILABLE = True
+except ImportError:
+    BLIPVisionService = None
+    BLIP_VISION_AVAILABLE = False
+
 __all__ = [
     "BaseVisionService",
     "OpenAIVisionService",
@@ -43,4 +58,10 @@ if ISA_VISION_AVAILABLE:
     __all__.append("ISAVisionService")
 
 if OLLAMA_VISION_AVAILABLE:
-    __all__.append("OllamaVisionService")
+    __all__.append("OllamaVisionService")
+
+if VGG16_VISION_AVAILABLE:
+    __all__.append("VGG16VisionService")
+
+if BLIP_VISION_AVAILABLE:
+    __all__.append("BLIPVisionService")
isa_model/inference/services/vision/blip_vision_service.py (new file):

@@ -0,0 +1,359 @@
+#!/usr/bin/env python3
+"""
+BLIP Vision Service
+Computer vision service using BLIP for image captioning and description
+Based on the notebook implementation
+"""
+
+import os
+import logging
+from typing import Dict, List, Any, Optional, Union, BinaryIO
+from PIL import Image
+import io
+
+from .base_vision_service import BaseVisionService
+
+logger = logging.getLogger(__name__)
+
+def _lazy_import_blip_deps():
+    """Lazy import BLIP dependencies"""
+    try:
+        import torch
+        import tensorflow as tf
+        from transformers import BlipProcessor, BlipForConditionalGeneration
+
+        return {
+            'torch': torch,
+            'tf': tf,
+            'BlipProcessor': BlipProcessor,
+            'BlipForConditionalGeneration': BlipForConditionalGeneration,
+            'available': True
+        }
+    except ImportError as e:
+        logger.warning(f"BLIP dependencies not available: {e}")
+        return {'available': False}
+
+class BLIPVisionService(BaseVisionService):
+    """
+    BLIP-based vision service for image captioning and description
+    Provides an alternative implementation to VLM-based captioning
+    """
+
+    def __init__(self, model_name: str = "Salesforce/blip-image-captioning-base"):
+        """
+        Initialize BLIP vision service
+
+        Args:
+            model_name: Hugging Face model name for BLIP
+        """
+        super().__init__()
+
+        self.model_name = model_name
+        self.processor = None
+        self.model = None
+
+        # Lazy load dependencies
+        self.blip_components = _lazy_import_blip_deps()
+
+        if not self.blip_components['available']:
+            raise ImportError("BLIP dependencies (transformers, torch) are required")
+
+        # Load BLIP model
+        self._load_blip_model()
+
+    def _load_blip_model(self):
+        """Load BLIP model and processor"""
+        try:
+            # Load the pretrained BLIP processor and model
+            self.processor = self.blip_components['BlipProcessor'].from_pretrained(self.model_name)
+            self.model = self.blip_components['BlipForConditionalGeneration'].from_pretrained(self.model_name)
+
+            logger.info(f"BLIP model loaded: {self.model_name}")
+
+        except Exception as e:
+            logger.error(f"Error loading BLIP model: {e}")
+            raise
+
+    def _preprocess_image(self, image: Union[str, BinaryIO]) -> Image.Image:
+        """
+        Preprocess image for BLIP input
+
+        Args:
+            image: Image path or binary data
+
+        Returns:
+            PIL Image in RGB format
+        """
+        try:
+            # Handle different image input types
+            if isinstance(image, str):
+                # File path
+                pil_image = Image.open(image).convert('RGB')
+            elif hasattr(image, 'read'):
+                # Binary IO
+                image_data = image.read()
+                pil_image = Image.open(io.BytesIO(image_data)).convert('RGB')
+            else:
+                raise ValueError("Unsupported image format")
+
+            return pil_image
+
+        except Exception as e:
+            logger.error(f"Error preprocessing image: {e}")
+            raise
+
+    def _generate_text(self, image: Image.Image, prompt: str) -> str:
+        """
+        Generate text for image using BLIP
+
+        Args:
+            image: PIL Image
+            prompt: Text prompt for generation
+
+        Returns:
+            Generated text
+        """
+        try:
+            # Prepare inputs for BLIP model
+            inputs = self.processor(images=image, text=prompt, return_tensors="pt")
+
+            # Generate text output
+            output = self.model.generate(**inputs)
+
+            # Decode output
+            result = self.processor.decode(output[0], skip_special_tokens=True)
+
+            return result
+
+        except Exception as e:
+            logger.error(f"Error generating text: {e}")
+            raise
+
+    async def describe_image(self,
+                             image: Union[str, BinaryIO],
+                             detail_level: str = "medium") -> Dict[str, Any]:
+        """
+        Generate description for image using BLIP
+
+        Args:
+            image: Image path or binary data
+            detail_level: Level of detail (not used in BLIP, maintained for compatibility)
+
+        Returns:
+            Description results
+        """
+        try:
+            # Preprocess image
+            pil_image = self._preprocess_image(image)
+
+            # Generate caption using BLIP
+            prompt = "This is a picture of"  # Following notebook implementation
+            caption = self._generate_text(pil_image, prompt)
+
+            return {
+                "task": "describe",
+                "service": "BLIPVisionService",
+                "description": caption,
+                "detail_level": detail_level,
+                "model_type": "BLIP",
+                "prompt_used": prompt,
+                "success": True
+            }
+
+        except Exception as e:
+            logger.error(f"Error describing image: {e}")
+            return {
+                "error": str(e),
+                "service": "BLIPVisionService",
+                "success": False
+            }
+
+    async def analyze_image(self,
+                            image: Union[str, BinaryIO],
+                            prompt: Optional[str] = None,
+                            max_tokens: int = 1000) -> Dict[str, Any]:
+        """
+        Analyze image using BLIP
+
+        Args:
+            image: Image path or binary data
+            prompt: Optional custom prompt
+            max_tokens: Not used for BLIP
+
+        Returns:
+            Analysis results
+        """
+        try:
+            # Preprocess image
+            pil_image = self._preprocess_image(image)
+
+            # Use custom prompt or default
+            if prompt:
+                analysis_prompt = prompt
+            else:
+                analysis_prompt = "This is a detailed photo showing"  # For summary-like analysis
+
+            # Generate analysis using BLIP
+            analysis_text = self._generate_text(pil_image, analysis_prompt)
+
+            return {
+                "task": "analyze",
+                "service": "BLIPVisionService",
+                "text": analysis_text,
+                "model_type": "BLIP",
+                "prompt_used": analysis_prompt,
+                "success": True
+            }
+
+        except Exception as e:
+            logger.error(f"Error analyzing image: {e}")
+            return {
+                "error": str(e),
+                "service": "BLIPVisionService",
+                "success": False
+            }
+
+    async def generate_caption(self, image: Union[str, BinaryIO]) -> Dict[str, Any]:
+        """
+        Generate caption for image (Task 9 from notebook)
+
+        Args:
+            image: Image path or binary data
+
+        Returns:
+            Caption results
+        """
+        try:
+            # Preprocess image
+            pil_image = self._preprocess_image(image)
+
+            # Generate caption
+            prompt = "This is a picture of"  # Following notebook
+            caption = self._generate_text(pil_image, prompt)
+
+            return {
+                "task": "caption",
+                "service": "BLIPVisionService",
+                "caption": caption,
+                "model_type": "BLIP",
+                "success": True
+            }
+
+        except Exception as e:
+            logger.error(f"Error generating caption: {e}")
+            return {
+                "error": str(e),
+                "service": "BLIPVisionService",
+                "success": False
+            }
+
+    async def generate_summary(self, image: Union[str, BinaryIO]) -> Dict[str, Any]:
+        """
+        Generate summary for image (Task 10 from notebook)
+
+        Args:
+            image: Image path or binary data
+
+        Returns:
+            Summary results
+        """
+        try:
+            # Preprocess image
+            pil_image = self._preprocess_image(image)
+
+            # Generate summary
+            prompt = "This is a detailed photo showing"  # Following notebook
+            summary = self._generate_text(pil_image, prompt)
+
+            return {
+                "task": "summary",
+                "service": "BLIPVisionService",
+                "summary": summary,
+                "model_type": "BLIP",
+                "success": True
+            }
+
+        except Exception as e:
+            logger.error(f"Error generating summary: {e}")
+            return {
+                "error": str(e),
+                "service": "BLIPVisionService",
+                "success": False
+            }
+
+    async def batch_generate(self,
+                             images: List[Union[str, BinaryIO]],
+                             task: str = "caption") -> Dict[str, Any]:
+        """
+        Generate captions or summaries for multiple images
+
+        Args:
+            images: List of image paths or binary data
+            task: Task type ("caption" or "summary")
+
+        Returns:
+            Batch generation results
+        """
+        try:
+            results = []
+            errors = []
+
+            for i, image in enumerate(images):
+                try:
+                    if task == "caption":
+                        result = await self.generate_caption(image)
+                    elif task == "summary":
+                        result = await self.generate_summary(image)
+                    else:
+                        raise ValueError(f"Unsupported task: {task}")
+
+                    if result.get("success"):
+                        results.append({
+                            "index": i,
+                            "image": str(image) if isinstance(image, str) else f"binary_image_{i}",
+                            **result
+                        })
+                    else:
+                        errors.append({
+                            "index": i,
+                            "image": str(image) if isinstance(image, str) else f"binary_image_{i}",
+                            "error": result.get("error", "Unknown error")
+                        })
+
+                except Exception as e:
+                    errors.append({
+                        "index": i,
+                        "image": str(image) if isinstance(image, str) else f"binary_image_{i}",
+                        "error": str(e)
+                    })
+
+            return {
+                "task": f"batch_{task}",
+                "service": "BLIPVisionService",
+                "total_images": len(images),
+                "successful": len(results),
+                "failed": len(errors),
+                "results": results,
+                "errors": errors,
+                "success": True
+            }
+
+        except Exception as e:
+            logger.error(f"Error in batch generation: {e}")
+            return {
+                "error": str(e),
+                "service": "BLIPVisionService",
+                "success": False
+            }
+
+    def get_service_info(self) -> Dict[str, Any]:
+        """Get service information"""
+        return {
+            "service_name": "BLIPVisionService",
+            "model_name": self.model_name,
+            "model_type": "BLIP",
+            "capabilities": ["describe", "analyze", "caption", "summary", "batch_generate"],
+            "model_loaded": self.model is not None,
+            "processor_loaded": self.processor is not None,
+            "dependencies_available": self.blip_components['available']
+        }
isa_model/inference/services/vision/helpers/image_utils.py:

@@ -59,25 +59,28 @@ def get_image_data(image: Union[str, BinaryIO]) -> bytes:
 
 def compress_image(image_data: Union[bytes, BytesIO], max_size: int = 1024) -> bytes:
     """压缩图片以减小大小
-    
+
     Args:
         image_data: 图片数据,可以是 bytes 或 BytesIO
         max_size: 最大尺寸(像素)
-    
+
     Returns:
         bytes: 压缩后的图片数据
     """
     try:
+        # Ensure max_size is int (type safety)
+        max_size = int(max_size)
+
         # 如果输入是 bytes,转换为 BytesIO
         if isinstance(image_data, bytes):
             image_data = BytesIO(image_data)
-        
+
         img = Image.open(image_data)
-        
+
         # 转换为 RGB 模式(如果需要)
         if img.mode in ('RGBA', 'P'):
             img = img.convert('RGB')
-        
+
         # 计算新尺寸,保持宽高比
         ratio = max_size / max(img.size)
         if ratio < 1: