PyPI - isa-model - Versions diffs - 0.3.9__py3-none-any.whl → 0.4.0__py3-none-any.whl - Mend

isa-model 0.3.9__py3-none-any.whl → 0.4.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (124) hide show

isa_model/__init__.py +1 -1
isa_model/client.py +732 -565
isa_model/core/cache/redis_cache.py +401 -0
isa_model/core/config/config_manager.py +53 -10
isa_model/core/config.py +1 -1
isa_model/core/database/__init__.py +1 -0
isa_model/core/database/migrations.py +277 -0
isa_model/core/database/supabase_client.py +123 -0
isa_model/core/models/__init__.py +37 -0
isa_model/core/models/model_billing_tracker.py +60 -88
isa_model/core/models/model_manager.py +36 -18
isa_model/core/models/model_repo.py +44 -38
isa_model/core/models/model_statistics_tracker.py +234 -0
isa_model/core/models/model_storage.py +0 -1
isa_model/core/models/model_version_manager.py +959 -0
isa_model/core/pricing_manager.py +2 -249
isa_model/core/resilience/circuit_breaker.py +366 -0
isa_model/core/security/secrets.py +358 -0
isa_model/core/services/__init__.py +2 -4
isa_model/core/services/intelligent_model_selector.py +101 -370
isa_model/core/storage/hf_storage.py +1 -1
isa_model/core/types.py +7 -0
isa_model/deployment/cloud/modal/isa_audio_chatTTS_service.py +520 -0
isa_model/deployment/cloud/modal/isa_audio_fish_service.py +0 -0
isa_model/deployment/cloud/modal/isa_audio_openvoice_service.py +758 -0
isa_model/deployment/cloud/modal/isa_audio_service_v2.py +1044 -0
isa_model/deployment/cloud/modal/isa_embed_rerank_service.py +296 -0
isa_model/deployment/cloud/modal/isa_video_hunyuan_service.py +423 -0
isa_model/deployment/cloud/modal/isa_vision_ocr_service.py +519 -0
isa_model/deployment/cloud/modal/isa_vision_qwen25_service.py +709 -0
isa_model/deployment/cloud/modal/isa_vision_table_service.py +467 -323
isa_model/deployment/cloud/modal/isa_vision_ui_service.py +607 -180
isa_model/deployment/cloud/modal/isa_vision_ui_service_optimized.py +660 -0
isa_model/deployment/core/deployment_manager.py +6 -4
isa_model/deployment/services/auto_hf_modal_deployer.py +894 -0
isa_model/eval/benchmarks/__init__.py +27 -0
isa_model/eval/benchmarks/multimodal_datasets.py +460 -0
isa_model/eval/benchmarks.py +244 -12
isa_model/eval/evaluators/__init__.py +8 -2
isa_model/eval/evaluators/audio_evaluator.py +727 -0
isa_model/eval/evaluators/embedding_evaluator.py +742 -0
isa_model/eval/evaluators/vision_evaluator.py +564 -0
isa_model/eval/example_evaluation.py +395 -0
isa_model/eval/factory.py +272 -5
isa_model/eval/isa_benchmarks.py +700 -0
isa_model/eval/isa_integration.py +582 -0
isa_model/eval/metrics.py +159 -6
isa_model/eval/tests/unit/test_basic.py +396 -0
isa_model/inference/ai_factory.py +44 -8
isa_model/inference/services/audio/__init__.py +21 -0
isa_model/inference/services/audio/base_realtime_service.py +225 -0
isa_model/inference/services/audio/isa_tts_service.py +0 -0
isa_model/inference/services/audio/openai_realtime_service.py +320 -124
isa_model/inference/services/audio/openai_stt_service.py +32 -6
isa_model/inference/services/base_service.py +17 -1
isa_model/inference/services/embedding/__init__.py +13 -0
isa_model/inference/services/embedding/base_embed_service.py +111 -8
isa_model/inference/services/embedding/isa_embed_service.py +305 -0
isa_model/inference/services/embedding/openai_embed_service.py +2 -4
isa_model/inference/services/embedding/tests/test_embedding.py +222 -0
isa_model/inference/services/img/__init__.py +2 -2
isa_model/inference/services/img/base_image_gen_service.py +24 -7
isa_model/inference/services/img/replicate_image_gen_service.py +84 -422
isa_model/inference/services/img/services/replicate_face_swap.py +193 -0
isa_model/inference/services/img/services/replicate_flux.py +226 -0
isa_model/inference/services/img/services/replicate_flux_kontext.py +219 -0
isa_model/inference/services/img/services/replicate_sticker_maker.py +249 -0
isa_model/inference/services/img/tests/test_img_client.py +297 -0
isa_model/inference/services/llm/base_llm_service.py +30 -6
isa_model/inference/services/llm/helpers/llm_adapter.py +63 -9
isa_model/inference/services/llm/ollama_llm_service.py +2 -1
isa_model/inference/services/llm/openai_llm_service.py +652 -55
isa_model/inference/services/llm/yyds_llm_service.py +2 -1
isa_model/inference/services/vision/__init__.py +5 -5
isa_model/inference/services/vision/base_vision_service.py +118 -185
isa_model/inference/services/vision/helpers/image_utils.py +11 -5
isa_model/inference/services/vision/isa_vision_service.py +573 -0
isa_model/inference/services/vision/tests/test_ocr_client.py +284 -0
isa_model/serving/api/fastapi_server.py +88 -16
isa_model/serving/api/middleware/auth.py +311 -0
isa_model/serving/api/middleware/security.py +278 -0
isa_model/serving/api/routes/analytics.py +486 -0
isa_model/serving/api/routes/deployments.py +339 -0
isa_model/serving/api/routes/evaluations.py +579 -0
isa_model/serving/api/routes/logs.py +430 -0
isa_model/serving/api/routes/settings.py +582 -0
isa_model/serving/api/routes/unified.py +324 -165
isa_model/serving/api/startup.py +304 -0
isa_model/serving/modal_proxy_server.py +249 -0
isa_model/training/__init__.py +100 -6
isa_model/training/core/__init__.py +4 -1
isa_model/training/examples/intelligent_training_example.py +281 -0
isa_model/training/intelligent/__init__.py +25 -0
isa_model/training/intelligent/decision_engine.py +643 -0
isa_model/training/intelligent/intelligent_factory.py +888 -0
isa_model/training/intelligent/knowledge_base.py +751 -0
isa_model/training/intelligent/resource_optimizer.py +839 -0
isa_model/training/intelligent/task_classifier.py +576 -0
isa_model/training/storage/__init__.py +24 -0
isa_model/training/storage/core_integration.py +439 -0
isa_model/training/storage/training_repository.py +552 -0
isa_model/training/storage/training_storage.py +628 -0
{isa_model-0.3.9.dist-info → isa_model-0.4.0.dist-info}/METADATA +13 -1
isa_model-0.4.0.dist-info/RECORD +182 -0
isa_model/deployment/cloud/modal/isa_vision_doc_service.py +0 -766
isa_model/deployment/cloud/modal/register_models.py +0 -321
isa_model/inference/adapter/unified_api.py +0 -248
isa_model/inference/services/helpers/stacked_config.py +0 -148
isa_model/inference/services/img/flux_professional_service.py +0 -603
isa_model/inference/services/img/helpers/base_stacked_service.py +0 -274
isa_model/inference/services/others/table_transformer_service.py +0 -61
isa_model/inference/services/vision/doc_analysis_service.py +0 -640
isa_model/inference/services/vision/helpers/base_stacked_service.py +0 -274
isa_model/inference/services/vision/ui_analysis_service.py +0 -823
isa_model/scripts/inference_tracker.py +0 -283
isa_model/scripts/mlflow_manager.py +0 -379
isa_model/scripts/model_registry.py +0 -465
isa_model/scripts/register_models.py +0 -370
isa_model/scripts/register_models_with_embeddings.py +0 -510
isa_model/scripts/start_mlflow.py +0 -95
isa_model/scripts/training_tracker.py +0 -257
isa_model-0.3.9.dist-info/RECORD +0 -138
{isa_model-0.3.9.dist-info → isa_model-0.4.0.dist-info}/WHEEL +0 -0
{isa_model-0.3.9.dist-info → isa_model-0.4.0.dist-info}/top_level.txt +0 -0

isa_model/serving/api/routes/unified.py CHANGED Viewed

@@ -9,13 +9,16 @@ This is the main API that handles all types of AI requests:
 - Embedding tasks
 """
-from fastapi import APIRouter, HTTPException, UploadFile, File, Form
+from fastapi import APIRouter, HTTPException, UploadFile, File, Form, Request, Depends
 from fastapi.responses import StreamingResponse
 from pydantic import BaseModel, Field
-from typing import Optional, Dict, Any, Union, List
+from typing import Optional, Dict, Any, Union, List, AsyncGenerator
 import logging
+from ..middleware.auth import optional_auth, require_read_access
+from ..middleware.security import rate_limit_standard, rate_limit_heavy, sanitize_input
 import asyncio
 import json
+import time
 from pathlib import Path
 from isa_model.client import ISAModelClient
@@ -24,30 +27,152 @@ logger = logging.getLogger(__name__)
 router = APIRouter()
 class UnifiedRequest(BaseModel):
-    """Unified request model for all AI services"""
-    input_data: Union[str, Dict[str, Any]] = Field(..., description="Input data (text, image URL, etc.)")
-    task: str = Field(..., description="Task to perform (chat, analyze_image, generate_speech, etc.)")
-    service_type: str = Field(..., description="Service type (text, vision, audio, image, embedding)")
-    model_hint: Optional[str] = Field(None, description="Optional model preference")
-    provider_hint: Optional[str] = Field(None, description="Optional provider preference")
-    stream: Optional[bool] = Field(False, description="Enable streaming for text services")
-    parameters: Optional[Dict[str, Any]] = Field(default_factory=dict, description="Additional task parameters")
+    """
+    **统一请求模型 - 支持所有AI服务类型**
+    这个模型为所有AI服务（文本、视觉、音频、图像生成、嵌入）提供统一的请求接口。
+    **支持的服务类型**:
+    - `text`: 文本服务 (聊天、生成、翻译)
+    - `vision`: 视觉服务 (图像分析、OCR、UI检测)
+    - `audio`: 音频服务 (TTS、STT、转录)
+    - `image`: 图像生成服务 (文本生成图像、图像转换)
+    - `embedding`: 嵌入服务 (文本向量化、相似度计算)
+    **请求示例**:
+    ```json
+    {
+        "input_data": "你好，世界！",
+        "task": "chat",
+        "service_type": "text",
+        "model": "gpt-4o-mini",
+        "provider": "openai"
+    }
+    ```
+    """
+    input_data: Union[str, Dict[str, Any]] = Field(
+        ...,
+        description="输入数据，支持多种格式：文本字符串、LangChain消息列表、图像URL/路径、音频文件路径等。根据service_type确定具体格式。",
+        examples=["你好，世界！", "https://example.com/image.jpg", "/path/to/audio.mp3"]
+    )
+    task: str = Field(
+        ...,
+        description="要执行的任务类型。常见任务：chat(聊天)、analyze_image(图像分析)、generate_speech(语音生成)、create_embedding(创建嵌入)等。",
+        examples=["chat", "analyze_image", "generate_speech", "transcribe", "generate_image", "create_embedding"]
+    )
+    service_type: str = Field(
+        ...,
+        description="服务类型，决定使用哪种AI服务。可选值：text、vision、audio、image、embedding。",
+        examples=["text", "vision", "audio", "image", "embedding"]
+    )
+    model: Optional[str] = Field(
+        None,
+        description="可选的模型指定。如果指定，系统将尝试使用该模型。常见模型：gpt-4o-mini、gpt-4o、whisper-1、flux-schnell等。",
+        examples=["gpt-4o-mini", "gpt-4o", "whisper-1", "tts-1", "flux-schnell", "text-embedding-3-small"]
+    )
+    provider: Optional[str] = Field(
+        None,
+        description="可选的服务提供商指定。如果指定，系统将尝试使用该提供商。常见提供商：openai、replicate、anthropic等。",
+        examples=["openai", "replicate", "anthropic"]
+    )
+    stream: Optional[bool] = Field(
+        None,
+        description="是否启用流式响应。仅适用于文本服务。text+chat任务默认启用流式。当使用工具调用时会自动禁用流式响应以确保完整性。"
+    )
+    tools: Optional[List[Dict[str, Any]]] = Field(
+        None,
+        description="可选的工具列表，用于函数调用功能。仅适用于文本服务。工具格式遵循LangChain工具规范。使用工具时会自动禁用流式响应。",
+        examples=[[
+            {
+                "name": "get_weather",
+                "description": "获取天气信息",
+                "parameters": {
+                    "type": "object",
+                    "properties": {
+                        "location": {"type": "string", "description": "城市名称"}
+                    },
+                    "required": ["location"]
+                }
+            }
+        ]]
+    )
+    parameters: Optional[Dict[str, Any]] = Field(
+        default_factory=dict,
+        description="额外的任务参数，用于精细控制服务行为。参数内容根据具体服务类型而定，如temperature、max_tokens、voice等。",
+        examples=[{"temperature": 0.7, "max_tokens": 1000}, {"voice": "alloy", "speed": 1.0}, {"width": 1024, "height": 1024}]
+    )
 class UnifiedResponse(BaseModel):
-    """Unified response model for all AI services"""
-    success: bool
-    result: Optional[Any] = None
-    error: Optional[str] = None
-    metadata: Dict[str, Any]
+    """
+    **统一响应模型 - 所有AI服务的标准响应格式**
+    提供一致的成功/失败状态、结果数据和元数据信息。
+    **成功响应示例**:
+    ```json
+    {
+        "success": true,
+        "result": {
+            "content": "你好！我是AI助手。",
+            "tool_calls": [],
+            "response_metadata": {
+                "token_usage": {
+                    "prompt_tokens": 15,
+                    "completion_tokens": 10,
+                    "total_tokens": 25
+                }
+            }
+        },
+        "error": null,
+        "metadata": {
+            "model_used": "gpt-4o-mini",
+            "provider": "openai",
+            "task": "chat",
+            "service_type": "text",
+            "processing_time": 1.23
+        }
+    }
+    ```
+    **错误响应示例**:
+    ```json
+    {
+        "success": false,
+        "result": null,
+        "error": "Model 'invalid-model' not found",
+        "metadata": {
+            "error_code": "MODEL_NOT_FOUND",
+            "task": "chat",
+            "service_type": "text"
+        }
+    }
+    ```
+    """
+    success: bool = Field(
+        ...,
+        description="请求是否成功执行。true表示成功，false表示失败。"
+    )
+    result: Optional[Any] = Field(
+        None,
+        description="服务执行结果。成功时包含实际数据，失败时为null。数据类型根据服务类型而定：文本服务返回AIMessage对象，视觉服务返回分析文本，音频服务返回文件路径或文本，图像服务返回图像URL，嵌入服务返回向量数组。"
+    )
+    error: Optional[str] = Field(
+        None,
+        description="错误信息描述。成功时为null，失败时包含详细的错误说明。"
+    )
+    metadata: Dict[str, Any] = Field(
+        ...,
+        description="响应元数据，包含执行信息如使用的模型、提供商、处理时间、token使用量等。元数据内容根据服务类型和执行情况而定。"
+    )
 # Global ISA client instance for server-side processing
 _isa_client = None
 def get_isa_client():
-    """Get or create ISA client for local processing"""
+    """Get or create ISA client for service processing"""
     global _isa_client
     if _isa_client is None:
-        _isa_client = ISAModelClient(mode="local")  # Use local mode
+        _isa_client = ISAModelClient()  # Use direct service mode
     return _isa_client
 @router.get("/")
@@ -61,11 +186,16 @@ async def unified_info():
         "version": "1.0.0"
     }
-@router.post("/invoke", response_model=UnifiedResponse)
-async def unified_invoke(request: UnifiedRequest) -> UnifiedResponse:
+@router.post("/invoke")
+@rate_limit_standard()
+async def unified_invoke(request: Request, user: Dict = Depends(require_read_access)):
     """
     **Unified API endpoint for all AI services**
+    Supports both JSON and multipart/form-data requests:
+    - JSON: Standard API request with UnifiedRequest body
+    - Form: File upload with form parameters
     This single endpoint handles:
     - Vision: image analysis, OCR, UI detection
     - Text: chat, generation, translation
@@ -76,167 +206,196 @@ async def unified_invoke(request: UnifiedRequest) -> UnifiedResponse:
     **Uses ISAModelClient in local mode - all the complex logic is in client.py**
     """
     try:
-        # Get ISA client instance (local mode)
+        # Get ISA client instance (service mode)
         client = get_isa_client()
-        # Use client's local invoke method directly
-        # This handles all the complexity: model selection, service routing, execution
-        result = await client._invoke_local(
-            input_data=request.input_data,
-            task=request.task,
-            service_type=request.service_type,
-            model_hint=request.model_hint,
-            provider_hint=request.provider_hint,
-            **request.parameters
-        )
-        # Return the result in our API format
-        return UnifiedResponse(
-            success=result["success"],
-            result=result.get("result"),
-            error=result.get("error"),
-            metadata=result["metadata"]
-        )
-    except Exception as e:
-        logger.error(f"Unified invoke failed: {e}")
-        return UnifiedResponse(
-            success=False,
-            error=str(e),
-            metadata={
-                "task": request.task,
-                "service_type": request.service_type,
-                "model_hint": request.model_hint,
-                "provider_hint": request.provider_hint
-            }
-        )
-@router.post("/stream")
-async def unified_stream(request: UnifiedRequest):
-    """
-    **Unified streaming endpoint for text services**
-    Returns Server-Sent Events (SSE) stream for real-time token generation.
-    Only supports text service types.
-    """
-    try:
-        # Validate streaming request
-        if request.service_type != "text":
-            raise HTTPException(status_code=400, detail="Streaming only supported for text services")
+        # Check content type to determine request format
+        content_type = request.headers.get("content-type", "")
-        # Get ISA client instance (local mode)
-        client = get_isa_client()
+        if content_type.startswith("multipart/form-data"):
+            # Handle form data with file upload
+            form = await request.form()
+            # Extract required fields
+            task = form.get("task")
+            service_type = form.get("service_type")
+            model = form.get("model")
+            provider = form.get("provider")
+            parameters = form.get("parameters")
+            file = form.get("file")
+            if not task or not service_type:
+                raise HTTPException(status_code=400, detail="task and service_type are required")
+            if file is None:
+                raise HTTPException(status_code=400, detail="file is required for multipart requests")
+            # Read file data
+            file_data = await file.read()
+            # Parse parameters if provided as JSON string
+            parsed_params = {}
+            if parameters:
+                try:
+                    parsed_params = json.loads(parameters)
+                except json.JSONDecodeError:
+                    parsed_params = {}
+            result = await client._invoke_service(
+                input_data=file_data,
+                task=task,
+                service_type=service_type,
+                model_hint=model,
+                provider_hint=provider,
+                filename=file.filename,
+                content_type=file.content_type,
+                file_size=len(file_data),
+                **parsed_params
+            )
+            # Return the result in our API format
+            return UnifiedResponse(
+                success=result["success"],
+                result=result.get("result"),
+                error=result.get("error"),
+                metadata={
+                    **result["metadata"],
+                    "filename": file.filename,
+                    "content_type": file.content_type,
+                    "file_size": len(file_data)
+                }
+            )
-        async def generate_stream():
-            """Generator for SSE streaming"""
+        else:
+            # Handle JSON request
             try:
-                # Use client's streaming method
-                stream_gen = await client.invoke(
-                    input_data=request.input_data,
-                    task=request.task,
-                    service_type=request.service_type,
-                    model_hint=request.model_hint,
-                    provider_hint=request.provider_hint,
-                    stream=True,
-                    **request.parameters
-                )
+                json_body = await request.json()
+                unified_request = UnifiedRequest(**json_body)
-                # Stream tokens as SSE format
-                async for token in stream_gen:
-                    # SSE format: "data: {json}\n\n"
-                    token_data = {
-                        "token": token,
-                        "type": "token"
-                    }
-                    yield f"data: {json.dumps(token_data)}\n\n"
-                # Send completion signal
-                completion_data = {
-                    "type": "completion",
-                    "status": "finished"
-                }
-                yield f"data: {json.dumps(completion_data)}\n\n"
+                # Sanitize string inputs to prevent XSS and injection attacks
+                if isinstance(unified_request.input_data, str):
+                    unified_request.input_data = sanitize_input(unified_request.input_data)
             except Exception as e:
-                logger.error(f"Streaming error: {e}")
-                error_data = {
-                    "type": "error",
-                    "error": str(e)
-                }
-                yield f"data: {json.dumps(error_data)}\n\n"
-        # Return SSE stream response
-        return StreamingResponse(
-            generate_stream(),
-            media_type="text/plain",
-            headers={
-                "Cache-Control": "no-cache",
-                "Connection": "keep-alive",
-                "Content-Type": "text/plain; charset=utf-8"
-            }
-        )
-    except Exception as e:
-        logger.error(f"Streaming setup failed: {e}")
-        raise HTTPException(status_code=500, detail=str(e))
-@router.post("/invoke-file", response_model=UnifiedResponse)
-async def unified_invoke_file(
-    task: str = Form(...),
-    service_type: str = Form(...),
-    model_hint: Optional[str] = Form(None),
-    provider_hint: Optional[str] = Form(None),
-    file: UploadFile = File(...)
-) -> UnifiedResponse:
-    """
-    Unified file upload endpoint
-    For tasks that require file input (images, audio, documents)
-    """
-    try:
-        # Read file data
-        file_data = await file.read()
-        # Get ISA client instance (local mode)
-        client = get_isa_client()
-        # Use client's local invoke method with binary data
-        result = await client._invoke_local(
-            input_data=file_data,  # Binary data
-            task=task,
-            service_type=service_type,
-            model_hint=model_hint,
-            provider_hint=provider_hint,
-            filename=file.filename,
-            content_type=file.content_type,
-            file_size=len(file_data)
-        )
-        # Return the result in our API format
-        return UnifiedResponse(
-            success=result["success"],
-            result=result.get("result"),
-            error=result.get("error"),
-            metadata={
-                **result["metadata"],
-                "filename": file.filename,
-                "content_type": file.content_type,
-                "file_size": len(file_data)
-            }
-        )
+                raise HTTPException(status_code=400, detail=f"Invalid JSON request: {e}")
+            # Prepare parameters, ensuring tools isn't duplicated
+            params = dict(unified_request.parameters) if unified_request.parameters else {}
+            if unified_request.tools:
+                params.pop("tools", None)  # Remove tools from parameters if present
+                params["tools"] = unified_request.tools
+            # Check if this should be a streaming response
+            # Default to streaming for text+chat unless explicitly disabled
+            is_text_chat = (unified_request.service_type == "text" and unified_request.task == "chat")
+            stream_setting = unified_request.stream if unified_request.stream is not None else is_text_chat
+            should_stream = (
+                is_text_chat and
+                not unified_request.tools and  # No tools
+                stream_setting  # Stream enabled by default for text+chat or explicitly
+            )
+            if should_stream:
+                # Return streaming response for text chat
+                async def generate_stream():
+                    try:
+                        # Use streaming invoke but track metadata manually
+                        collected_tokens = []
+                        selected_model = None
+                        service_info = None
+                        start_time = time.time()
+                        # Get model selection info first (lightweight operation)
+                        try:
+                            selected_model = await client._select_model(
+                                input_data=unified_request.input_data,
+                                task=unified_request.task,
+                                service_type=unified_request.service_type,
+                                model_hint=unified_request.model,
+                                provider_hint=unified_request.provider
+                            )
+                            service_info = {
+                                "model_used": selected_model["model_id"],
+                                "provider": selected_model["provider"],
+                                "task": unified_request.task,
+                                "service_type": unified_request.service_type,
+                                "selection_reason": selected_model.get("reason", "Default selection"),
+                                "streaming": True
+                            }
+                        except Exception:
+                            pass
+                        # Stream the tokens and get metadata
+                        processing_time = 0
+                        async for item in client.invoke_stream(
+                            input_data=unified_request.input_data,
+                            task=unified_request.task,
+                            service_type=unified_request.service_type,
+                            model=unified_request.model,
+                            provider=unified_request.provider,
+                            return_metadata=True,  # Request metadata with billing info
+                            **params
+                        ):
+                            if isinstance(item, tuple) and item[0] == 'metadata':
+                                # This is the final metadata with billing info
+                                metadata = item[1]
+                                processing_time = time.time() - start_time
+                                metadata["processing_time"] = processing_time
+                                yield f"data: {json.dumps({'metadata': metadata})}\n\n"
+                            else:
+                                # This is a token
+                                collected_tokens.append(item)
+                                yield f"data: {json.dumps({'token': item})}\n\n"
+                    except Exception as e:
+                        # Send error as final event
+                        yield f"data: {json.dumps({'error': str(e)})}\n\n"
+                    finally:
+                        # Send end-of-stream marker
+                        yield f"data: {json.dumps({'done': True})}\n\n"
+                return StreamingResponse(
+                    generate_stream(),
+                    media_type="text/event-stream",
+                    headers={
+                        "Cache-Control": "no-cache",
+                        "Connection": "keep-alive",
+                        "X-Accel-Buffering": "no"  # Disable nginx buffering
+                    }
+                )
+            else:
+                # Non-streaming response (original behavior)
+                result = await client._invoke_service(
+                    input_data=unified_request.input_data,
+                    task=unified_request.task,
+                    service_type=unified_request.service_type,
+                    model_hint=unified_request.model,
+                    provider_hint=unified_request.provider,
+                    **params
+                )
+                # Return the result in our API format
+                return UnifiedResponse(
+                    success=result["success"],
+                    result=result.get("result"),
+                    error=result.get("error"),
+                    metadata=result["metadata"]
+                )
+    except HTTPException:
+        raise
     except Exception as e:
-        logger.error(f"File invoke failed: {e}")
+        logger.error(f"Unified invoke failed: {e}")
         return UnifiedResponse(
             success=False,
             error=str(e),
-            metadata={
-                "task": task,
-                "service_type": service_type,
-                "filename": file.filename if file else None
-            }
+            metadata={}
         )
 @router.get("/models")
 async def get_available_models(service_type: Optional[str] = None):
     """Get available models (optional filter by service type)"""

isa-model 0.3.9__py3-none-any.whl → 0.4.0__py3-none-any.whl

isa-model 0.3.9__py3-none-any.whl → 0.4.0__py3-none-any.whl