isa-model 0.3.91__py3-none-any.whl → 0.4.3__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- isa_model/client.py +1166 -584
- isa_model/core/cache/redis_cache.py +410 -0
- isa_model/core/config/config_manager.py +282 -12
- isa_model/core/config.py +91 -1
- isa_model/core/database/__init__.py +1 -0
- isa_model/core/database/direct_db_client.py +114 -0
- isa_model/core/database/migration_manager.py +563 -0
- isa_model/core/database/migrations.py +297 -0
- isa_model/core/database/supabase_client.py +258 -0
- isa_model/core/dependencies.py +316 -0
- isa_model/core/discovery/__init__.py +19 -0
- isa_model/core/discovery/consul_discovery.py +190 -0
- isa_model/core/logging/__init__.py +54 -0
- isa_model/core/logging/influx_logger.py +523 -0
- isa_model/core/logging/loki_logger.py +160 -0
- isa_model/core/models/__init__.py +46 -0
- isa_model/core/models/config_models.py +625 -0
- isa_model/core/models/deployment_billing_tracker.py +430 -0
- isa_model/core/models/model_billing_tracker.py +60 -88
- isa_model/core/models/model_manager.py +66 -25
- isa_model/core/models/model_metadata.py +690 -0
- isa_model/core/models/model_repo.py +217 -55
- isa_model/core/models/model_statistics_tracker.py +234 -0
- isa_model/core/models/model_storage.py +0 -1
- isa_model/core/models/model_version_manager.py +959 -0
- isa_model/core/models/system_models.py +857 -0
- isa_model/core/pricing_manager.py +2 -249
- isa_model/core/repositories/__init__.py +9 -0
- isa_model/core/repositories/config_repository.py +912 -0
- isa_model/core/resilience/circuit_breaker.py +366 -0
- isa_model/core/security/secrets.py +358 -0
- isa_model/core/services/__init__.py +2 -4
- isa_model/core/services/intelligent_model_selector.py +479 -370
- isa_model/core/storage/hf_storage.py +2 -2
- isa_model/core/types.py +8 -0
- isa_model/deployment/__init__.py +5 -48
- isa_model/deployment/core/__init__.py +2 -31
- isa_model/deployment/core/deployment_manager.py +1278 -368
- isa_model/deployment/local/__init__.py +31 -0
- isa_model/deployment/local/config.py +248 -0
- isa_model/deployment/local/gpu_gateway.py +607 -0
- isa_model/deployment/local/health_checker.py +428 -0
- isa_model/deployment/local/provider.py +586 -0
- isa_model/deployment/local/tensorrt_service.py +621 -0
- isa_model/deployment/local/transformers_service.py +644 -0
- isa_model/deployment/local/vllm_service.py +527 -0
- isa_model/deployment/modal/__init__.py +8 -0
- isa_model/deployment/modal/config.py +136 -0
- isa_model/deployment/modal/deployer.py +894 -0
- isa_model/deployment/modal/services/__init__.py +3 -0
- isa_model/deployment/modal/services/audio/__init__.py +1 -0
- isa_model/deployment/modal/services/audio/isa_audio_chatTTS_service.py +520 -0
- isa_model/deployment/modal/services/audio/isa_audio_openvoice_service.py +758 -0
- isa_model/deployment/modal/services/audio/isa_audio_service_v2.py +1044 -0
- isa_model/deployment/modal/services/embedding/__init__.py +1 -0
- isa_model/deployment/modal/services/embedding/isa_embed_rerank_service.py +296 -0
- isa_model/deployment/modal/services/llm/__init__.py +1 -0
- isa_model/deployment/modal/services/llm/isa_llm_service.py +424 -0
- isa_model/deployment/modal/services/video/__init__.py +1 -0
- isa_model/deployment/modal/services/video/isa_video_hunyuan_service.py +423 -0
- isa_model/deployment/modal/services/vision/__init__.py +1 -0
- isa_model/deployment/modal/services/vision/isa_vision_ocr_service.py +519 -0
- isa_model/deployment/modal/services/vision/isa_vision_qwen25_service.py +709 -0
- isa_model/deployment/modal/services/vision/isa_vision_table_service.py +676 -0
- isa_model/deployment/modal/services/vision/isa_vision_ui_service.py +833 -0
- isa_model/deployment/modal/services/vision/isa_vision_ui_service_optimized.py +660 -0
- isa_model/deployment/models/org-org-acme-corp-tenant-a-service-llm-20250825-225822/tenant-a-service_modal_service.py +48 -0
- isa_model/deployment/models/org-test-org-123-prefix-test-service-llm-20250825-225822/prefix-test-service_modal_service.py +48 -0
- isa_model/deployment/models/test-llm-service-llm-20250825-204442/test-llm-service_modal_service.py +48 -0
- isa_model/deployment/models/test-monitoring-gpt2-llm-20250825-212906/test-monitoring-gpt2_modal_service.py +48 -0
- isa_model/deployment/models/test-monitoring-gpt2-llm-20250825-213009/test-monitoring-gpt2_modal_service.py +48 -0
- isa_model/deployment/storage/__init__.py +5 -0
- isa_model/deployment/storage/deployment_repository.py +824 -0
- isa_model/deployment/triton/__init__.py +10 -0
- isa_model/deployment/triton/config.py +196 -0
- isa_model/deployment/triton/configs/__init__.py +1 -0
- isa_model/deployment/triton/provider.py +512 -0
- isa_model/deployment/triton/scripts/__init__.py +1 -0
- isa_model/deployment/triton/templates/__init__.py +1 -0
- isa_model/inference/__init__.py +47 -1
- isa_model/inference/ai_factory.py +179 -16
- isa_model/inference/legacy_services/__init__.py +21 -0
- isa_model/inference/legacy_services/model_evaluation.py +637 -0
- isa_model/inference/legacy_services/model_service.py +573 -0
- isa_model/inference/legacy_services/model_serving.py +717 -0
- isa_model/inference/legacy_services/model_training.py +561 -0
- isa_model/inference/models/__init__.py +21 -0
- isa_model/inference/models/inference_config.py +551 -0
- isa_model/inference/models/inference_record.py +675 -0
- isa_model/inference/models/performance_models.py +714 -0
- isa_model/inference/repositories/__init__.py +9 -0
- isa_model/inference/repositories/inference_repository.py +828 -0
- isa_model/inference/services/audio/__init__.py +21 -0
- isa_model/inference/services/audio/base_realtime_service.py +225 -0
- isa_model/inference/services/audio/base_stt_service.py +184 -11
- isa_model/inference/services/audio/isa_tts_service.py +0 -0
- isa_model/inference/services/audio/openai_realtime_service.py +320 -124
- isa_model/inference/services/audio/openai_stt_service.py +53 -11
- isa_model/inference/services/base_service.py +17 -1
- isa_model/inference/services/custom_model_manager.py +277 -0
- isa_model/inference/services/embedding/__init__.py +13 -0
- isa_model/inference/services/embedding/base_embed_service.py +111 -8
- isa_model/inference/services/embedding/isa_embed_service.py +305 -0
- isa_model/inference/services/embedding/ollama_embed_service.py +15 -3
- isa_model/inference/services/embedding/openai_embed_service.py +2 -4
- isa_model/inference/services/embedding/resilient_embed_service.py +285 -0
- isa_model/inference/services/embedding/tests/test_embedding.py +222 -0
- isa_model/inference/services/img/__init__.py +2 -2
- isa_model/inference/services/img/base_image_gen_service.py +24 -7
- isa_model/inference/services/img/replicate_image_gen_service.py +84 -422
- isa_model/inference/services/img/services/replicate_face_swap.py +193 -0
- isa_model/inference/services/img/services/replicate_flux.py +226 -0
- isa_model/inference/services/img/services/replicate_flux_kontext.py +219 -0
- isa_model/inference/services/img/services/replicate_sticker_maker.py +249 -0
- isa_model/inference/services/img/tests/test_img_client.py +297 -0
- isa_model/inference/services/llm/__init__.py +10 -2
- isa_model/inference/services/llm/base_llm_service.py +361 -26
- isa_model/inference/services/llm/cerebras_llm_service.py +628 -0
- isa_model/inference/services/llm/helpers/llm_adapter.py +71 -12
- isa_model/inference/services/llm/helpers/llm_prompts.py +342 -0
- isa_model/inference/services/llm/helpers/llm_utils.py +321 -23
- isa_model/inference/services/llm/huggingface_llm_service.py +581 -0
- isa_model/inference/services/llm/local_llm_service.py +747 -0
- isa_model/inference/services/llm/ollama_llm_service.py +11 -3
- isa_model/inference/services/llm/openai_llm_service.py +670 -56
- isa_model/inference/services/llm/yyds_llm_service.py +10 -3
- isa_model/inference/services/vision/__init__.py +27 -6
- isa_model/inference/services/vision/base_vision_service.py +118 -185
- isa_model/inference/services/vision/blip_vision_service.py +359 -0
- isa_model/inference/services/vision/helpers/image_utils.py +19 -10
- isa_model/inference/services/vision/isa_vision_service.py +634 -0
- isa_model/inference/services/vision/openai_vision_service.py +19 -10
- isa_model/inference/services/vision/tests/test_ocr_client.py +284 -0
- isa_model/inference/services/vision/vgg16_vision_service.py +257 -0
- isa_model/serving/api/cache_manager.py +245 -0
- isa_model/serving/api/dependencies/__init__.py +1 -0
- isa_model/serving/api/dependencies/auth.py +194 -0
- isa_model/serving/api/dependencies/database.py +139 -0
- isa_model/serving/api/error_handlers.py +284 -0
- isa_model/serving/api/fastapi_server.py +240 -18
- isa_model/serving/api/middleware/auth.py +317 -0
- isa_model/serving/api/middleware/security.py +268 -0
- isa_model/serving/api/middleware/tenant_context.py +414 -0
- isa_model/serving/api/routes/analytics.py +489 -0
- isa_model/serving/api/routes/config.py +645 -0
- isa_model/serving/api/routes/deployment_billing.py +315 -0
- isa_model/serving/api/routes/deployments.py +475 -0
- isa_model/serving/api/routes/gpu_gateway.py +440 -0
- isa_model/serving/api/routes/health.py +32 -12
- isa_model/serving/api/routes/inference_monitoring.py +486 -0
- isa_model/serving/api/routes/local_deployments.py +448 -0
- isa_model/serving/api/routes/logs.py +430 -0
- isa_model/serving/api/routes/settings.py +582 -0
- isa_model/serving/api/routes/tenants.py +575 -0
- isa_model/serving/api/routes/unified.py +992 -171
- isa_model/serving/api/routes/webhooks.py +479 -0
- isa_model/serving/api/startup.py +318 -0
- isa_model/serving/modal_proxy_server.py +249 -0
- isa_model/utils/gpu_utils.py +311 -0
- {isa_model-0.3.91.dist-info → isa_model-0.4.3.dist-info}/METADATA +76 -22
- isa_model-0.4.3.dist-info/RECORD +193 -0
- isa_model/deployment/cloud/__init__.py +0 -9
- isa_model/deployment/cloud/modal/__init__.py +0 -10
- isa_model/deployment/cloud/modal/isa_vision_doc_service.py +0 -766
- isa_model/deployment/cloud/modal/isa_vision_table_service.py +0 -532
- isa_model/deployment/cloud/modal/isa_vision_ui_service.py +0 -406
- isa_model/deployment/cloud/modal/register_models.py +0 -321
- isa_model/deployment/core/deployment_config.py +0 -356
- isa_model/deployment/core/isa_deployment_service.py +0 -401
- isa_model/deployment/gpu_int8_ds8/app/server.py +0 -66
- isa_model/deployment/gpu_int8_ds8/scripts/test_client.py +0 -43
- isa_model/deployment/gpu_int8_ds8/scripts/test_client_os.py +0 -35
- isa_model/deployment/runtime/deployed_service.py +0 -338
- isa_model/deployment/services/__init__.py +0 -9
- isa_model/deployment/services/auto_deploy_vision_service.py +0 -538
- isa_model/deployment/services/model_service.py +0 -332
- isa_model/deployment/services/service_monitor.py +0 -356
- isa_model/deployment/services/service_registry.py +0 -527
- isa_model/eval/__init__.py +0 -92
- isa_model/eval/benchmarks.py +0 -469
- isa_model/eval/config/__init__.py +0 -10
- isa_model/eval/config/evaluation_config.py +0 -108
- isa_model/eval/evaluators/__init__.py +0 -18
- isa_model/eval/evaluators/base_evaluator.py +0 -503
- isa_model/eval/evaluators/llm_evaluator.py +0 -472
- isa_model/eval/factory.py +0 -531
- isa_model/eval/infrastructure/__init__.py +0 -24
- isa_model/eval/infrastructure/experiment_tracker.py +0 -466
- isa_model/eval/metrics.py +0 -798
- isa_model/inference/adapter/unified_api.py +0 -248
- isa_model/inference/services/helpers/stacked_config.py +0 -148
- isa_model/inference/services/img/flux_professional_service.py +0 -603
- isa_model/inference/services/img/helpers/base_stacked_service.py +0 -274
- isa_model/inference/services/others/table_transformer_service.py +0 -61
- isa_model/inference/services/vision/doc_analysis_service.py +0 -640
- isa_model/inference/services/vision/helpers/base_stacked_service.py +0 -274
- isa_model/inference/services/vision/ui_analysis_service.py +0 -823
- isa_model/scripts/inference_tracker.py +0 -283
- isa_model/scripts/mlflow_manager.py +0 -379
- isa_model/scripts/model_registry.py +0 -465
- isa_model/scripts/register_models.py +0 -370
- isa_model/scripts/register_models_with_embeddings.py +0 -510
- isa_model/scripts/start_mlflow.py +0 -95
- isa_model/scripts/training_tracker.py +0 -257
- isa_model/training/__init__.py +0 -74
- isa_model/training/annotation/annotation_schema.py +0 -47
- isa_model/training/annotation/processors/annotation_processor.py +0 -126
- isa_model/training/annotation/storage/dataset_manager.py +0 -131
- isa_model/training/annotation/storage/dataset_schema.py +0 -44
- isa_model/training/annotation/tests/test_annotation_flow.py +0 -109
- isa_model/training/annotation/tests/test_minio copy.py +0 -113
- isa_model/training/annotation/tests/test_minio_upload.py +0 -43
- isa_model/training/annotation/views/annotation_controller.py +0 -158
- isa_model/training/cloud/__init__.py +0 -22
- isa_model/training/cloud/job_orchestrator.py +0 -402
- isa_model/training/cloud/runpod_trainer.py +0 -454
- isa_model/training/cloud/storage_manager.py +0 -482
- isa_model/training/core/__init__.py +0 -23
- isa_model/training/core/config.py +0 -181
- isa_model/training/core/dataset.py +0 -222
- isa_model/training/core/trainer.py +0 -720
- isa_model/training/core/utils.py +0 -213
- isa_model/training/factory.py +0 -424
- isa_model-0.3.91.dist-info/RECORD +0 -138
- /isa_model/{core/storage/minio_storage.py → deployment/modal/services/audio/isa_audio_fish_service.py} +0 -0
- /isa_model/deployment/{services → modal/services/vision}/simple_auto_deploy_vision_service.py +0 -0
- {isa_model-0.3.91.dist-info → isa_model-0.4.3.dist-info}/WHEEL +0 -0
- {isa_model-0.3.91.dist-info → isa_model-0.4.3.dist-info}/top_level.txt +0 -0
Diff for isa_model/inference/services/llm/base_llm_service.py (+361 -26):

```diff
@@ -1,9 +1,12 @@
 from abc import ABC, abstractmethod
 from typing import Dict, Any, List, Union, Optional, AsyncGenerator, Callable
 import logging
+import json
 
 from isa_model.inference.services.base_service import BaseService
 from isa_model.inference.services.llm.helpers.llm_adapter import AdapterManager
+from isa_model.inference.services.llm.helpers.llm_utils import TokenCounter, TextProcessor, ResponseParser, LLMMetrics
+from isa_model.inference.services.llm.helpers.llm_prompts import LLMPrompts, LLMPromptTemplates
 
 logger = logging.getLogger(__name__)
 
```
```diff
@@ -18,6 +21,12 @@ class BaseLLMService(BaseService):
         # Initialize the adapter manager
         self.adapter_manager = AdapterManager()
 
+        # Initialize helper utilities (optional, can be overridden by specific services)
+        self.token_counter = TokenCounter(model_name)
+        self.text_processor = TextProcessor()
+        self.response_parser = ResponseParser()
+        self.llm_prompts = LLMPrompts()
+
         # Get config from provider
         provider_config = self.get_provider_config()
         self.streaming = provider_config.get("streaming", False)
```
```diff
@@ -28,6 +37,9 @@ class BaseLLMService(BaseService):
         self,
         input_data: Union[str, List[Dict[str, str]], Any],
         task: Optional[str] = None,
+        show_reasoning: bool = False,
+        output_format: Optional[str] = None,
+        json_schema: Optional[Dict] = None,
         **kwargs
     ) -> Dict[str, Any]:
         """
```
```diff
@@ -39,86 +51,219 @@
                 - list: message history, e.g. [{"role": "user", "content": "hello"}]
                 - Any: LangChain message objects or other formats
             task: task type; multiple LLM tasks are supported
+            output_format: Output format ("json", "markdown", "code", etc.)
+            json_schema: JSON schema for structured output validation
             **kwargs: task-specific additional parameters
 
         Returns:
-            Dict containing task results
+            Dict containing task results (optionally formatted as JSON)
         """
         task = task or "chat"
 
+        # Store formatting options for use by specific task methods
+        format_options = {
+            "output_format": output_format,
+            "json_schema": json_schema,
+            "repair_attempts": kwargs.get("repair_attempts", 3)
+        }
+
+        # Execute task and apply formatting
+        result = None
+
         # ==================== Chat tasks ====================
         if task == "chat":
-
+            # Pass all kwargs to ainvoke for better parameter support (like response_format)
+            result_raw = await self.ainvoke(input_data, show_reasoning=show_reasoning, **kwargs)
+            # Wrap in chat response format, preserving AIMessage objects with tool_calls
+            if hasattr(result_raw, 'tool_calls'):
+                # This is an AIMessage with tool_calls - preserve the entire object
+                result = {"message": result_raw}
+            elif hasattr(result_raw, 'content'):
+                # Regular AIMessage without tool_calls - extract content
+                content = result_raw.content
+                result = {"message": content}
+            else:
+                # Plain string response
+                content = str(result_raw)
+                result = {"message": content}
         elif task == "complete":
-
+            result = await self.complete_text(input_data, kwargs.get("max_tokens", self.max_tokens))
         elif task == "instruct":
-
+            result = await self.instruct(input_data, kwargs.get("instruction"), kwargs.get("max_tokens", self.max_tokens))
 
         # ==================== Text generation tasks ====================
         elif task == "generate":
-
+            result = await self.generate_text(input_data, kwargs.get("max_tokens", self.max_tokens))
         elif task == "rewrite":
-
+            result = await self.rewrite_text(input_data, kwargs.get("style"), kwargs.get("tone"))
         elif task == "summarize":
-
+            result = await self.summarize_text(input_data, kwargs.get("max_length"), kwargs.get("style"))
         elif task == "translate":
-
+            target_language = kwargs.get("target_language")
+            if not target_language:
+                raise ValueError("target_language is required for translate task")
+            result = await self.translate_text(input_data, target_language, kwargs.get("source_language"))
 
         # ==================== Analysis tasks ====================
         elif task == "analyze":
-
+            result = await self.analyze_text(input_data, kwargs.get("analysis_type"))
         elif task == "classify":
-
+            result = await self.classify_text(input_data, kwargs.get("categories"))
         elif task == "extract":
-
+            result = await self.extract_information(input_data, kwargs.get("extract_type"))
         elif task == "sentiment":
-
+            # Always use chat with appropriate prompt for sentiment analysis
+            if output_format == "json":
+                # Create JSON-formatted prompt
+                json_prompt = self.create_json_prompt(
+                    f"Please analyze the sentiment of the following text: {input_data}",
+                    json_schema or {
+                        "type": "object",
+                        "properties": {
+                            "sentiment": {"type": "string", "enum": ["positive", "negative", "neutral"]},
+                            "confidence": {"type": "number", "minimum": 0, "maximum": 1},
+                            "explanation": {"type": "string"}
+                        },
+                        "required": ["sentiment"]
+                    }
+                )
+                result = await self.chat(json_prompt, show_reasoning=show_reasoning)
+            else:
+                # Use simple chat prompt for sentiment analysis
+                sentiment_prompt = f"Please analyze the sentiment of the following text and classify it as positive, negative, or neutral:\n\n{input_data}\n\nSentiment:"
+                result = await self.chat(sentiment_prompt, show_reasoning=show_reasoning)
 
         # ==================== Coding tasks ====================
         elif task == "code":
-
+            # Always use chat with appropriate prompt for code generation
+            language = kwargs.get("language", "")
+            style = kwargs.get("style", "")
+
+            code_prompt = f"Please write code"
+            if language:
+                code_prompt += f" in {language}"
+            code_prompt += f" for the following requirement:\n\n{input_data}\n\n"
+
+            if style:
+                code_prompt += f"Style requirements: {style}\n\n"
+
+            code_prompt += "Please provide clean, working code with comments."
+
+            result = await self.chat(code_prompt, show_reasoning=show_reasoning)
         elif task == "explain_code":
-
+            result = await self.explain_code(input_data, kwargs.get("language"))
         elif task == "debug_code":
-
+            result = await self.debug_code(input_data, kwargs.get("language"))
         elif task == "refactor_code":
-
+            result = await self.refactor_code(input_data, kwargs.get("language"), kwargs.get("improvements"))
 
         # ==================== Reasoning tasks ====================
         elif task == "reason":
-
+            # Always use chat with appropriate prompt for reasoning
+            reasoning_type = kwargs.get("reasoning_type", "")
+
+            reason_prompt = f"Please analyze and explain the reasoning behind the following question or topic"
+            if reasoning_type:
+                reason_prompt += f" using {reasoning_type} reasoning"
+            reason_prompt += f":\n\n{input_data}\n\n"
+            reason_prompt += "Provide a clear, step-by-step explanation of your reasoning process."
+
+            result = await self.chat(reason_prompt, show_reasoning=show_reasoning)
         elif task == "solve":
-
+            # Always use chat with appropriate prompt for problem solving
+            problem_type = kwargs.get("problem_type", "")
+
+            solve_prompt = f"Please solve the following problem"
+            if problem_type:
+                solve_prompt += f" (type: {problem_type})"
+            solve_prompt += f":\n\n{input_data}\n\n"
+            solve_prompt += "Provide a clear solution with step-by-step explanation."
+
+            result = await self.chat(solve_prompt, show_reasoning=show_reasoning)
         elif task == "plan":
-
+            result = await self.create_plan(input_data, kwargs.get("plan_type"))
+        elif task == "deep_research":
+            result = await self.deep_research(input_data, kwargs.get("research_type"), kwargs.get("search_enabled", True))
 
         # ==================== Tool-calling tasks ====================
         elif task == "tool_call":
-
+            result = await self.call_tools(input_data, kwargs.get("available_tools"))
         elif task == "function_call":
-
+            function_name = kwargs.get("function_name")
+            if not function_name:
+                raise ValueError("function_name is required for function_call task")
+            result = await self.call_function(input_data, function_name, kwargs.get("parameters"))
 
         else:
             raise NotImplementedError(f"{self.__class__.__name__} does not support task: {task}")
+
+        # Apply output formatting if requested
+        if result is not None and output_format:
+            # Extract the raw response for formatting
+            # If result is a dict with 'message' key, use the message for formatting
+            format_input = result
+            if isinstance(result, dict) and 'message' in result:
+                format_input = result['message']
+
+            formatted_result = self.format_structured_output(
+                response=format_input,
+                output_format=output_format,
+                schema=json_schema,
+                repair_attempts=format_options.get("repair_attempts", 3)
+            )
+
+            # If formatting succeeded, return formatted result
+            if formatted_result.get("success", False):
+                return {
+                    "result": formatted_result["data"],
+                    "formatted": True,
+                    "format": output_format,
+                    "original": result
+                }
+            else:
+                # If formatting failed, return original with error info
+                return {
+                    "result": result,
+                    "formatted": False,
+                    "format_errors": formatted_result.get("errors", []),
+                    "original": result
+                }
+
+        # Return unformatted result
+        return result if result is not None else {"message": "Task completed but returned no result"}
 
     # ==================== Chat methods ====================
 
     async def chat(
         self,
         input_data: Union[str, List[Dict[str, str]], Any],
-        max_tokens: Optional[int] = None
+        max_tokens: Optional[int] = None,
+        show_reasoning: bool = False
     ) -> Dict[str, Any]:
         """
-        Chat -
+        Chat - delegates to the ainvoke method
 
         Args:
             input_data: input messages
             max_tokens: maximum number of tokens to generate
+            show_reasoning: whether to show the reasoning process
 
         Returns:
             Dict containing chat response
         """
-
+        result = await self.ainvoke(input_data, show_reasoning=show_reasoning)
+        # Ensure we return a proper response structure
+        if result is None:
+            logger.warning("ainvoke returned None - this may indicate an implementation issue")
+            return {"message": ""}
+
+        # Extract content if it's an AIMessage object
+        if hasattr(result, 'content'):
+            content = result.content
+        else:
+            content = str(result)
+
+        return {"message": content}
 
     # ==================== Text generation methods ====================
 
```
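Taken together, this hunk turns `invoke()` into a task dispatcher with optional structured output: every branch fills `result`, and a non-empty `output_format` routes it through `format_structured_output()` before returning. A minimal usage sketch follows; `get_llm_service()` is an assumed helper standing in for however the application obtains a concrete `BaseLLMService` subclass, and is not part of this diff.

```python
import asyncio

async def main():
    svc = get_llm_service()  # assumed helper, not part of this diff

    result = await svc.invoke(
        "The new release fixed every bug I reported. Fantastic work!",
        task="sentiment",
        output_format="json",  # routes the reply through format_structured_output()
    )

    if result.get("formatted"):
        print(result["result"])         # parsed JSON, e.g. {"sentiment": "positive", ...}
    else:
        print(result["format_errors"])  # parsing failed; raw reply kept under "original"

asyncio.run(main())
```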
```diff
@@ -303,6 +448,17 @@ class BaseLLMService(BaseService):
         """
         raise NotImplementedError(f"{self.__class__.__name__} does not support create_plan task")
 
+    async def deep_research(
+        self,
+        input_data: Union[str, Any],
+        research_type: Optional[str] = None,
+        search_enabled: bool = True
+    ) -> Dict[str, Any]:
+        """
+        Deep research - a task specific to O-series models, supporting web search and in-depth analysis
+        """
+        raise NotImplementedError(f"{self.__class__.__name__} does not support deep_research task")
+
     # ==================== Tool-calling methods ====================
 
     async def call_tools(
```
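The base implementation only defines the contract, so `task="deep_research"` (dispatched in the `invoke()` hunk above) succeeds only on subclasses that override this stub. A rough call sketch, with the service instance `svc` assumed:

```python
# Inside an async function; svc must be a subclass that overrides deep_research().
report = await svc.invoke(
    "Survey the licensing landscape for open-weight LLMs",
    task="deep_research",
    research_type="survey",  # forwarded as kwargs.get("research_type")
    search_enabled=True,     # forwarded as kwargs.get("search_enabled", True)
)
```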
```diff
@@ -354,7 +510,7 @@ class BaseLLMService(BaseService):
         """Convert message formats using the adapter manager"""
         return self.adapter_manager.convert_messages(input_data)
 
-    def _format_response(self, response: str, original_input: Any) -> Union[str, Any]:
+    def _format_response(self, response: Union[str, Any], original_input: Any) -> Union[str, Any]:
         """Format the response using the adapter manager"""
         return self.adapter_manager.format_response(response, original_input)
 
```
```diff
@@ -379,7 +535,7 @@ class BaseLLMService(BaseService):
         pass
 
     @abstractmethod
-    async def ainvoke(self, input_data: Union[str, List[Dict[str, str]], Any]) -> Union[str, Any]:
+    async def ainvoke(self, input_data: Union[str, List[Dict[str, str]], Any], show_reasoning: bool = False) -> Union[str, Any]:
         """
         Universal async invocation method that handles different input types
 
```
```diff
@@ -388,6 +544,7 @@ class BaseLLMService(BaseService):
             - str: Simple text prompt
             - list: Message history like [{"role": "user", "content": "hello"}]
             - Any: LangChain message objects or other formats
+            show_reasoning: If True and model supports it, show reasoning process
 
         Returns:
             Model response (string for simple cases, object for complex cases)
```
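Concrete services now have to accept the `show_reasoning` flag in their `ainvoke` override. Below is a toy subclass illustrating only the new signature; the echo logic is invented for this sketch, and any remaining abstract methods of `BaseLLMService` are assumed to be satisfied elsewhere.

```python
from typing import Any, Dict, List, Union

from isa_model.inference.services.llm.base_llm_service import BaseLLMService

class EchoLLMService(BaseLLMService):  # illustrative subclass only
    async def ainvoke(
        self,
        input_data: Union[str, List[Dict[str, str]], Any],
        show_reasoning: bool = False,
    ) -> Union[str, Any]:
        # A real service would call its provider API here; this just echoes.
        text = input_data if isinstance(input_data, str) else str(input_data)
        reply = f"echo: {text}"
        if show_reasoning:
            reply = "[reasoning trace would go here]\n" + reply
        # Reuse the adapter manager so LangChain inputs get matching outputs.
        return self._format_response(reply, input_data)
```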
```diff
@@ -491,6 +648,183 @@ class BaseLLMService(BaseService):
         )
         return 0.0
 
+    # ==================== JSON OUTPUT AND FORMATTING METHODS ====================
+
+    def format_structured_output(
+        self,
+        response: Union[str, Any],
+        output_format: str = "json",
+        schema: Optional[Dict] = None,
+        repair_attempts: int = 3
+    ) -> Dict[str, Any]:
+        """
+        Format response as structured output (JSON, etc.)
+
+        Args:
+            response: Raw response from model
+            output_format: Desired output format ("json", "code", "structured")
+            schema: Optional JSON schema for validation
+            repair_attempts: Number of JSON repair attempts
+
+        Returns:
+            Dict with formatted output and metadata
+        """
+        if output_format == "json":
+            if isinstance(response, str):
+                return self.text_processor.extract_json_from_text(response, schema, repair_attempts)
+            else:
+                # Handle response objects with content attribute
+                content = getattr(response, 'content', str(response))
+                return self.text_processor.extract_json_from_text(content, schema, repair_attempts)
+
+        elif output_format == "code":
+            content = response if isinstance(response, str) else getattr(response, 'content', str(response))
+            code_blocks = self.text_processor.extract_code_blocks(content)
+            return {
+                "success": True,
+                "data": code_blocks,
+                "method": "code_block_extraction",
+                "errors": []
+            }
+
+        elif output_format == "structured":
+            # Use ResponseParser for general structured parsing
+            content = response if isinstance(response, str) else getattr(response, 'content', str(response))
+            parsed = self.response_parser.parse_structured_response(content, "json")
+            if parsed:
+                return {
+                    "success": True,
+                    "data": parsed,
+                    "method": "structured_parsing",
+                    "errors": []
+                }
+            else:
+                return {
+                    "success": False,
+                    "data": content,
+                    "method": "raw_fallback",
+                    "errors": ["Failed to parse as structured output"]
+                }
+
+        # Fallback: return raw response
+        return {
+            "success": True,
+            "data": response,
+            "method": "raw_output",
+            "errors": []
+        }
+
+    def create_json_prompt(
+        self,
+        base_prompt: str,
+        json_schema: Optional[Dict] = None,
+        output_instructions: Optional[str] = None
+    ) -> str:
+        """
+        Create a prompt that requests JSON output
+
+        Args:
+            base_prompt: The base prompt content
+            json_schema: Optional JSON schema to include in prompt
+            output_instructions: Custom output format instructions
+
+        Returns:
+            Enhanced prompt requesting JSON output
+        """
+        if output_instructions:
+            json_instruction = output_instructions
+        else:
+            json_instruction = LLMPromptTemplates.OUTPUT_FORMATS["json"]
+
+        if json_schema:
+            schema_text = f"\n\nPlease format your response according to this JSON schema:\n```json\n{json.dumps(json_schema, indent=2)}\n```"
+            return f"{base_prompt}{schema_text}\n\n{json_instruction}"
+        else:
+            return f"{base_prompt}\n\n{json_instruction}"
+
+    def create_structured_prompt(
+        self,
+        task_type: str,
+        content: str,
+        output_format: str = "json",
+        **kwargs
+    ) -> str:
+        """
+        Create a structured prompt using LLMPrompts templates
+
+        Args:
+            task_type: Type of task (from LLMPrompts methods)
+            content: Main content/input
+            output_format: Desired output format
+            **kwargs: Additional arguments for the prompt template
+
+        Returns:
+            Formatted prompt string
+        """
+        try:
+            # Get the appropriate prompt template
+            if hasattr(self.llm_prompts, f"{task_type}_prompt"):
+                method = getattr(self.llm_prompts, f"{task_type}_prompt")
+                base_prompt = method(content, **kwargs)
+            else:
+                # Fallback to generic prompt
+                base_prompt = f"Please {task_type} the following:\n\n{content}"
+
+            # Add output format instructions
+            if output_format in LLMPromptTemplates.OUTPUT_FORMATS:
+                format_instruction = LLMPromptTemplates.OUTPUT_FORMATS[output_format]
+                return f"{base_prompt}\n\n{format_instruction}"
+
+            return base_prompt
+
+        except Exception as e:
+            logger.warning(f"Failed to create structured prompt: {e}")
+            return f"Please {task_type} the following:\n\n{content}"
+
+    def count_tokens(self, text: Union[str, List[Dict[str, str]]]) -> int:
+        """
+        Count tokens in text or message list
+
+        Args:
+            text: String or message list to count tokens for
+
+        Returns:
+            Number of tokens
+        """
+        if isinstance(text, str):
+            return self.token_counter.count_tokens(text)
+        elif isinstance(text, list):
+            return self.token_counter.count_messages_tokens(text)
+        else:
+            return self.token_counter.count_tokens(str(text))
+
+    def truncate_to_token_limit(self, text: str, max_tokens: int) -> str:
+        """
+        Truncate text to fit within token limit
+
+        Args:
+            text: Text to truncate
+            max_tokens: Maximum number of tokens
+
+        Returns:
+            Truncated text
+        """
+        return self.token_counter.truncate_text(text, max_tokens)
+
+    def split_text_by_tokens(self, text: str, chunk_size: int, overlap: int = 0) -> List[str]:
+        """
+        Split text into chunks by token count
+
+        Args:
+            text: Text to split
+            chunk_size: Size of each chunk in tokens
+            overlap: Number of overlapping tokens between chunks
+
+        Returns:
+            List of text chunks
+        """
+        return self.token_counter.split_text_by_tokens(text, chunk_size, overlap)
+
     # ==================== METADATA AND UTILITY METHODS ====================
 
     def get_supported_tasks(self) -> List[str]:
```
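These helpers are ordinary instance methods, so they can also be called directly, outside `invoke()`. A rough sketch against an already-constructed service instance (`svc` is assumed):

```python
raw = 'Model said: {"status": "ok", "items": [1, 2, 3]}'

parsed = svc.format_structured_output(raw, output_format="json")
if parsed["success"]:
    print(parsed["data"])    # the extracted JSON payload
else:
    print(parsed["errors"])

# The token utilities delegate to the TokenCounter created in __init__:
n = svc.count_tokens([{"role": "user", "content": "hello"}])
clipped = svc.truncate_to_token_limit("a very long document ...", max_tokens=256)
chunks = svc.split_text_by_tokens("a very long document ...", chunk_size=512, overlap=32)
```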
```diff
@@ -527,6 +861,7 @@ class BaseLLMService(BaseService):
             'reason_about': 'reason',
             'solve_problem': 'solve',
             'create_plan': 'plan',
+            'deep_research': 'deep_research',
             # Tool-calling tasks
             'call_tools': 'tool_call',
             'call_function': 'function_call'
```