isa-model 0.0.2__py3-none-any.whl → 0.3.1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- isa_model/__init__.py +1 -1
- isa_model/core/model_manager.py +69 -4
- isa_model/core/model_registry.py +273 -46
- isa_model/core/storage/hf_storage.py +419 -0
- isa_model/deployment/__init__.py +52 -0
- isa_model/deployment/core/__init__.py +34 -0
- isa_model/deployment/core/deployment_config.py +356 -0
- isa_model/deployment/core/deployment_manager.py +549 -0
- isa_model/deployment/core/isa_deployment_service.py +401 -0
- isa_model/eval/factory.py +381 -140
- isa_model/inference/ai_factory.py +427 -236
- isa_model/inference/billing_tracker.py +406 -0
- isa_model/inference/providers/base_provider.py +51 -4
- isa_model/inference/providers/ml_provider.py +50 -0
- isa_model/inference/providers/ollama_provider.py +37 -18
- isa_model/inference/providers/openai_provider.py +65 -36
- isa_model/inference/providers/replicate_provider.py +42 -30
- isa_model/inference/services/audio/base_stt_service.py +21 -2
- isa_model/inference/services/audio/openai_realtime_service.py +353 -0
- isa_model/inference/services/audio/openai_stt_service.py +252 -0
- isa_model/inference/services/audio/openai_tts_service.py +149 -9
- isa_model/inference/services/audio/replicate_tts_service.py +239 -0
- isa_model/inference/services/base_service.py +36 -1
- isa_model/inference/services/embedding/base_embed_service.py +112 -0
- isa_model/inference/services/embedding/ollama_embed_service.py +28 -2
- isa_model/inference/services/embedding/openai_embed_service.py +223 -0
- isa_model/inference/services/llm/__init__.py +2 -0
- isa_model/inference/services/llm/base_llm_service.py +158 -86
- isa_model/inference/services/llm/llm_adapter.py +414 -0
- isa_model/inference/services/llm/ollama_llm_service.py +252 -63
- isa_model/inference/services/llm/openai_llm_service.py +231 -93
- isa_model/inference/services/llm/triton_llm_service.py +481 -0
- isa_model/inference/services/ml/base_ml_service.py +78 -0
- isa_model/inference/services/ml/sklearn_ml_service.py +140 -0
- isa_model/inference/services/vision/__init__.py +3 -3
- isa_model/inference/services/vision/base_image_gen_service.py +161 -0
- isa_model/inference/services/vision/base_vision_service.py +177 -0
- isa_model/inference/services/vision/helpers/image_utils.py +4 -3
- isa_model/inference/services/vision/ollama_vision_service.py +151 -17
- isa_model/inference/services/vision/openai_vision_service.py +275 -41
- isa_model/inference/services/vision/replicate_image_gen_service.py +278 -118
- isa_model/training/__init__.py +62 -32
- isa_model/training/cloud/__init__.py +22 -0
- isa_model/training/cloud/job_orchestrator.py +402 -0
- isa_model/training/cloud/runpod_trainer.py +454 -0
- isa_model/training/cloud/storage_manager.py +482 -0
- isa_model/training/core/__init__.py +23 -0
- isa_model/training/core/config.py +181 -0
- isa_model/training/core/dataset.py +222 -0
- isa_model/training/core/trainer.py +720 -0
- isa_model/training/core/utils.py +213 -0
- isa_model/training/factory.py +229 -198
- isa_model-0.3.1.dist-info/METADATA +465 -0
- isa_model-0.3.1.dist-info/RECORD +91 -0
- isa_model/core/model_router.py +0 -226
- isa_model/core/model_version.py +0 -0
- isa_model/core/resource_manager.py +0 -202
- isa_model/deployment/gpu_fp16_ds8/models/deepseek_r1/1/model.py +0 -120
- isa_model/deployment/gpu_fp16_ds8/scripts/download_model.py +0 -18
- isa_model/training/engine/llama_factory/__init__.py +0 -39
- isa_model/training/engine/llama_factory/config.py +0 -115
- isa_model/training/engine/llama_factory/data_adapter.py +0 -284
- isa_model/training/engine/llama_factory/examples/__init__.py +0 -6
- isa_model/training/engine/llama_factory/examples/finetune_with_tracking.py +0 -185
- isa_model/training/engine/llama_factory/examples/rlhf_with_tracking.py +0 -163
- isa_model/training/engine/llama_factory/factory.py +0 -331
- isa_model/training/engine/llama_factory/rl.py +0 -254
- isa_model/training/engine/llama_factory/trainer.py +0 -171
- isa_model/training/image_model/configs/create_config.py +0 -37
- isa_model/training/image_model/configs/create_flux_config.py +0 -26
- isa_model/training/image_model/configs/create_lora_config.py +0 -21
- isa_model/training/image_model/prepare_massed_compute.py +0 -97
- isa_model/training/image_model/prepare_upload.py +0 -17
- isa_model/training/image_model/raw_data/create_captions.py +0 -16
- isa_model/training/image_model/raw_data/create_lora_captions.py +0 -20
- isa_model/training/image_model/raw_data/pre_processing.py +0 -200
- isa_model/training/image_model/train/train.py +0 -42
- isa_model/training/image_model/train/train_flux.py +0 -41
- isa_model/training/image_model/train/train_lora.py +0 -57
- isa_model/training/image_model/train_main.py +0 -25
- isa_model-0.0.2.dist-info/METADATA +0 -327
- isa_model-0.0.2.dist-info/RECORD +0 -92
- isa_model-0.0.2.dist-info/licenses/LICENSE +0 -21
- /isa_model/training/{llm_model/annotation → annotation}/annotation_schema.py +0 -0
- /isa_model/training/{llm_model/annotation → annotation}/processors/annotation_processor.py +0 -0
- /isa_model/training/{llm_model/annotation → annotation}/storage/dataset_manager.py +0 -0
- /isa_model/training/{llm_model/annotation → annotation}/storage/dataset_schema.py +0 -0
- /isa_model/training/{llm_model/annotation → annotation}/tests/test_annotation_flow.py +0 -0
- /isa_model/training/{llm_model/annotation → annotation}/tests/test_minio copy.py +0 -0
- /isa_model/training/{llm_model/annotation → annotation}/tests/test_minio_upload.py +0 -0
- /isa_model/training/{llm_model/annotation → annotation}/views/annotation_controller.py +0 -0
- {isa_model-0.0.2.dist-info → isa_model-0.3.1.dist-info}/WHEEL +0 -0
- {isa_model-0.0.2.dist-info → isa_model-0.3.1.dist-info}/top_level.txt +0 -0
isa_model/inference/services/llm/base_llm_service.py
@@ -1,134 +1,206 @@
 from abc import ABC, abstractmethod
-from typing import Dict, Any, List, Union, Optional, AsyncGenerator, TypeVar
+from typing import Dict, Any, List, Union, Optional, AsyncGenerator, Callable
 from isa_model.inference.services.base_service import BaseService
-
-T = TypeVar('T')  # Generic type for responses
+from isa_model.inference.services.llm.llm_adapter import AdapterManager

 class BaseLLMService(BaseService):
-    """Base class for Large Language Model services"""
+    """Base class for Large Language Model services with unified invoke interface"""

-
-
-
-
+    def __init__(self, provider, model_name: str):
+        super().__init__(provider, model_name)
+        self._bound_tools: List[Any] = []  # Store the original tool objects
+        self._tool_mappings: Dict[str, tuple] = {}  # Mapping from tool name to (tool, adapter)

-
-
-
-
-
-        """
-        pass
+        # Initialize the adapter manager
+        self.adapter_manager = AdapterManager()
+
+        # Get streaming config from provider config
+        self.streaming = self.config.get("streaming", False)

-
-    async def achat(self, messages: List[Dict[str, str]]) -> T:
+    def bind_tools(self, tools: List[Any], **kwargs) -> 'BaseLLMService':
         """
-
+        Bind tools to this LLM service for function calling

         Args:
-
-
+            tools: List of tools to bind (functions, LangChain tools, etc.)
+            **kwargs: Additional tool binding parameters

         Returns:
-
+            Self for method chaining
         """
-
+        self._bound_tools = tools
+        return self

-
-
-
-
+    async def _prepare_tools_for_request(self) -> List[Dict[str, Any]]:
+        """Prepare bound tools for a request"""
+        if not self._bound_tools:
+            return []

-
-
-
-
-
-
-
+        schemas, self._tool_mappings = await self.adapter_manager.convert_tools_to_schemas(self._bound_tools)
+        return schemas
+
+    def _prepare_messages(self, input_data: Union[str, List[Dict[str, str]], Any]) -> List[Dict[str, str]]:
+        """Convert message formats using the adapter manager"""
+        return self.adapter_manager.convert_messages(input_data)
+
+    def _format_response(self, response: str, original_input: Any) -> Union[str, Any]:
+        """Format the response using the adapter manager"""
+        return self.adapter_manager.format_response(response, original_input)
+
+    async def _execute_tool_call(self, tool_name: str, arguments: Dict[str, Any]) -> Any:
+        """Execute a tool call using the adapter manager"""
+        return await self.adapter_manager.execute_tool(tool_name, arguments, self._tool_mappings)

     @abstractmethod
-    async def
+    async def ainvoke(self, input_data: Union[str, List[Dict[str, str]], Any]) -> Union[str, Any]:
         """
-
+        Universal async invocation method that handles different input types

         Args:
-
-
+            input_data: Can be:
+                - str: Simple text prompt
+                - list: Message history like [{"role": "user", "content": "hello"}]
+                - Any: LangChain message objects or other formats

         Returns:
-
+            Model response (string for simple cases, object for complex cases)
         """
         pass

-
-    async def astream_chat(self, messages: List[Dict[str, str]]) -> AsyncGenerator[str, None]:
+    def invoke(self, input_data: Union[str, List[Dict[str, str]], Any]) -> Union[str, Any]:
         """
-
+        Synchronous wrapper for ainvoke

         Args:
-
+            input_data: Same as ainvoke

-
-
-        """
-
+        Returns:
+            Model response
+        """
+        import asyncio
+        try:
+            # Try to get current event loop
+            loop = asyncio.get_running_loop()
+            # If we're in an event loop, create a new thread
+            import concurrent.futures
+            with concurrent.futures.ThreadPoolExecutor() as executor:
+                future = executor.submit(asyncio.run, self.ainvoke(input_data))
+                return future.result()
+        except RuntimeError:
+            # No event loop running, create a new one
+            return asyncio.run(self.ainvoke(input_data))

-
-
-        """
-
+    # Old methods kept for backward compatibility
+    def _convert_tools_to_schema(self, tools: List[Union[Dict[str, Any], Callable]]) -> List[Dict[str, Any]]:
+        """Convert tools to OpenAI function calling schema (deprecated, use adapter manager)"""
+        import asyncio
+        try:
+            loop = asyncio.get_event_loop()
+            schemas, _ = loop.run_until_complete(self.adapter_manager.convert_tools_to_schemas(tools))
+            return schemas
+        except RuntimeError:
+            schemas, _ = asyncio.run(self.adapter_manager.convert_tools_to_schemas(tools))
+            return schemas
+
+    def _has_bound_tools(self) -> bool:
+        """Check if this service has bound tools"""
+        return bool(self._bound_tools)
+
+    def _get_bound_tools(self) -> List[Dict[str, Any]]:
+        """Get the bound tools schema"""
+        return self._bound_tools
+
+    def _convert_langchain_to_openai(self, messages: List[Any]) -> List[Dict[str, str]]:
+        """Convert LangChain message objects to OpenAI format"""
+        converted_messages = []

-
-
-
-
-
-
-
+        for msg in messages:
+            # Handle different LangChain message types
+            if hasattr(msg, 'type') and hasattr(msg, 'content'):
+                # LangChain message object
+                msg_dict = {"content": str(msg.content)}
+
+                # Map LangChain types to OpenAI roles
+                if msg.type == "system":
+                    msg_dict["role"] = "system"
+                elif msg.type == "human":
+                    msg_dict["role"] = "user"
+                elif msg.type == "ai":
+                    msg_dict["role"] = "assistant"
+                    # Handle tool calls if present
+                    if hasattr(msg, 'tool_calls') and msg.tool_calls:
+                        # Handle tool calls - need to store as separate key since it's not a string
+                        tool_calls = [
+                            {
+                                "id": tc.get("id", f"call_{i}"),
+                                "type": "function",
+                                "function": {
+                                    "name": tc["name"],
+                                    "arguments": tc.get("args", {}) if isinstance(tc.get("args"), dict) else tc.get("args", "{}")
+                                }
+                            } for i, tc in enumerate(msg.tool_calls)
+                        ]
+                        # Store tool_calls separately to avoid type issues
+                        msg_dict["tool_calls"] = tool_calls  # type: ignore
+                elif msg.type == "tool":
+                    msg_dict["role"] = "tool"
+                    if hasattr(msg, 'tool_call_id'):
+                        msg_dict["tool_call_id"] = msg.tool_call_id
+                elif msg.type == "function":  # Legacy function message
+                    msg_dict["role"] = "function"
+                    if hasattr(msg, 'name'):
+                        msg_dict["name"] = msg.name
+                else:
+                    msg_dict["role"] = "user"  # Default fallback
+
+                converted_messages.append(msg_dict)
+
+            elif isinstance(msg, dict):
+                # Already in OpenAI format
+                converted_messages.append(msg)
+            else:
+                # Fallback: treat as user message
+                converted_messages.append({"role": "user", "content": str(msg)})
+
+        return converted_messages

     @abstractmethod
     def get_token_usage(self) -> Dict[str, Any]:
-        """
-        Get cumulative token usage statistics for this service instance
-
-        Returns:
-            Dict containing token usage information:
-            - total_tokens: Total tokens used
-            - prompt_tokens: Tokens used for prompts
-            - completion_tokens: Tokens used for completions
-            - requests_count: Number of requests made
-        """
+        """Get cumulative token usage statistics"""
         pass

     @abstractmethod
     def get_last_token_usage(self) -> Dict[str, int]:
-        """
-        Get token usage from the last request
-
-        Returns:
-            Dict containing last request token usage:
-            - prompt_tokens: Tokens in last prompt
-            - completion_tokens: Tokens in last completion
-            - total_tokens: Total tokens in last request
-        """
+        """Get token usage from the last request"""
         pass

     @abstractmethod
     def get_model_info(self) -> Dict[str, Any]:
-        """
-        Get information about the current model
-
-        Returns:
-            Dict containing model information:
-            - name: Model name
-            - max_tokens: Maximum context length
-            - supports_streaming: Whether streaming is supported
-            - supports_functions: Whether function calling is supported
-        """
+        """Get information about the current model"""
         pass

     @abstractmethod
     async def close(self):
         """Cleanup resources and close connections"""
         pass
+
+    def get_last_usage_with_cost(self) -> Dict[str, Any]:
+        """Get last request usage with cost information"""
+        usage = self.get_last_token_usage()
+
+        # Calculate cost using provider
+        if hasattr(self.provider, 'calculate_cost'):
+            cost = getattr(self.provider, 'calculate_cost')(
+                self.model_name,
+                usage["prompt_tokens"],
+                usage["completion_tokens"]
+            )
+        else:
+            cost = 0.0
+
+        return {
+            **usage,
+            "cost_usd": cost,
+            "model": self.model_name,
+            "provider": getattr(self.provider, 'name', 'unknown')
+        }