isa-model 0.2.0__py3-none-any.whl → 0.2.9__py3-none-any.whl
This diff compares the contents of two publicly released versions of the package as they appear in their public registry. It is provided for informational purposes only.
- isa_model/__init__.py +1 -1
- isa_model/core/storage/hf_storage.py +419 -0
- isa_model/deployment/__init__.py +52 -0
- isa_model/deployment/core/__init__.py +34 -0
- isa_model/deployment/core/deployment_config.py +356 -0
- isa_model/deployment/core/deployment_manager.py +549 -0
- isa_model/deployment/core/isa_deployment_service.py +401 -0
- isa_model/eval/factory.py +381 -140
- isa_model/inference/ai_factory.py +142 -240
- isa_model/inference/providers/ml_provider.py +50 -0
- isa_model/inference/services/audio/openai_tts_service.py +104 -3
- isa_model/inference/services/embedding/base_embed_service.py +112 -0
- isa_model/inference/services/embedding/ollama_embed_service.py +28 -2
- isa_model/inference/services/llm/__init__.py +2 -0
- isa_model/inference/services/llm/base_llm_service.py +111 -1
- isa_model/inference/services/llm/ollama_llm_service.py +234 -26
- isa_model/inference/services/llm/openai_llm_service.py +243 -28
- isa_model/inference/services/llm/triton_llm_service.py +481 -0
- isa_model/inference/services/ml/base_ml_service.py +78 -0
- isa_model/inference/services/ml/sklearn_ml_service.py +140 -0
- isa_model/inference/services/vision/__init__.py +3 -3
- isa_model/inference/services/vision/base_image_gen_service.py +161 -0
- isa_model/inference/services/vision/base_vision_service.py +177 -0
- isa_model/inference/services/vision/ollama_vision_service.py +143 -17
- isa_model/inference/services/vision/replicate_image_gen_service.py +139 -7
- isa_model/training/__init__.py +62 -32
- isa_model/training/cloud/__init__.py +22 -0
- isa_model/training/cloud/job_orchestrator.py +402 -0
- isa_model/training/cloud/runpod_trainer.py +454 -0
- isa_model/training/cloud/storage_manager.py +482 -0
- isa_model/training/core/__init__.py +23 -0
- isa_model/training/core/config.py +181 -0
- isa_model/training/core/dataset.py +222 -0
- isa_model/training/core/trainer.py +720 -0
- isa_model/training/core/utils.py +213 -0
- isa_model/training/factory.py +229 -198
- isa_model-0.2.9.dist-info/METADATA +465 -0
- isa_model-0.2.9.dist-info/RECORD +86 -0
- isa_model/core/model_router.py +0 -226
- isa_model/core/model_version.py +0 -0
- isa_model/core/resource_manager.py +0 -202
- isa_model/deployment/gpu_fp16_ds8/models/deepseek_r1/1/model.py +0 -120
- isa_model/deployment/gpu_fp16_ds8/scripts/download_model.py +0 -18
- isa_model/training/engine/llama_factory/__init__.py +0 -39
- isa_model/training/engine/llama_factory/config.py +0 -115
- isa_model/training/engine/llama_factory/data_adapter.py +0 -284
- isa_model/training/engine/llama_factory/examples/__init__.py +0 -6
- isa_model/training/engine/llama_factory/examples/finetune_with_tracking.py +0 -185
- isa_model/training/engine/llama_factory/examples/rlhf_with_tracking.py +0 -163
- isa_model/training/engine/llama_factory/factory.py +0 -331
- isa_model/training/engine/llama_factory/rl.py +0 -254
- isa_model/training/engine/llama_factory/trainer.py +0 -171
- isa_model/training/image_model/configs/create_config.py +0 -37
- isa_model/training/image_model/configs/create_flux_config.py +0 -26
- isa_model/training/image_model/configs/create_lora_config.py +0 -21
- isa_model/training/image_model/prepare_massed_compute.py +0 -97
- isa_model/training/image_model/prepare_upload.py +0 -17
- isa_model/training/image_model/raw_data/create_captions.py +0 -16
- isa_model/training/image_model/raw_data/create_lora_captions.py +0 -20
- isa_model/training/image_model/raw_data/pre_processing.py +0 -200
- isa_model/training/image_model/train/train.py +0 -42
- isa_model/training/image_model/train/train_flux.py +0 -41
- isa_model/training/image_model/train/train_lora.py +0 -57
- isa_model/training/image_model/train_main.py +0 -25
- isa_model-0.2.0.dist-info/METADATA +0 -327
- isa_model-0.2.0.dist-info/RECORD +0 -92
- isa_model-0.2.0.dist-info/licenses/LICENSE +0 -21
- /isa_model/training/{llm_model/annotation → annotation}/annotation_schema.py +0 -0
- /isa_model/training/{llm_model/annotation → annotation}/processors/annotation_processor.py +0 -0
- /isa_model/training/{llm_model/annotation → annotation}/storage/dataset_manager.py +0 -0
- /isa_model/training/{llm_model/annotation → annotation}/storage/dataset_schema.py +0 -0
- /isa_model/training/{llm_model/annotation → annotation}/tests/test_annotation_flow.py +0 -0
- /isa_model/training/{llm_model/annotation → annotation}/tests/test_minio copy.py +0 -0
- /isa_model/training/{llm_model/annotation → annotation}/tests/test_minio_upload.py +0 -0
- /isa_model/training/{llm_model/annotation → annotation}/views/annotation_controller.py +0 -0
- {isa_model-0.2.0.dist-info → isa_model-0.2.9.dist-info}/WHEEL +0 -0
- {isa_model-0.2.0.dist-info → isa_model-0.2.9.dist-info}/top_level.txt +0 -0
isa_model/inference/services/llm/openai_llm_service.py

@@ -1,12 +1,13 @@
 import logging
 import os
-
+import json
+from typing import Dict, Any, List, Union, AsyncGenerator, Optional, Callable
 
 # Use the official OpenAI library and dotenv
 from openai import AsyncOpenAI
 from dotenv import load_dotenv
 
-from isa_model.inference.services.
+from isa_model.inference.services.llm.base_llm_service import BaseLLMService
 from isa_model.inference.providers.base_provider import BaseProvider
 
 # Load environment variables from .env.local
@@ -34,14 +35,103 @@ class OpenAILLMService(BaseLLMService):
             raise ValueError("OPENAI_API_KEY is not set.") from e
 
         self.last_token_usage = {"prompt_tokens": 0, "completion_tokens": 0, "total_tokens": 0}
+        self.total_token_usage = {"prompt_tokens": 0, "completion_tokens": 0, "total_tokens": 0, "requests_count": 0}
+
+        # Tool binding attributes
+        self._bound_tools: List[Dict[str, Any]] = []
+        self._tool_binding_kwargs: Dict[str, Any] = {}
+        self._tool_functions: Dict[str, Callable] = {}
+
         logger.info(f"Initialized OpenAILLMService with model {self.model_name} and endpoint {self.client.base_url}")
 
-
+    def _create_bound_copy(self) -> 'OpenAILLMService':
+        """Create a copy of this service for tool binding"""
+        bound_service = OpenAILLMService(self.provider, self.model_name)
+        bound_service._bound_tools = self._bound_tools.copy()
+        bound_service._tool_binding_kwargs = self._tool_binding_kwargs.copy()
+        bound_service._tool_functions = self._tool_functions.copy()
+        return bound_service
+
+    def bind_tools(self, tools: List[Union[Dict[str, Any], Callable]], **kwargs) -> 'OpenAILLMService':
+        """Bind tools to this LLM service for function calling"""
+        bound_service = self._create_bound_copy()
+        bound_service._bound_tools = self._convert_tools_to_schema(tools)
+        bound_service._tool_binding_kwargs = kwargs
+
+        # Store the actual functions for execution
+        for tool in tools:
+            if callable(tool):
+                bound_service._tool_functions[tool.__name__] = tool
+
+        return bound_service
+
+    async def ainvoke(self, prompt: Union[str, List[Any], Any]) -> str:
         """Universal invocation method"""
         if isinstance(prompt, str):
             return await self.acompletion(prompt)
         elif isinstance(prompt, list):
-
+            if not prompt:
+                raise ValueError("Empty message list provided")
+
+            # Check whether these are LangGraph message objects
+            first_msg = prompt[0]
+            if hasattr(first_msg, 'content') and hasattr(first_msg, 'type'):
+                # Convert LangGraph message objects to the standard format
+                converted_messages = []
+                for msg in prompt:
+                    if hasattr(msg, 'type') and hasattr(msg, 'content'):
+                        # LangGraph message object
+                        msg_dict = {"content": msg.content}
+
+                        # Set the role according to the message type
+                        if msg.type == "system":
+                            msg_dict["role"] = "system"
+                        elif msg.type == "human":
+                            msg_dict["role"] = "user"
+                        elif msg.type == "ai":
+                            msg_dict["role"] = "assistant"
+                            # Handle tool calls
+                            if hasattr(msg, 'tool_calls') and msg.tool_calls:
+                                msg_dict["tool_calls"] = [
+                                    {
+                                        "id": tc.get("id", f"call_{i}"),
+                                        "type": "function",
+                                        "function": {
+                                            "name": tc["name"],
+                                            "arguments": json.dumps(tc["args"])
+                                        }
+                                    } for i, tc in enumerate(msg.tool_calls)
+                                ]
+                        elif msg.type == "tool":
+                            msg_dict["role"] = "tool"
+                            if hasattr(msg, 'tool_call_id'):
+                                msg_dict["tool_call_id"] = msg.tool_call_id
+                        else:
+                            msg_dict["role"] = "user"  # Default to a user message
+
+                        converted_messages.append(msg_dict)
+                    elif isinstance(msg, dict):
+                        # Already in dict format
+                        converted_messages.append(msg)
+                    else:
+                        # Handle other types (e.g. strings)
+                        converted_messages.append({"role": "user", "content": str(msg)})
+
+                return await self.achat(converted_messages)
+            elif isinstance(first_msg, dict):
+                # Messages already in the standard dict format
+                return await self.achat(prompt)
+            else:
+                # Handle other formats, such as a list of strings
+                converted_messages = []
+                for msg in prompt:
+                    if isinstance(msg, str):
+                        converted_messages.append({"role": "user", "content": msg})
+                    elif isinstance(msg, dict):
+                        converted_messages.append(msg)
+                    else:
+                        converted_messages.append({"role": "user", "content": str(msg)})
+                return await self.achat(converted_messages)
         else:
             raise ValueError("Prompt must be a string or a list of messages")
 
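The new `bind_tools` follows the LangChain convention: it returns a bound copy carrying the tool schemas plus the callables themselves, leaving the original service tool-free. A minimal usage sketch; the provider value and the `get_weather` tool are illustrative assumptions, not part of this diff:

```python
import asyncio

from isa_model.inference.services.llm.openai_llm_service import OpenAILLMService

def get_weather(city: str) -> str:
    """Illustrative tool: return a canned weather report."""
    return f"It is sunny in {city}."

async def main() -> None:
    provider = ...  # a BaseProvider instance; its construction is not shown in this diff
    service = OpenAILLMService(provider, "gpt-4o-mini")  # hypothetical model name

    # bind_tools returns a bound copy; `service` itself stays unbound.
    bound = service.bind_tools([get_weather])

    # ainvoke accepts a plain string, a list of dicts, or LangGraph messages.
    print(await bound.ainvoke("What's the weather in Paris?"))

asyncio.run(main())
```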
@@ -51,12 +141,19 @@ class OpenAILLMService(BaseLLMService):
             temperature = self.config.get("temperature", 0.7)
             max_tokens = self.config.get("max_tokens", 1024)
 
-            response = await self.client.chat.completions.create(
-                model=self.model_name,
-                messages=messages,
-                temperature=temperature,
-                max_tokens=max_tokens
-            )
+            kwargs = {
+                "model": self.model_name,
+                "messages": messages,
+                "temperature": temperature,
+                "max_tokens": max_tokens
+            }
+
+            # Add tools if bound
+            if self._has_bound_tools():
+                kwargs["tools"] = self._get_bound_tools()
+                kwargs["tool_choice"] = "auto"
+
+            response = await self.client.chat.completions.create(**kwargs)
 
             if response.usage:
                 self.last_token_usage = {
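When tools are bound, each request now carries `tools` and `tool_choice="auto"`, the stock Chat Completions shape. A standalone sketch of the request this builds; the function schema shown is the standard OpenAI format that `_convert_tools_to_schema` (defined in the base class, not visible in this diff) presumably emits:

```python
from openai import AsyncOpenAI

# Standard OpenAI function-tool schema (assumed output of _convert_tools_to_schema).
WEATHER_TOOL = {
    "type": "function",
    "function": {
        "name": "get_weather",
        "description": "Return the weather for a city.",
        "parameters": {
            "type": "object",
            "properties": {"city": {"type": "string"}},
            "required": ["city"],
        },
    },
}

async def demo() -> None:
    client = AsyncOpenAI()  # reads OPENAI_API_KEY from the environment
    kwargs = {
        "model": "gpt-4o-mini",  # hypothetical model name
        "messages": [{"role": "user", "content": "Weather in Paris?"}],
        "temperature": 0.7,
        "max_tokens": 1024,
        # Added only when tools are bound:
        "tools": [WEATHER_TOOL],
        "tool_choice": "auto",
    }
    response = await client.chat.completions.create(**kwargs)
    print(response.choices[0].message)
```

Note that `tool_choice="auto"` is already the API default once `tools` is present, so the explicit assignment is harmless but redundant.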
@@ -64,13 +161,87 @@ class OpenAILLMService(BaseLLMService):
                     "completion_tokens": response.usage.completion_tokens,
                     "total_tokens": response.usage.total_tokens
                 }
+
+                # Update total usage
+                self.total_token_usage["prompt_tokens"] += self.last_token_usage["prompt_tokens"]
+                self.total_token_usage["completion_tokens"] += self.last_token_usage["completion_tokens"]
+                self.total_token_usage["total_tokens"] += self.last_token_usage["total_tokens"]
+                self.total_token_usage["requests_count"] += 1
 
-            return response.choices[0].message.content or ""
+            # Handle tool calls if present
+            message = response.choices[0].message
+            if message.tool_calls:
+                return await self._handle_tool_calls(message, messages)
+
+            return message.content or ""
 
         except Exception as e:
             logger.error(f"Error in chat completion: {e}")
             raise
 
+    async def _handle_tool_calls(self, assistant_message, original_messages: List[Dict[str, str]]) -> str:
+        """Handle tool calls from the assistant"""
+        # Add assistant message with tool calls to conversation
+        messages = original_messages + [{
+            "role": "assistant",
+            "content": assistant_message.content or "",
+            "tool_calls": [
+                {
+                    "id": tc.id,
+                    "type": tc.type,
+                    "function": {
+                        "name": tc.function.name,
+                        "arguments": tc.function.arguments
+                    }
+                } for tc in assistant_message.tool_calls
+            ]
+        }]
+
+        # Execute each tool call
+        for tool_call in assistant_message.tool_calls:
+            function_name = tool_call.function.name
+            arguments = json.loads(tool_call.function.arguments)
+
+            try:
+                # Execute the tool
+                if function_name in self._tool_functions:
+                    result = self._tool_functions[function_name](**arguments)
+                    if hasattr(result, '__await__'):  # Handle async functions
+                        result = await result
+                else:
+                    result = f"Error: Function {function_name} not found"
+
+                # Add tool result to messages
+                messages.append({
+                    "role": "tool",
+                    "content": str(result),
+                    "tool_call_id": tool_call.id
+                })
+
+            except Exception as e:
+                logger.error(f"Error executing tool {function_name}: {e}")
+                messages.append({
+                    "role": "tool",
+                    "content": f"Error executing {function_name}: {str(e)}",
+                    "tool_call_id": tool_call.id
+                })
+
+        # Get final response from the model with all context
+        try:
+            kwargs = {
+                "model": self.model_name,
+                "messages": messages,
+                "temperature": self.config.get("temperature", 0.7),
+                "max_tokens": self.config.get("max_tokens", 1024)
+            }
+
+            response = await self.client.chat.completions.create(**kwargs)
+            return response.choices[0].message.content or ""
+
+        except Exception as e:
+            logger.error(f"Error getting final response after tool calls: {e}")
+            raise
+
     async def acompletion(self, prompt: str) -> str:
         """Text completion method (using chat API)"""
         messages = [{"role": "user", "content": prompt}]
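`_handle_tool_calls` implements the standard OpenAI function-calling round trip: the assistant's `tool_calls` are echoed back into the conversation, each tool is executed locally, its result is appended as a `role: "tool"` message keyed by `tool_call_id`, and a second completion produces the final answer. With hypothetical values, the conversation it assembles just before the follow-up request looks like this:

```python
messages = [
    {"role": "user", "content": "What's the weather in Paris?"},
    {"role": "assistant", "content": "", "tool_calls": [{
        "id": "call_0",
        "type": "function",
        "function": {"name": "get_weather", "arguments": '{"city": "Paris"}'},
    }]},
    {"role": "tool", "content": "It is sunny in Paris.", "tool_call_id": "call_0"},
]
# A second chat.completions.create(...) over these messages yields the
# final natural-language answer.
```

One design note: the `hasattr(result, '__await__')` check lets the same loop run both sync and async tool functions; `inspect.isawaitable(result)` expresses the same intent more idiomatically.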
@@ -82,13 +253,20 @@ class OpenAILLMService(BaseLLMService):
             temperature = self.config.get("temperature", 0.7)
             max_tokens = self.config.get("max_tokens", 1024)
 
-            response = await self.client.chat.completions.create(
-                model=self.model_name,
-                messages=messages,
-                temperature=temperature,
-                max_tokens=max_tokens,
-                n=n
-            )
+            kwargs = {
+                "model": self.model_name,
+                "messages": messages,
+                "temperature": temperature,
+                "max_tokens": max_tokens,
+                "n": n
+            }
+
+            # Add tools if bound
+            if self._has_bound_tools():
+                kwargs["tools"] = self._get_bound_tools()
+                kwargs["tool_choice"] = "auto"
+
+            response = await self.client.chat.completions.create(**kwargs)
 
             if response.usage:
                 self.last_token_usage = {
@@ -96,6 +274,12 @@ class OpenAILLMService(BaseLLMService):
                     "completion_tokens": response.usage.completion_tokens,
                     "total_tokens": response.usage.total_tokens
                 }
+
+                # Update total usage
+                self.total_token_usage["prompt_tokens"] += self.last_token_usage["prompt_tokens"]
+                self.total_token_usage["completion_tokens"] += self.last_token_usage["completion_tokens"]
+                self.total_token_usage["total_tokens"] += self.last_token_usage["total_tokens"]
+                self.total_token_usage["requests_count"] += 1
 
             return [choice.message.content or "" for choice in response.choices]
         except Exception as e:
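Both request paths now fold the per-request numbers into a running `total_token_usage` counter that also tracks `requests_count`. A small sketch of reading the stats; `service` is any constructed `OpenAILLMService`, and the values are illustrative:

```python
usage = service.get_token_usage()
# e.g. {"prompt_tokens": 91, "completion_tokens": 130,
#       "total_tokens": 221, "requests_count": 3}

# Average tokens per request, guarding against division by zero:
avg = usage["total_tokens"] / max(usage["requests_count"], 1)
```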
@@ -108,13 +292,20 @@ class OpenAILLMService(BaseLLMService):
             temperature = self.config.get("temperature", 0.7)
             max_tokens = self.config.get("max_tokens", 1024)
 
-            stream = await self.client.chat.completions.create(
-                model=self.model_name,
-                messages=messages,
-                temperature=temperature,
-                max_tokens=max_tokens,
-                stream=True
-            )
+            kwargs = {
+                "model": self.model_name,
+                "messages": messages,
+                "temperature": temperature,
+                "max_tokens": max_tokens,
+                "stream": True
+            }
+
+            # Add tools if bound
+            if self._has_bound_tools():
+                kwargs["tools"] = self._get_bound_tools()
+                kwargs["tool_choice"] = "auto"
+
+            stream = await self.client.chat.completions.create(**kwargs)
 
             async for chunk in stream:
                 content = chunk.choices[0].delta.content
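The streaming path builds the same kwargs dict, adds `stream=True`, and iterates the returned stream for delta content. A minimal consumer sketch; it assumes a constructed service and uses `astream_chat`, the method shown in these hunks:

```python
async def print_stream(service) -> None:
    messages = [{"role": "user", "content": "Tell me a short joke."}]
    async for chunk in service.astream_chat(messages):
        # Each chunk is assumed to be a piece of delta text from the stream.
        print(chunk, end="", flush=True)
```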
@@ -125,14 +316,38 @@ class OpenAILLMService(BaseLLMService):
             logger.error(f"Error in stream chat: {e}")
             raise
 
-    def
+    async def astream_completion(self, prompt: str) -> AsyncGenerator[str, None]:
+        """Stream completion responses"""
+        messages = [{"role": "user", "content": prompt}]
+        async for chunk in self.astream_chat(messages):
+            yield chunk
+
+    def get_token_usage(self) -> Dict[str, Any]:
         """Get total token usage statistics"""
-        return self.
+        return self.total_token_usage
 
     def get_last_token_usage(self) -> Dict[str, int]:
         """Get token usage from last request"""
         return self.last_token_usage
+
+    def get_model_info(self) -> Dict[str, Any]:
+        """Get information about the current model"""
+        return {
+            "name": self.model_name,
+            "max_tokens": self.config.get("max_tokens", 1024),
+            "supports_streaming": True,
+            "supports_functions": True,
+            "provider": "openai"
+        }
+
+    def _has_bound_tools(self) -> bool:
+        """Check if this service has bound tools"""
+        return bool(self._bound_tools)
+
+    def _get_bound_tools(self) -> List[Dict[str, Any]]:
+        """Get the bound tools schema"""
+        return self._bound_tools
 
     async def close(self):
         """Close the backend client"""
-        await self.client.
+        await self.client.close()