PyPI - isa-model - Versions diffs - 0.1.0__py3-none-any.whl - Mend

isa-model 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (117) hide show

isa_model/__init__.py +5 -0
isa_model/core/model_manager.py +143 -0
isa_model/core/model_registry.py +115 -0
isa_model/core/model_router.py +226 -0
isa_model/core/model_storage.py +133 -0
isa_model/core/model_version.py +0 -0
isa_model/core/resource_manager.py +202 -0
isa_model/core/storage/hf_storage.py +0 -0
isa_model/core/storage/local_storage.py +0 -0
isa_model/core/storage/minio_storage.py +0 -0
isa_model/deployment/mlflow_gateway/__init__.py +8 -0
isa_model/deployment/mlflow_gateway/start_gateway.py +65 -0
isa_model/deployment/unified_multimodal_client.py +341 -0
isa_model/inference/__init__.py +11 -0
isa_model/inference/adapter/triton_adapter.py +453 -0
isa_model/inference/adapter/unified_api.py +248 -0
isa_model/inference/ai_factory.py +354 -0
isa_model/inference/backends/Pytorch/bge_embed_backend.py +188 -0
isa_model/inference/backends/Pytorch/gemma_backend.py +167 -0
isa_model/inference/backends/Pytorch/llama_backend.py +166 -0
isa_model/inference/backends/Pytorch/whisper_backend.py +194 -0
isa_model/inference/backends/__init__.py +53 -0
isa_model/inference/backends/base_backend_client.py +26 -0
isa_model/inference/backends/container_services.py +104 -0
isa_model/inference/backends/local_services.py +72 -0
isa_model/inference/backends/openai_client.py +130 -0
isa_model/inference/backends/replicate_client.py +197 -0
isa_model/inference/backends/third_party_services.py +239 -0
isa_model/inference/backends/triton_client.py +97 -0
isa_model/inference/base.py +46 -0
isa_model/inference/client_sdk/__init__.py +0 -0
isa_model/inference/client_sdk/client.py +134 -0
isa_model/inference/client_sdk/client_data_std.py +34 -0
isa_model/inference/client_sdk/client_sdk_schema.py +16 -0
isa_model/inference/client_sdk/exceptions.py +0 -0
isa_model/inference/engine/triton/model_repository/bge/1/model.py +174 -0
isa_model/inference/engine/triton/model_repository/gemma/1/model.py +250 -0
isa_model/inference/engine/triton/model_repository/llama/1/model.py +76 -0
isa_model/inference/engine/triton/model_repository/whisper/1/model.py +195 -0
isa_model/inference/providers/__init__.py +19 -0
isa_model/inference/providers/base_provider.py +30 -0
isa_model/inference/providers/model_cache_manager.py +341 -0
isa_model/inference/providers/ollama_provider.py +73 -0
isa_model/inference/providers/openai_provider.py +87 -0
isa_model/inference/providers/replicate_provider.py +94 -0
isa_model/inference/providers/triton_provider.py +439 -0
isa_model/inference/providers/vllm_provider.py +0 -0
isa_model/inference/providers/yyds_provider.py +83 -0
isa_model/inference/services/__init__.py +14 -0
isa_model/inference/services/audio/fish_speech/handler.py +215 -0
isa_model/inference/services/audio/runpod_tts_fish_service.py +212 -0
isa_model/inference/services/audio/triton_speech_service.py +138 -0
isa_model/inference/services/audio/whisper_service.py +186 -0
isa_model/inference/services/audio/yyds_audio_service.py +71 -0
isa_model/inference/services/base_service.py +106 -0
isa_model/inference/services/base_tts_service.py +66 -0
isa_model/inference/services/embedding/bge_service.py +183 -0
isa_model/inference/services/embedding/ollama_embed_service.py +85 -0
isa_model/inference/services/embedding/ollama_rerank_service.py +118 -0
isa_model/inference/services/embedding/onnx_rerank_service.py +73 -0
isa_model/inference/services/llm/__init__.py +16 -0
isa_model/inference/services/llm/gemma_service.py +143 -0
isa_model/inference/services/llm/llama_service.py +143 -0
isa_model/inference/services/llm/ollama_llm_service.py +108 -0
isa_model/inference/services/llm/openai_llm_service.py +129 -0
isa_model/inference/services/llm/replicate_llm_service.py +179 -0
isa_model/inference/services/llm/triton_llm_service.py +230 -0
isa_model/inference/services/others/table_transformer_service.py +61 -0
isa_model/inference/services/vision/__init__.py +12 -0
isa_model/inference/services/vision/helpers/image_utils.py +58 -0
isa_model/inference/services/vision/helpers/text_splitter.py +46 -0
isa_model/inference/services/vision/ollama_vision_service.py +60 -0
isa_model/inference/services/vision/replicate_vision_service.py +241 -0
isa_model/inference/services/vision/triton_vision_service.py +199 -0
isa_model/inference/services/vision/yyds_vision_service.py +80 -0
isa_model/inference/utils/conversion/bge_rerank_convert.py +73 -0
isa_model/inference/utils/conversion/onnx_converter.py +0 -0
isa_model/inference/utils/conversion/torch_converter.py +0 -0
isa_model/scripts/inference_tracker.py +283 -0
isa_model/scripts/mlflow_manager.py +379 -0
isa_model/scripts/model_registry.py +465 -0
isa_model/scripts/start_mlflow.py +95 -0
isa_model/scripts/training_tracker.py +257 -0
isa_model/training/engine/llama_factory/__init__.py +39 -0
isa_model/training/engine/llama_factory/config.py +115 -0
isa_model/training/engine/llama_factory/data_adapter.py +284 -0
isa_model/training/engine/llama_factory/examples/__init__.py +6 -0
isa_model/training/engine/llama_factory/examples/finetune_with_tracking.py +185 -0
isa_model/training/engine/llama_factory/examples/rlhf_with_tracking.py +163 -0
isa_model/training/engine/llama_factory/factory.py +331 -0
isa_model/training/engine/llama_factory/rl.py +254 -0
isa_model/training/engine/llama_factory/trainer.py +171 -0
isa_model/training/image_model/configs/create_config.py +37 -0
isa_model/training/image_model/configs/create_flux_config.py +26 -0
isa_model/training/image_model/configs/create_lora_config.py +21 -0
isa_model/training/image_model/prepare_massed_compute.py +97 -0
isa_model/training/image_model/prepare_upload.py +17 -0
isa_model/training/image_model/raw_data/create_captions.py +16 -0
isa_model/training/image_model/raw_data/create_lora_captions.py +20 -0
isa_model/training/image_model/raw_data/pre_processing.py +200 -0
isa_model/training/image_model/train/train.py +42 -0
isa_model/training/image_model/train/train_flux.py +41 -0
isa_model/training/image_model/train/train_lora.py +57 -0
isa_model/training/image_model/train_main.py +25 -0
isa_model/training/llm_model/annotation/annotation_schema.py +47 -0
isa_model/training/llm_model/annotation/processors/annotation_processor.py +126 -0
isa_model/training/llm_model/annotation/storage/dataset_manager.py +131 -0
isa_model/training/llm_model/annotation/storage/dataset_schema.py +44 -0
isa_model/training/llm_model/annotation/tests/test_annotation_flow.py +109 -0
isa_model/training/llm_model/annotation/tests/test_minio copy.py +113 -0
isa_model/training/llm_model/annotation/tests/test_minio_upload.py +43 -0
isa_model/training/llm_model/annotation/views/annotation_controller.py +158 -0
isa_model-0.1.0.dist-info/METADATA +116 -0
isa_model-0.1.0.dist-info/RECORD +117 -0
isa_model-0.1.0.dist-info/WHEEL +5 -0
isa_model-0.1.0.dist-info/licenses/LICENSE +21 -0
isa_model-0.1.0.dist-info/top_level.txt +1 -0

isa_model/training/llm_model/annotation/storage/dataset_schema.py ADDED Viewed

@@ -0,0 +1,44 @@
+# app/services/llm_model/annotation/dataset/dataset_schema.py
+from enum import Enum
+from pydantic import BaseModel, Field
+from typing import Dict, List, Optional
+from datetime import datetime
+from bson import ObjectId
+class DatasetType(str, Enum):  # kinds of training dataset; the str mixin lets members compare equal to their plain string values
+    SFT = "sft"  # presumably supervised fine-tuning data - confirm against the dataset manager
+    RLHF = "rlhf"  # presumably preference / RLHF data - confirm against the dataset manager
+class DatasetStatus(str, Enum):  # lifecycle marker stored in Dataset.status; members compare equal to their string values
+    PENDING = "pending"
+    PROCESSING = "processing"
+    READY = "ready"
+    ERROR = "error"
+class DatasetFiles(BaseModel):
+    train: str
+    eval: Optional[str]
+    test: Optional[str]
+class DatasetStats(BaseModel):
+    total_examples: int
+    avg_length: Optional[float]
+    num_conversations: Optional[int]
+    additional_metrics: Optional[Dict] = {}
+class Dataset(BaseModel):  # record describing one stored training dataset
+    id: Optional[ObjectId] = Field(None, alias="_id")  # populated from the "_id" key; None when absent
+    name: str
+    type: DatasetType
+    version: str
+    storage_path: str
+    files: DatasetFiles
+    stats: DatasetStats
+    source_annotations: List[str]  # presumably ids of the annotations the dataset was built from - confirm
+    created_at: datetime
+    status: DatasetStatus
+    metadata: Optional[Dict] = {}
+    class Config:  # pydantic model configuration
+        arbitrary_types_allowed = True  # needed because bson.ObjectId is not a type pydantic knows natively
+        populate_by_name = True  # accept the field name "id" as well as its alias "_id"

isa_model/training/llm_model/annotation/tests/test_annotation_flow.py ADDED Viewed

@@ -0,0 +1,109 @@
+# test_annotation_flow.py
+import os
+os.environ["ENV"] = "local"
+import asyncio
+from datetime import datetime
+from bson import ObjectId
+from app.services.llm_model.annotation.views.annotation_controller import AnnotationController
+from app.services.llm_model.annotation.processors.annotation_processor import AnnotationProcessor
+from app.services.llm_model.annotation.annotation_schema import (
+    AnnotationFeedback,
+    RatingScale,
+    AnnotationType,
+    AnnotationAspects,
+    BetterResponse
+)
+from app.config.config_manager import config_manager
+async def setup_test_data():
+    """Setup initial test data in MongoDB"""
+    db = await config_manager.get_db('mongodb')
+    # Create a test annotation
+    test_annotation = {
+        "_id": ObjectId(),
+        "project_name": "test_project",
+        "items": [{
+            "item_id": "test_item_1",
+            "input": {
+                "messages": [{
+                    "role": "user",
+                    "content": "What is the capital of France?"
+                }]
+            },
+            "output": {
+                "content": "The capital of France is Paris."
+            },
+            "status": "pending"
+        }],
+        "created_at": datetime.utcnow().isoformat()
+    }
+    await db['annotations'].insert_one(test_annotation)
+    return test_annotation
+async def test_annotation_flow():
+    """Test the complete annotation flow"""
+    try:
+        # Initialize controllers
+        annotation_controller = AnnotationController()
+        annotation_processor = AnnotationProcessor()
+        # Setup test data
+        test_data = await setup_test_data()
+        annotation_id = str(test_data["_id"])
+        item_id = test_data["items"][0]["item_id"]
+        print("1. Created test annotation")
+        # Create test feedback
+        feedback = AnnotationFeedback(
+            rating=RatingScale.EXCELLENT,
+            category=AnnotationType.ACCURACY,
+            aspects=AnnotationAspects(
+                factually_correct=True,
+                relevant=True,
+                harmful=False,
+                biased=False,
+                complete=True,
+                efficient=True
+            ),
+            better_response=BetterResponse(
+                content="Paris is the capital city of France, known for its iconic Eiffel Tower.",
+                reason="Added more context and detail"
+            ),
+            comment="Good response, but could be more detailed"
+        )
+        # Submit annotation
+        result = await annotation_controller.submit_annotation(
+            annotation_id=annotation_id,
+            item_id=item_id,
+            feedback=feedback,
+            annotator_id="test_annotator"
+        )
+        print("2. Submitted annotation:", result)
+        # Process annotation queue
+        await annotation_processor.process_queue()
+        print("3. Processed annotation queue")
+        # Verify dataset creation
+        db = await config_manager.get_db('mongodb')
+        datasets = await db['training_datasets'].find().to_list(length=10)
+        print("\nCreated Datasets:")
+        for dataset in datasets:
+            print(f"- {dataset['name']} ({dataset['type']})")
+            print(f"  Status: {dataset['status']}")
+            print(f"  Examples: {dataset['stats']['total_examples']}")
+    except Exception as e:
+        print(f"Error during test: {e}")
+if __name__ == "__main__":
+    # Script entry point: drive the async flow to completion on a fresh event loop
+    print("Starting annotation flow test...")
+    asyncio.run(test_annotation_flow())

isa_model/training/llm_model/annotation/tests/test_minio copy.py ADDED Viewed

@@ -0,0 +1,113 @@
+#!/usr/bin/env python3
+import os
+from minio import Minio
+import json
+import logging
+from io import BytesIO
+# Configure logging
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+def test_minio():
+    try:
+        # Get MinIO host from environment variable or use default
+        minio_host = os.getenv("MINIO_HOST", "localhost:9000")
+        logger.info(f"Using MinIO host: {minio_host}")
+        # 1. Create MinIO client
+        logger.info("Creating MinIO client...")
+        client = Minio(
+            minio_host,
+            access_key="minioadmin",
+            secret_key="minioadmin",
+            secure=False
+        )
+        # 2. Test bucket operations
+        bucket_name = "knowledge-files"  # Changed to match the actual bucket name
+        logger.info(f"Testing bucket operations with {bucket_name}...")
+        # Create bucket if it doesn't exist
+        if not client.bucket_exists(bucket_name):
+            client.make_bucket(bucket_name)
+            logger.info(f"Created new bucket: {bucket_name}")
+        else:
+            logger.info(f"Using existing bucket: {bucket_name}")
+        # Set bucket policy - allow all operations
+        policy = {
+            "Version": "2012-10-17",
+            "Statement": [
+                {
+                    "Effect": "Allow",
+                    "Principal": {"AWS": ["*"]},
+                    "Action": [
+                        "s3:GetBucketLocation",
+                        "s3:ListBucket",
+                        "s3:ListBucketMultipartUploads"
+                    ],
+                    "Resource": [f"arn:aws:s3:::{bucket_name}"]
+                },
+                {
+                    "Effect": "Allow",
+                    "Principal": {"AWS": ["*"]},
+                    "Action": [
+                        "s3:AbortMultipartUpload",
+                        "s3:DeleteObject",
+                        "s3:GetObject",
+                        "s3:ListMultipartUploadParts",
+                        "s3:PutObject"
+                    ],
+                    "Resource": [f"arn:aws:s3:::{bucket_name}/*"]
+                }
+            ]
+        }
+        try:
+            client.set_bucket_policy(bucket_name, json.dumps(policy))
+            logger.info("Set bucket policy successfully")
+        except Exception as e:
+            logger.warning(f"Failed to set bucket policy: {e}")
+        # 3. Test file upload
+        source_file = "init-scripts/files/haley_system.txt"
+        object_name = "haley_system.txt"
+        if os.path.exists(source_file):
+            # Get file size
+            file_size = os.path.getsize(source_file)
+            logger.info(f"Found source file: {source_file} (size: {file_size} bytes)")
+            # Upload file
+            with open(source_file, 'rb') as file_data:
+                client.put_object(
+                    bucket_name,
+                    object_name,
+                    file_data,
+                    file_size,
+                    content_type="text/plain"
+                )
+            logger.info(f"Uploaded file: {object_name}")
+            # 4. Test file download
+            data = client.get_object(bucket_name, object_name)
+            content = data.read().decode('utf-8')
+            logger.info(f"Successfully downloaded file. First 100 chars: {content[:100]}...")
+            # 5. Verify file exists
+            stat = client.stat_object(bucket_name, object_name)
+            logger.info(f"File stats: {stat}")
+            logger.info("Test completed successfully!")
+        else:
+            logger.error(f"Source file not found: {source_file}")
+            raise FileNotFoundError(f"Source file not found: {source_file}")
+    except Exception as e:
+        logger.error(f"Test failed: {str(e)}")
+        raise
+if __name__ == "__main__":  # allow running the check directly as a script
+    test_minio()

isa_model/training/llm_model/annotation/tests/test_minio_upload.py ADDED Viewed

@@ -0,0 +1,43 @@
+#!/usr/bin/env python3
+import os
+from minio import Minio
+import io
+# MinIO client setup
+client = Minio(
+    "localhost:9000",
+    access_key="minioadmin",
+    secret_key="minioadmin",
+    secure=False
+)
+# Test bucket name
+bucket_name = "test-bucket"
+# Create bucket if not exists
+if not client.bucket_exists(bucket_name):
+    client.make_bucket(bucket_name)
+    print(f"Created bucket: {bucket_name}")
+else:
+    print(f"Bucket already exists: {bucket_name}")
+# Upload test file
+source_file = "init-scripts/files/haley_system.txt"
+if os.path.exists(source_file):
+    with open(source_file, 'rb') as file_data:
+        content = file_data.read()
+        # Upload file
+        client.put_object(
+            bucket_name,
+            "haley_system.txt",
+            io.BytesIO(content),
+            len(content),
+            content_type="text/plain"
+        )
+        print(f"Successfully uploaded {source_file}")
+        # Verify upload
+        stat = client.stat_object(bucket_name, "haley_system.txt")
+        print(f"File stats: {stat}")
+else:
+    print(f"Source file not found: {source_file}")

isa_model/training/llm_model/annotation/views/annotation_controller.py ADDED Viewed

@@ -0,0 +1,158 @@
+# app/services/llm_model/tracing/annotation/annotation_controller.py
+from typing import Dict, Any, List, Optional
+from datetime import datetime
+from bson import ObjectId
+from app.config.config_manager import config_manager
+from app.services.training.llm_model.annotation.annotation_schema import AnnotationFeedback, RatingScale
+from app.services.training.llm_model.annotation.storage.dataset_manager import DatasetManager
+class AnnotationController:
+    def __init__(self):
+        self.logger = config_manager.get_logger(__name__)
+    async def get_pending_annotations(
+        self,
+        project_name: str,
+        category: Optional[str] = None,
+        min_rating: Optional[int] = None,
+        page: int = 1,
+        limit: int = 10
+    ) -> Dict[str, Any]:
+        """Get filtered list of pending annotations"""
+        db = await config_manager.get_db('mongodb')
+        collection = db['annotations']
+        # Build query with filters
+        query = {"status": "pending", "project_name": project_name}
+        if category:
+            query["annotation_type"] = category
+        if min_rating:
+            query["items.feedback.rating"] = {"$gte": min_rating}
+        annotations = await collection.find(query)\
+            .sort("created_at", -1)\
+            .skip((page - 1) * limit)\
+            .limit(limit)\
+            .to_list(length=limit)
+        return {
+            "annotations": annotations,
+            "pagination": {
+                "page": page,
+                "limit": limit,
+                "total": await collection.count_documents(query)
+            }
+        }
+    async def submit_annotation(
+        self,
+        annotation_id: str,
+        item_id: str,
+        feedback: AnnotationFeedback,
+        annotator_id: str
+    ) -> Dict[str, Any]:
+        """Submit and process annotation feedback"""
+        db = await config_manager.get_db('mongodb')
+        collection = db['annotations']
+        # Determine if annotation should be selected for training
+        is_selected = self._evaluate_for_training(feedback)
+        feedback_dict = feedback.dict()
+        feedback_dict["is_selected_for_training"] = is_selected
+        # Update annotation
+        result = await collection.update_one(
+            {
+                "_id": ObjectId(annotation_id),
+                "items.item_id": item_id
+            },
+            {
+                "$set": {
+                    "items.$.feedback": feedback_dict,
+                    "items.$.status": "completed",
+                    "items.$.annotated_at": datetime.utcnow().isoformat(),
+                    "items.$.annotator_id": annotator_id,
+                    "items.$.training_status": "pending" if is_selected else "none"
+                }
+            }
+        )
+        # Process for training if selected
+        if is_selected:
+            await self._queue_for_training(annotation_id, item_id, feedback)
+        return {
+            "status": "success",
+            "selected_for_training": is_selected,
+            "message": "Annotation submitted successfully"
+        }
+    def _evaluate_for_training(self, feedback: AnnotationFeedback) -> bool:
+        """Evaluate if annotation should be used for training"""
+        # Select for SFT if rating is excellent and aspects are positive
+        if feedback.rating == RatingScale.EXCELLENT:
+            aspects = feedback.aspects
+            if all([
+                aspects.factually_correct,
+                aspects.relevant,
+                not aspects.harmful,
+                not aspects.biased
+            ]):
+                return True
+        # Select for RLHF if better response is provided
+        if feedback.better_response:
+            return True
+        return False
+    async def _queue_for_training(
+        self,
+        annotation_id: str,
+        item_id: str,
+        feedback: AnnotationFeedback
+    ):
+        """Queue selected annotations for training data generation"""
+        db = await config_manager.get_db('mongodb')
+        training_queue = db['training_queue']
+        await training_queue.insert_one({
+            "annotation_id": annotation_id,
+            "item_id": item_id,
+            "type": "sft" if feedback.rating == RatingScale.EXCELLENT else "rlhf",
+            "feedback": feedback.dict(),
+            "status": "pending",
+            "created_at": datetime.utcnow().isoformat()
+        })
+class DatasetPreparationProcessor:
+    def __init__(self):
+        self.logger = config_manager.get_logger(__name__)
+        self.dataset_manager = DatasetManager()
+        self.batch_size = 1000  # Configure as needed
+    async def process_annotation_queue(self) -> None:
+        """Process pending annotations and prepare datasets"""
+        db = await config_manager.get_db('mongodb')
+        annotation_queue = db['dataset_preparation_queue']
+        # Process items for SFT dataset
+        sft_items = await self._get_pending_annotations("sft")
+        if len(sft_items) >= self.batch_size:
+            await self._create_sft_dataset(sft_items)
+        # Process items for RLHF dataset
+        rlhf_items = await self._get_pending_annotations("rlhf")
+        if len(rlhf_items) >= self.batch_size:
+            await self._create_rlhf_dataset(rlhf_items)
+    async def _get_pending_annotations(self, dataset_type: str) -> List[Dict[str, Any]]:
+        """Get pending annotations for dataset preparation"""
+        db = await config_manager.get_db('mongodb')
+        queue = db['dataset_preparation_queue']
+        return await queue.find({
+            "status": "pending",
+            "dataset_type": dataset_type
+        }).to_list(length=self.batch_size)

isa_model-0.1.0.dist-info/METADATA ADDED Viewed

@@ -0,0 +1,116 @@
+Metadata-Version: 2.4
+Name: isa-model
+Version: 0.1.0
+Summary: Unified AI model serving framework
+Author-email: isA_Model Contributors <your.email@example.com>
+License: MIT
+Classifier: Development Status :: 3 - Alpha
+Classifier: Intended Audience :: Developers
+Classifier: Operating System :: OS Independent
+Classifier: Programming Language :: Python :: 3
+Classifier: License :: OSI Approved :: MIT License
+Requires-Python: >=3.8
+Description-Content-Type: text/markdown
+License-File: LICENSE
+Requires-Dist: fastapi>=0.95.0
+Requires-Dist: numpy>=1.20.0
+Requires-Dist: httpx>=0.23.0
+Requires-Dist: pydantic>=2.0.0
+Requires-Dist: uvicorn>=0.22.0
+Requires-Dist: requests>=2.28.0
+Requires-Dist: aiohttp>=3.8.0
+Requires-Dist: transformers>=4.30.0
+Requires-Dist: langchain-core>=0.1.0
+Requires-Dist: tritonclient[grpc,http]>=2.30.0
+Requires-Dist: huggingface-hub>=0.16.0
+Requires-Dist: kubernetes>=25.3.0
+Requires-Dist: mlflow>=2.4.0
+Requires-Dist: torch>=2.0.0
+Dynamic: license-file
+# isA_Model - AI服务工厂
+isA_Model是一个轻量级AI服务工厂，用于统一管理和调用不同的AI模型和服务提供商。
+## 特性
+- 支持多种AI提供商(Ollama, OpenAI, Replicate, Triton)
+- 统一的API接口
+- 灵活的工厂模式
+- 异步支持
+- 单例模式，高效缓存
+## 安装
+```bash
+pip install -r requirements.txt
+```
+## 快速开始
+使用AI工厂很简单：
+```python
+from isa_model.inference.ai_factory import AIFactory
+from isa_model.inference.base import ModelType
+# 获取工厂实例
+factory = AIFactory()
+# LLM示例 - 使用Ollama
+llm = factory.get_llm(model_name="llama3.1", provider="ollama")
+response = await llm.generate("你好，请介绍一下自己。")
+print(response)
+# 图像生成示例 - 使用Replicate
+vision_service = factory.get_vision_model(
+    model_name="stability-ai/sdxl:c221b2b8ef527988fb59bf24a8b97c4561f1c671f73bd389f866bfb27c061316",
+    provider="replicate",
+    config={"api_token": "your_replicate_token"}
+)
+result = await vision_service.generate_image({
+    "prompt": "A beautiful sunset over mountains",
+    "num_inference_steps": 25
+})
+print(result["urls"])
+```
+## 工厂架构
+isA_Model使用三层架构:
+1. **客户端层** - 应用程序代码
+2. **服务层** - 模型服务实现(LLM, 图像, 嵌入等)
+3. **提供商层** - 底层API集成(Ollama, OpenAI, Replicate等)
+### 主要组件
+- `AIFactory` - 中央工厂类，提供模型和服务访问
+- `BaseService` - 所有服务的基类
+- `BaseProvider` - 所有提供商的基类
+- 特定服务实现 - 如`ReplicateVisionService`, `OllamaLLMService`等
+## 支持的模型类型
+- **LLM** - 大语言模型
+- **VISION** - 图像生成和分析
+- **EMBEDDING** - 文本嵌入
+- **AUDIO** - 语音识别
+- **RERANK** - 重排序
+## 示例
+查看`test_*.py`文件获取更多使用示例。
+## 环境变量
+将API密钥和其他配置添加到`.env.local`文件中:
+```
+OPENAI_API_KEY=your_openai_key
+REPLICATE_API_TOKEN=your_replicate_token
+```
+## 许可证
+MIT