PyPI - isa-model - Versions diffs - 0.3.5__py3-none-any.whl → 0.3.7__py3-none-any.whl - Mend

isa-model 0.3.5__py3-none-any.whl → 0.3.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (88)

isa_model/__init__.py +30 -1
isa_model/client.py +937 -0
isa_model/core/config/__init__.py +16 -0
isa_model/core/config/config_manager.py +514 -0
isa_model/core/config.py +426 -0
isa_model/core/models/model_billing_tracker.py +476 -0
isa_model/core/models/model_manager.py +399 -0
isa_model/core/{storage/supabase_storage.py → models/model_repo.py} +72 -73
isa_model/core/pricing_manager.py +426 -0
isa_model/core/services/__init__.py +19 -0
isa_model/core/services/intelligent_model_selector.py +547 -0
isa_model/core/types.py +291 -0
isa_model/deployment/__init__.py +2 -0
isa_model/deployment/cloud/modal/isa_vision_doc_service.py +157 -3
isa_model/deployment/cloud/modal/isa_vision_table_service.py +532 -0
isa_model/deployment/cloud/modal/isa_vision_ui_service.py +104 -3
isa_model/deployment/cloud/modal/register_models.py +321 -0
isa_model/deployment/runtime/deployed_service.py +338 -0
isa_model/deployment/services/__init__.py +9 -0
isa_model/deployment/services/auto_deploy_vision_service.py +538 -0
isa_model/deployment/services/model_service.py +332 -0
isa_model/deployment/services/service_monitor.py +356 -0
isa_model/deployment/services/service_registry.py +527 -0
isa_model/deployment/services/simple_auto_deploy_vision_service.py +275 -0
isa_model/eval/__init__.py +80 -44
isa_model/eval/config/__init__.py +10 -0
isa_model/eval/config/evaluation_config.py +108 -0
isa_model/eval/evaluators/__init__.py +18 -0
isa_model/eval/evaluators/base_evaluator.py +503 -0
isa_model/eval/evaluators/llm_evaluator.py +472 -0
isa_model/eval/factory.py +417 -709
isa_model/eval/infrastructure/__init__.py +24 -0
isa_model/eval/infrastructure/experiment_tracker.py +466 -0
isa_model/eval/metrics.py +191 -21
isa_model/inference/ai_factory.py +257 -601
isa_model/inference/services/audio/base_stt_service.py +65 -1
isa_model/inference/services/audio/base_tts_service.py +75 -1
isa_model/inference/services/audio/openai_stt_service.py +189 -151
isa_model/inference/services/audio/openai_tts_service.py +12 -10
isa_model/inference/services/audio/replicate_tts_service.py +61 -56
isa_model/inference/services/base_service.py +55 -17
isa_model/inference/services/embedding/base_embed_service.py +65 -1
isa_model/inference/services/embedding/ollama_embed_service.py +103 -43
isa_model/inference/services/embedding/openai_embed_service.py +8 -10
isa_model/inference/services/helpers/stacked_config.py +148 -0
isa_model/inference/services/img/__init__.py +18 -0
isa_model/inference/services/{vision → img}/base_image_gen_service.py +80 -1
isa_model/inference/services/{stacked → img}/flux_professional_service.py +25 -1
isa_model/inference/services/{stacked → img/helpers}/base_stacked_service.py +40 -35
isa_model/inference/services/{vision → img}/replicate_image_gen_service.py +44 -31
isa_model/inference/services/llm/__init__.py +3 -3
isa_model/inference/services/llm/base_llm_service.py +492 -40
isa_model/inference/services/llm/helpers/llm_prompts.py +258 -0
isa_model/inference/services/llm/helpers/llm_utils.py +280 -0
isa_model/inference/services/llm/ollama_llm_service.py +51 -17
isa_model/inference/services/llm/openai_llm_service.py +70 -19
isa_model/inference/services/llm/yyds_llm_service.py +24 -23
isa_model/inference/services/vision/__init__.py +38 -4
isa_model/inference/services/vision/base_vision_service.py +218 -117
isa_model/inference/services/vision/{isA_vision_service.py → disabled/isA_vision_service.py} +98 -0
isa_model/inference/services/{stacked → vision}/doc_analysis_service.py +1 -1
isa_model/inference/services/vision/helpers/base_stacked_service.py +274 -0
isa_model/inference/services/vision/helpers/image_utils.py +272 -3
isa_model/inference/services/vision/helpers/vision_prompts.py +297 -0
isa_model/inference/services/vision/openai_vision_service.py +104 -307
isa_model/inference/services/vision/replicate_vision_service.py +140 -325
isa_model/inference/services/{stacked → vision}/ui_analysis_service.py +2 -498
isa_model/scripts/register_models.py +370 -0
isa_model/scripts/register_models_with_embeddings.py +510 -0
isa_model/serving/api/fastapi_server.py +6 -1
isa_model/serving/api/routes/unified.py +274 -0
{isa_model-0.3.5.dist-info → isa_model-0.3.7.dist-info}/METADATA +4 -1
{isa_model-0.3.5.dist-info → isa_model-0.3.7.dist-info}/RECORD +78 -53
isa_model/config/__init__.py +0 -9
isa_model/config/config_manager.py +0 -213
isa_model/core/model_manager.py +0 -213
isa_model/core/model_registry.py +0 -375
isa_model/core/vision_models_init.py +0 -116
isa_model/inference/billing_tracker.py +0 -406
isa_model/inference/services/llm/triton_llm_service.py +0 -481
isa_model/inference/services/stacked/__init__.py +0 -26
isa_model/inference/services/stacked/config.py +0 -426
isa_model/inference/services/vision/ollama_vision_service.py +0 -194
isa_model/core/{model_storage.py → models/model_storage.py} +0 -0
isa_model/inference/services/{vision → embedding}/helpers/text_splitter.py +0 -0
isa_model/inference/services/llm/{llm_adapter.py → helpers/llm_adapter.py} +0 -0
{isa_model-0.3.5.dist-info → isa_model-0.3.7.dist-info}/WHEEL +0 -0
{isa_model-0.3.5.dist-info → isa_model-0.3.7.dist-info}/top_level.txt +0 -0

isa_model/config/config_manager.py DELETED

@@ -1,213 +0,0 @@
-"""
-Configuration Manager
-Central configuration management with environment support
-"""
-import os
-import yaml
-from typing import Dict, Any, Optional
-from pathlib import Path
-from dataclasses import dataclass
-import logging
-logger = logging.getLogger(__name__)
-@dataclass
-class ConfigSection:
-    """Base configuration section"""
-    def to_dict(self) -> Dict[str, Any]:
-        return self.__dict__
-@dataclass
-class DeploymentConfig(ConfigSection):
-    """Deployment configuration"""
-    platform: str = "replicate"  # replicate, modal, aws, local
-    modal_app_name: str = "isa-ui-analysis"
-    modal_gpu_type: str = "A100-40GB"
-    modal_memory: int = 32768
-    modal_timeout: int = 1800
-    modal_keep_warm: int = 1
-@dataclass
-class ModelConfig(ConfigSection):
-    """Model configuration"""
-    ui_detection_model: str = "microsoft/omniparser-v2"
-    ui_planning_model: str = "gpt-4o-mini"
-    fallback_detection: str = "yolov8n"
-    quantization: bool = False
-    batch_size: int = 1
-@dataclass
-class ServingConfig(ConfigSection):
-    """Serving configuration"""
-    host: str = "0.0.0.0"
-    port: int = 8000
-    workers: int = 1
-    reload: bool = False
-    log_level: str = "info"
-    cors_origins: list = None
-    def __post_init__(self):
-        if self.cors_origins is None:
-            self.cors_origins = ["*"]
-@dataclass
-class APIConfig(ConfigSection):
-    """API configuration"""
-    rate_limit: int = 100  # requests per minute
-    max_file_size: int = 10 * 1024 * 1024  # 10MB
-    cache_ttl: int = 3600  # 1 hour
-    enable_auth: bool = False
-@dataclass
-class ISAConfig:
-    """Complete ISA configuration"""
-    environment: str
-    deployment: DeploymentConfig
-    models: ModelConfig
-    serving: ServingConfig
-    api: APIConfig
-    def to_dict(self) -> Dict[str, Any]:
-        return {
-            "environment": self.environment,
-            "deployment": self.deployment.to_dict(),
-            "models": self.models.to_dict(),
-            "serving": self.serving.to_dict(),
-            "api": self.api.to_dict()
-        }
-class ConfigManager:
-    """Configuration manager with environment support"""
-    _instance = None
-    _config = None
-    def __new__(cls):
-        if cls._instance is None:
-            cls._instance = super(ConfigManager, cls).__new__(cls)
-        return cls._instance
-    def __init__(self):
-        if self._config is None:
-            self._load_config()
-    def _load_config(self):
-        """Load configuration from environment and files"""
-        env = os.getenv("ISA_ENV", "development")
-        # Default configurations
-        default_config = {
-            "deployment": DeploymentConfig(),
-            "models": ModelConfig(),
-            "serving": ServingConfig(),
-            "api": APIConfig()
-        }
-        # Load environment-specific configuration
-        config_file = self._get_config_file(env)
-        if config_file and config_file.exists():
-            try:
-                with open(config_file, 'r') as f:
-                    file_config = yaml.safe_load(f)
-                # Merge configurations
-                self._config = self._merge_configs(default_config, file_config, env)
-                logger.info(f"Loaded configuration for environment: {env}")
-            except Exception as e:
-                logger.warning(f"Failed to load config file {config_file}: {e}")
-                self._config = ISAConfig(environment=env, **default_config)
-        else:
-            logger.info(f"No config file found for {env}, using defaults")
-            self._config = ISAConfig(environment=env, **default_config)
-        # Override with environment variables
-        self._apply_env_overrides()
-    def _get_config_file(self, env: str) -> Optional[Path]:
-        """Get configuration file path for environment"""
-        # Try to find config file in multiple locations
-        possible_paths = [
-            Path(__file__).parent / "environments" / f"{env}.yaml",
-            Path.cwd() / "config" / f"{env}.yaml",
-            Path.cwd() / f"config_{env}.yaml"
-        ]
-        for path in possible_paths:
-            if path.exists():
-                return path
-        return None
-    def _merge_configs(self, default: Dict, file_config: Dict, env: str) -> ISAConfig:
-        """Merge default and file configurations"""
-        # Update deployment config
-        deployment_data = {**default["deployment"].__dict__}
-        if "deployment" in file_config:
-            deployment_data.update(file_config["deployment"])
-        deployment = DeploymentConfig(**deployment_data)
-        # Update model config
-        models_data = {**default["models"].__dict__}
-        if "models" in file_config:
-            models_data.update(file_config["models"])
-        models = ModelConfig(**models_data)
-        # Update serving config
-        serving_data = {**default["serving"].__dict__}
-        if "serving" in file_config:
-            serving_data.update(file_config["serving"])
-        serving = ServingConfig(**serving_data)
-        # Update API config
-        api_data = {**default["api"].__dict__}
-        if "api" in file_config:
-            api_data.update(file_config["api"])
-        api = APIConfig(**api_data)
-        return ISAConfig(
-            environment=env,
-            deployment=deployment,
-            models=models,
-            serving=serving,
-            api=api
-        )
-    def _apply_env_overrides(self):
-        """Apply environment variable overrides"""
-        # Deployment overrides
-        if os.getenv("ISA_DEPLOYMENT_PLATFORM"):
-            self._config.deployment.platform = os.getenv("ISA_DEPLOYMENT_PLATFORM")
-        # Model overrides
-        if os.getenv("ISA_UI_DETECTION_MODEL"):
-            self._config.models.ui_detection_model = os.getenv("ISA_UI_DETECTION_MODEL")
-        # Serving overrides
-        if os.getenv("ISA_SERVING_PORT"):
-            self._config.serving.port = int(os.getenv("ISA_SERVING_PORT"))
-        if os.getenv("ISA_SERVING_HOST"):
-            self._config.serving.host = os.getenv("ISA_SERVING_HOST")
-    def get_config(self) -> ISAConfig:
-        """Get current configuration"""
-        return self._config
-    def reload(self):
-        """Reload configuration"""
-        self._config = None
-        self._load_config()
-# Singleton instance
-_config_manager = ConfigManager()
-def get_config() -> ISAConfig:
-    """Get configuration instance"""
-    return _config_manager.get_config()
-def reload_config():
-    """Reload configuration"""
-    _config_manager.reload()

isa_model/core/model_manager.py DELETED

@@ -1,213 +0,0 @@
-from typing import Dict, Optional, List, Any
-import logging
-from pathlib import Path
-from huggingface_hub import hf_hub_download, snapshot_download
-from huggingface_hub.errors import HfHubHTTPError
-from .model_storage import ModelStorage, LocalModelStorage
-from .model_registry import ModelRegistry, ModelType, ModelCapability
-logger = logging.getLogger(__name__)
-class ModelManager:
-    """Model management service for handling model downloads, versions, and caching"""
-    # 统一的模型计费信息 (per 1M tokens)
-    MODEL_PRICING = {
-        # OpenAI Models
-        "openai": {
-            "gpt-4o-mini": {"input": 0.15, "output": 0.6},
-            "gpt-4.1-mini": {"input": 0.4, "output": 1.6},
-            "gpt-4.1-nano": {"input": 0.1, "output": 0.4},
-            "gpt-4o": {"input": 5.0, "output": 15.0},
-            "gpt-4-turbo": {"input": 10.0, "output": 30.0},
-            "gpt-4": {"input": 30.0, "output": 60.0},
-            "gpt-3.5-turbo": {"input": 0.5, "output": 1.5},
-            "text-embedding-3-small": {"input": 0.02, "output": 0.0},
-            "text-embedding-3-large": {"input": 0.13, "output": 0.0},
-            "whisper-1": {"input": 6.0, "output": 0.0},
-            "tts-1": {"input": 15.0, "output": 0.0},
-            "tts-1-hd": {"input": 30.0, "output": 0.0},
-        },
-        # Ollama Models (免费本地模型)
-        "ollama": {
-            "llama3.2:3b-instruct-fp16": {"input": 0.0, "output": 0.0},
-            "llama3.2-vision:latest": {"input": 0.0, "output": 0.0},
-            "bge-m3": {"input": 0.0, "output": 0.0},
-        },
-        # Replicate Models
-        "replicate": {
-            "black-forest-labs/flux-schnell": {"input": 3.0, "output": 0.0},  # $3 per 1000 images
-            "black-forest-labs/flux-kontext-pro": {"input": 40.0, "output": 0.0},  # $0.04 per image = $40 per 1000 images
-            "meta/meta-llama-3-8b-instruct": {"input": 0.05, "output": 0.25},
-            "kokoro-82m": {"input": 0.0, "output": 0.4},  # ~$0.0004 per second
-            "jaaari/kokoro-82m:f559560eb822dc509045f3921a1921234918b91739db4bf3daab2169b71c7a13": {"input": 0.0, "output": 0.4},
-        },
-        # YYDS Models
-        "yyds": {
-            "claude-sonnet-4-20250514": {"input": 4.5, "output": 22.5},  # $0.0045/1K = $4.5/1M, $0.0225/1K = $22.5/1M
-            "claude-3-5-sonnet-20241022": {"input": 3.0, "output": 15.0},  # $0.003/1K = $3.0/1M, $0.015/1K = $15.0/1M
-        }
-    }
-    def __init__(self,
-                 storage: Optional[ModelStorage] = None,
-                 registry: Optional[ModelRegistry] = None):
-        self.storage = storage or LocalModelStorage()
-        self.registry = registry or ModelRegistry()
-    def get_model_pricing(self, provider: str, model_name: str) -> Dict[str, float]:
-        """获取模型定价信息"""
-        return self.MODEL_PRICING.get(provider, {}).get(model_name, {"input": 0.0, "output": 0.0})
-    def calculate_cost(self, provider: str, model_name: str, input_tokens: int, output_tokens: int) -> float:
-        """计算请求成本"""
-        pricing = self.get_model_pricing(provider, model_name)
-        input_cost = (input_tokens / 1_000_000) * pricing["input"]
-        output_cost = (output_tokens / 1_000_000) * pricing["output"]
-        return input_cost + output_cost
-    def get_cheapest_model(self, provider: str, model_type: str = "llm") -> Optional[str]:
-        """获取最便宜的模型"""
-        provider_models = self.MODEL_PRICING.get(provider, {})
-        if not provider_models:
-            return None
-        # 计算每个模型的平均成本 (假设输入输出比例 1:1)
-        cheapest_model = None
-        lowest_cost = float('inf')
-        for model_name, pricing in provider_models.items():
-            avg_cost = (pricing["input"] + pricing["output"]) / 2
-            if avg_cost < lowest_cost:
-                lowest_cost = avg_cost
-                cheapest_model = model_name
-        return cheapest_model
-    async def get_model(self,
-                       model_id: str,
-                       repo_id: str,
-                       model_type: ModelType,
-                       capabilities: List[ModelCapability],
-                       revision: Optional[str] = None,
-                       force_download: bool = False) -> Optional[Path]:
-        """
-        Get model files, downloading if necessary
-        Args:
-            model_id: Unique identifier for the model
-            repo_id: Hugging Face repository ID
-            model_type: Type of model (LLM, embedding, etc.)
-            capabilities: List of model capabilities
-            revision: Specific model version/tag
-            force_download: Force re-download even if cached
-        Returns:
-            Path to the model files or None if failed
-        """
-        # Check if model is already downloaded
-        if not force_download:
-            model_path = await self.storage.load_model(model_id)
-            if model_path:
-                logger.info(f"Using cached model {model_id}")
-                return model_path
-        try:
-            # Download model files
-            logger.info(f"Downloading model {model_id} from {repo_id}")
-            model_dir = Path(f"./models/temp/{model_id}")
-            model_dir.mkdir(parents=True, exist_ok=True)
-            snapshot_download(
-                repo_id=repo_id,
-                revision=revision,
-                local_dir=model_dir,
-                local_dir_use_symlinks=False
-            )
-            # Save model and metadata
-            metadata = {
-                "repo_id": repo_id,
-                "revision": revision,
-                "downloaded_at": str(Path(model_dir).stat().st_mtime)
-            }
-            # Register model
-            self.registry.register_model(
-                model_id=model_id,
-                model_type=model_type,
-                capabilities=capabilities,
-                metadata=metadata
-            )
-            # Save model files
-            await self.storage.save_model(model_id, str(model_dir), metadata)
-            return await self.storage.load_model(model_id)
-        except HfHubHTTPError as e:
-            logger.error(f"Failed to download model {model_id}: {e}")
-            return None
-        except Exception as e:
-            logger.error(f"Unexpected error downloading model {model_id}: {e}")
-            return None
-    async def list_models(self) -> List[Dict[str, Any]]:
-        """List all downloaded models with their metadata"""
-        models = await self.storage.list_models()
-        return [
-            {
-                "model_id": model_id,
-                **metadata,
-                **(self.registry.get_model_info(model_id) or {})
-            }
-            for model_id, metadata in models.items()
-        ]
-    async def remove_model(self, model_id: str) -> bool:
-        """Remove a model and its metadata"""
-        try:
-            # Remove from storage
-            storage_success = await self.storage.delete_model(model_id)
-            # Unregister from registry
-            registry_success = self.registry.unregister_model(model_id)
-            return storage_success and registry_success
-        except Exception as e:
-            logger.error(f"Failed to remove model {model_id}: {e}")
-            return False
-    async def get_model_info(self, model_id: str) -> Optional[Dict[str, Any]]:
-        """Get information about a specific model"""
-        storage_info = await self.storage.get_metadata(model_id)
-        registry_info = self.registry.get_model_info(model_id)
-        if not storage_info and not registry_info:
-            return None
-        return {
-            **(storage_info or {}),
-            **(registry_info or {})
-        }
-    async def update_model(self,
-                          model_id: str,
-                          repo_id: str,
-                          model_type: ModelType,
-                          capabilities: List[ModelCapability],
-                          revision: Optional[str] = None) -> bool:
-        """Update a model to a new version"""
-        try:
-            return bool(await self.get_model(
-                model_id=model_id,
-                repo_id=repo_id,
-                model_type=model_type,
-                capabilities=capabilities,
-                revision=revision,
-                force_download=True
-            ))
-        except Exception as e:
-            logger.error(f"Failed to update model {model_id}: {e}")
-            return False

isa-model 0.3.5__py3-none-any.whl → 0.3.7__py3-none-any.whl

isa-model 0.3.5__py3-none-any.whl → 0.3.7__py3-none-any.whl