PyPI - isa-model - Versions diffs - 0.1.0__py3-none-any.whl → 0.1.1__py3-none-any.whl - Mend

isa-model 0.1.0__py3-none-any.whl → 0.1.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (76)

isa_model/__init__.py +1 -1
isa_model/core/model_registry.py +273 -46
isa_model/deployment/gpu_fp16_ds8/models/deepseek_r1/1/model.py +120 -0
isa_model/deployment/gpu_fp16_ds8/scripts/download_model.py +18 -0
isa_model/deployment/gpu_int8_ds8/app/server.py +66 -0
isa_model/deployment/gpu_int8_ds8/scripts/test_client.py +43 -0
isa_model/deployment/gpu_int8_ds8/scripts/test_client_os.py +35 -0
isa_model/eval/__init__.py +56 -0
isa_model/eval/benchmarks.py +469 -0
isa_model/eval/factory.py +582 -0
isa_model/eval/metrics.py +628 -0
isa_model/inference/ai_factory.py +98 -93
isa_model/inference/providers/openai_provider.py +21 -7
isa_model/inference/providers/replicate_provider.py +18 -5
isa_model/inference/providers/triton_provider.py +1 -1
isa_model/inference/services/audio/base_stt_service.py +91 -0
isa_model/inference/services/audio/base_tts_service.py +136 -0
isa_model/inference/services/audio/{yyds_audio_service.py → openai_tts_service.py} +4 -4
isa_model/inference/services/embedding/ollama_embed_service.py +48 -36
isa_model/inference/services/llm/__init__.py +0 -4
isa_model/inference/services/llm/base_llm_service.py +134 -0
isa_model/inference/services/llm/ollama_llm_service.py +1 -10
isa_model/inference/services/llm/openai_llm_service.py +70 -61
isa_model/inference/services/vision/__init__.py +1 -1
isa_model/inference/services/vision/ollama_vision_service.py +4 -4
isa_model/inference/services/vision/{yyds_vision_service.py → openai_vision_service.py} +5 -5
isa_model/inference/services/vision/replicate_image_gen_service.py +185 -0
isa_model/training/__init__.py +44 -0
isa_model/training/factory.py +393 -0
isa_model-0.1.1.dist-info/METADATA +327 -0
{isa_model-0.1.0.dist-info → isa_model-0.1.1.dist-info}/RECORD +35 -60
isa_model/deployment/mlflow_gateway/__init__.py +0 -8
isa_model/deployment/mlflow_gateway/start_gateway.py +0 -65
isa_model/deployment/unified_multimodal_client.py +0 -341
isa_model/inference/adapter/triton_adapter.py +0 -453
isa_model/inference/backends/Pytorch/bge_embed_backend.py +0 -188
isa_model/inference/backends/Pytorch/gemma_backend.py +0 -167
isa_model/inference/backends/Pytorch/llama_backend.py +0 -166
isa_model/inference/backends/Pytorch/whisper_backend.py +0 -194
isa_model/inference/backends/__init__.py +0 -53
isa_model/inference/backends/base_backend_client.py +0 -26
isa_model/inference/backends/container_services.py +0 -104
isa_model/inference/backends/local_services.py +0 -72
isa_model/inference/backends/openai_client.py +0 -130
isa_model/inference/backends/replicate_client.py +0 -197
isa_model/inference/backends/third_party_services.py +0 -239
isa_model/inference/backends/triton_client.py +0 -97
isa_model/inference/client_sdk/client.py +0 -134
isa_model/inference/client_sdk/client_data_std.py +0 -34
isa_model/inference/client_sdk/client_sdk_schema.py +0 -16
isa_model/inference/client_sdk/exceptions.py +0 -0
isa_model/inference/engine/triton/model_repository/bge/1/model.py +0 -174
isa_model/inference/engine/triton/model_repository/gemma/1/model.py +0 -250
isa_model/inference/engine/triton/model_repository/llama/1/model.py +0 -76
isa_model/inference/engine/triton/model_repository/whisper/1/model.py +0 -195
isa_model/inference/providers/vllm_provider.py +0 -0
isa_model/inference/providers/yyds_provider.py +0 -83
isa_model/inference/services/audio/fish_speech/handler.py +0 -215
isa_model/inference/services/audio/runpod_tts_fish_service.py +0 -212
isa_model/inference/services/audio/triton_speech_service.py +0 -138
isa_model/inference/services/audio/whisper_service.py +0 -186
isa_model/inference/services/base_tts_service.py +0 -66
isa_model/inference/services/embedding/bge_service.py +0 -183
isa_model/inference/services/embedding/ollama_rerank_service.py +0 -118
isa_model/inference/services/embedding/onnx_rerank_service.py +0 -73
isa_model/inference/services/llm/gemma_service.py +0 -143
isa_model/inference/services/llm/llama_service.py +0 -143
isa_model/inference/services/llm/replicate_llm_service.py +0 -179
isa_model/inference/services/llm/triton_llm_service.py +0 -230
isa_model/inference/services/vision/replicate_vision_service.py +0 -241
isa_model/inference/services/vision/triton_vision_service.py +0 -199
isa_model-0.1.0.dist-info/METADATA +0 -116
isa_model/inference/{client_sdk/__init__.py → services/embedding/openai_embed_service.py} +0 -0
{isa_model-0.1.0.dist-info → isa_model-0.1.1.dist-info}/WHEEL +0 -0
{isa_model-0.1.0.dist-info → isa_model-0.1.1.dist-info}/licenses/LICENSE +0 -0
{isa_model-0.1.0.dist-info → isa_model-0.1.1.dist-info}/top_level.txt +0 -0

isa_model-0.1.1.dist-info/METADATA ADDED Viewed

@@ -0,0 +1,327 @@
+Metadata-Version: 2.4
+Name: isa-model
+Version: 0.1.1
+Summary: Unified AI model serving framework
+Author-email: isA_Model Contributors <your.email@example.com>
+License-Expression: MIT
+Classifier: Development Status :: 3 - Alpha
+Classifier: Intended Audience :: Developers
+Classifier: Operating System :: OS Independent
+Classifier: Programming Language :: Python :: 3
+Requires-Python: >=3.8
+Description-Content-Type: text/markdown
+License-File: LICENSE
+Requires-Dist: fastapi>=0.95.0
+Requires-Dist: numpy>=1.20.0
+Requires-Dist: httpx>=0.23.0
+Requires-Dist: pydantic>=2.0.0
+Requires-Dist: uvicorn>=0.22.0
+Requires-Dist: requests>=2.28.0
+Requires-Dist: aiohttp>=3.8.0
+Requires-Dist: transformers>=4.30.0
+Requires-Dist: langchain-core>=0.1.0
+Requires-Dist: huggingface-hub>=0.16.0
+Requires-Dist: kubernetes>=25.3.0
+Requires-Dist: mlflow>=2.4.0
+Requires-Dist: torch>=2.0.0
+Requires-Dist: openai>=1.10.0
+Requires-Dist: replicate>=0.23.0
+Requires-Dist: python-dotenv>=1.0.0
+Dynamic: license-file
+# isA Model - Unified AI Model Serving Framework
+A comprehensive Python framework for working with multiple AI providers and models through a unified interface. Support for OpenAI, Replicate, Ollama, and more.
+## Installation
+```bash
+pip install isa-model
+```
+## Quick Start
+The isa-model package supports three main usage patterns:
+### 1. Pass API Keys Directly (Recommended)
+This is the most flexible approach - no environment variables needed:
+```python
+from isa_model.inference.ai_factory import AIFactory
+# Create factory instance
+factory = AIFactory.get_instance()
+# Use OpenAI with API key
+llm = factory.get_llm(
+    model_name="gpt-4o-mini",
+    provider="openai",
+    api_key="your-openai-api-key-here"
+)
+# Use Replicate for image generation
+image_gen = factory.get_vision_model(
+    model_name="stability-ai/sdxl",
+    provider="replicate",
+    api_key="your-replicate-token-here"
+)
+```
+### 2. Use Environment Variables
+Set your API keys as environment variables:
+```bash
+export OPENAI_API_KEY="your-openai-api-key"
+export REPLICATE_API_TOKEN="your-replicate-token"
+```
+Then use without passing keys:
+```python
+from isa_model.inference.ai_factory import AIFactory
+factory = AIFactory.get_instance()
+# Will automatically use OPENAI_API_KEY from environment
+llm = factory.get_llm(model_name="gpt-4o-mini", provider="openai")
+# Will automatically use REPLICATE_API_TOKEN from environment
+image_gen = factory.get_vision_model(model_name="stability-ai/sdxl", provider="replicate")
+```
+### 3. Use Local Models (No API Key Needed)
+For local models like Ollama, no API keys are required:
+```python
+from isa_model.inference.ai_factory import AIFactory
+factory = AIFactory.get_instance()
+# Use local Ollama model (no API key needed)
+llm = factory.get_llm(model_name="llama3.1", provider="ollama")
+```
+## Supported Services
+### Language Models (LLM)
+```python
+# OpenAI models
+llm = factory.get_llm("gpt-4o-mini", "openai", api_key="your-key")
+llm = factory.get_llm("gpt-4o", "openai", api_key="your-key")
+# Ollama models (local)
+llm = factory.get_llm("llama3.1", "ollama")
+llm = factory.get_llm("codellama", "ollama")
+# Replicate models
+llm = factory.get_llm("meta/llama-3-70b-instruct", "replicate", api_key="your-token")
+```
+### Vision Models
+```python
+# OpenAI vision
+vision = factory.get_vision_model("gpt-4o", "openai", api_key="your-key")
+# Replicate image generation
+image_gen = factory.get_vision_model("stability-ai/sdxl", "replicate", api_key="your-token")
+# Ollama vision (local)
+vision = factory.get_vision_model("llava", "ollama")
+```
+### Embedding Models
+```python
+# OpenAI embeddings
+embedder = factory.get_embedding("text-embedding-3-small", "openai", {"api_key": "your-key"})
+# Ollama embeddings (local)
+embedder = factory.get_embedding("bge-m3", "ollama")
+```
+## Base Service Classes
+The framework provides comprehensive base classes for implementing new AI services:
+### BaseLLMService
+- `ainvoke()` - Universal invocation method
+- `achat()` - Chat completion with messages
+- `acompletion()` - Simple text completion
+- `agenerate()` - Generate multiple completions
+- `astream_chat()` - Streaming chat responses
+- `get_token_usage()` - Token usage statistics
+### BaseVisionService
+- `analyze_image()` - Analyze and describe images
+- `describe_image()` - Generate detailed descriptions
+- `extract_text()` - OCR text extraction
+- `detect_objects()` - Object detection
+- `classify_image()` - Image classification
+- `compare_images()` - Image similarity comparison
+### BaseImageGenService
+- `generate_image()` - Generate single image from text
+- `generate_images()` - Generate multiple images
+- `image_to_image()` - Transform existing images
+- `get_supported_sizes()` - Get supported dimensions
+### BaseEmbedService
+- `create_text_embedding()` - Single text embedding
+- `create_text_embeddings()` - Batch text embeddings
+- `compute_similarity()` - Similarity calculation
+- `find_similar_texts()` - Semantic search
+### BaseSTTService (Speech-to-Text)
+- `transcribe_audio()` - Audio transcription
+- `transcribe_audio_batch()` - Batch transcription
+- `detect_language()` - Language detection
+### BaseTTSService (Text-to-Speech)
+- `synthesize_speech()` - Text to speech conversion
+- `synthesize_speech_to_file()` - Save speech to file
+- `get_available_voices()` - List available voices
+## Usage Examples
+### Chat Completion
+```python
+import asyncio
+from isa_model.inference.ai_factory import AIFactory
+async def chat_example():
+    factory = AIFactory.get_instance()
+    llm = factory.get_llm("gpt-4o-mini", "openai", api_key="your-key")
+    messages = [
+        {"role": "user", "content": "Hello, how are you?"}
+    ]
+    response = await llm.achat(messages)
+    print(response)
+# Run the async function
+asyncio.run(chat_example())
+```
+### Image Analysis
+```python
+import asyncio
+from isa_model.inference.ai_factory import AIFactory
+async def vision_example():
+    factory = AIFactory.get_instance()
+    vision = factory.get_vision_model("gpt-4o", "openai", api_key="your-key")
+    result = await vision.analyze_image(
+        image="path/to/your/image.jpg",
+        prompt="What do you see in this image?"
+    )
+    print(result["text"])
+asyncio.run(vision_example())
+```
+### Image Generation
+```python
+import asyncio
+from isa_model.inference.ai_factory import AIFactory
+async def image_gen_example():
+    factory = AIFactory.get_instance()
+    image_gen = factory.get_vision_model(
+        "stability-ai/sdxl",
+        "replicate",
+        api_key="your-replicate-token"
+    )
+    result = await image_gen.generate_image(
+        prompt="A beautiful sunset over mountains",
+        width=1024,
+        height=1024
+    )
+    # Save the generated image
+    with open("generated_image.png", "wb") as f:
+        f.write(result["image_data"])
+asyncio.run(image_gen_example())
+```
+## Configuration Options
+You can pass additional configuration options:
+```python
+# Custom configuration
+config = {
+    "temperature": 0.7,
+    "max_tokens": 1000,
+    "top_p": 0.9
+}
+llm = factory.get_llm(
+    model_name="gpt-4o-mini",
+    provider="openai",
+    config=config,
+    api_key="your-key"
+)
+```
+## Error Handling
+The framework provides informative error messages and graceful fallbacks:
+```python
+try:
+    llm = factory.get_llm("gpt-4o-mini", "openai", api_key="invalid-key")
+    response = await llm.achat([{"role": "user", "content": "Hello"}])
+except Exception as e:
+    print(f"Error: {e}")
+```
+## Development
+### Installing for Development
+```bash
+git clone <repository-url>
+cd isA_Model
+pip install -e .
+```
+### Running Tests
+```bash
+pytest tests/
+```
+### Building and Publishing
+```bash
+# Build the package
+python -m build
+# Upload to PyPI (requires PYPI_API_TOKEN in .env.local)
+bash scripts/normal_update.sh
+```
+## License
+MIT License - see LICENSE file for details.
+## Contributing
+Contributions are welcome! Please read our contributing guidelines and submit pull requests to our GitHub repository.
+## Support
+For questions and support, please open an issue on our GitHub repository.

{isa_model-0.1.0.dist-info → isa_model-0.1.1.dist-info}/RECORD RENAMED Viewed

@@ -1,6 +1,6 @@
-isa_model/__init__.py,sha256=d63WuNpouABPnomHiQKmPp829-ba-CtKnyefZwgFNsc,87
+isa_model/__init__.py,sha256=gr-wNN5AZw-rACDfAaQjU5yRHNvqAdimR4O7opDC7tE,87
 isa_model/core/model_manager.py,sha256=eQp0MV0x5sghL1qliPUWkFX4sEKqInyGLoICfNkJnZM,5275
-isa_model/core/model_registry.py,sha256=3K32y9N0M1fXoUH_EBPoFq9Tj1enFgOSx9H57upmsHs,4005
+isa_model/core/model_registry.py,sha256=gT8yFxi1gC-45Bolc9WX19ZvrjuV1xyBgQX6TFhz62k,14032
 isa_model/core/model_router.py,sha256=WT45wP5Ta-c3QErPGUY86G9-IpWQXjLC5FG8cPI-qK0,8637
 isa_model/core/model_storage.py,sha256=yMLapW87EY1EPXw6S7H8UQAZh3hJ1KxsEohjgjw-HrA,4507
 isa_model/core/model_version.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -8,69 +8,42 @@ isa_model/core/resource_manager.py,sha256=jlrlhHqtCbq4sAFgfGEEhTWRcuftXtjfV6SjkZ
 isa_model/core/storage/hf_storage.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 isa_model/core/storage/local_storage.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 isa_model/core/storage/minio_storage.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-isa_model/deployment/unified_multimodal_client.py,sha256=GjdQTfFAG4S3dvYvVrH9HraHuDMLPnoeTQKXx0Ybx5M,10858
-isa_model/deployment/mlflow_gateway/__init__.py,sha256=gXV4Vg5lTkqjf9ZQ1Xp-36U15GpoGo5x529stoH3zeI,197
-isa_model/deployment/mlflow_gateway/start_gateway.py,sha256=bfGuHggag3tIO9ItY5H6LSx1fZKDILBUog1JWw6Rlz4,1762
+isa_model/deployment/gpu_fp16_ds8/models/deepseek_r1/1/model.py,sha256=jCAN_r-22gNR1HURAjmIZVeuU1TNidcyXRzxQdi2jOs,4015
+isa_model/deployment/gpu_fp16_ds8/scripts/download_model.py,sha256=E6iSAgBu3OGfK-HLIXbGWfYSAIGQSGzj6wMAy1JAugI,566
+isa_model/deployment/gpu_int8_ds8/app/server.py,sha256=lwWxdnR2DNEd0vIGQyfabKtDSUzSHVQsy3Z_AJejpVg,2102
+isa_model/deployment/gpu_int8_ds8/scripts/test_client.py,sha256=aCULgRYzEQj_ELUK1bmPgN99yvFgNR5C0O3gc8S32pg,1421
+isa_model/deployment/gpu_int8_ds8/scripts/test_client_os.py,sha256=XXrneTCHUeh1LNRcu-YtZQ5B4pNawlrxC-cTWmJU2A8,936
+isa_model/eval/__init__.py,sha256=3sM7qLSIL_RMKcsmkCYcjOjv9ozuk16r7pnl4F-XeNA,1197
+isa_model/eval/benchmarks.py,sha256=_L4Vwj2hwf2yhqoleIASO9z5e3LRCClCVEVCQbGt0I8,16885
+isa_model/eval/factory.py,sha256=JmGRLTYPtZLqKwy8o1Z9NHUHX6mkRDw13ac_Qin_VrE,19529
+isa_model/eval/metrics.py,sha256=mYeGwSa9PkgY0p-vadAscvak-pLrVfCSrsmAodVpgNQ,22584
 isa_model/inference/__init__.py,sha256=usfuQJ4zYY2RRtHkE-V6LuJ5aN7WJogtPUj9Qmy4Wvw,318
-isa_model/inference/ai_factory.py,sha256=VLmmgJe26khTSXm_0z1p73vvbsvmVv9T8xvcJmnsEHo,15704
+isa_model/inference/ai_factory.py,sha256=mF-Pj8FUCsOvSG0IIg1OVMhDwXnpxIbZQJWVYWfjv2s,14660
 isa_model/inference/base.py,sha256=qwOddnSGI0GUdD6qIdGBPQpkW7UjU3Y-zaZvu70B4WA,1278
-isa_model/inference/adapter/triton_adapter.py,sha256=nmG1uNVXY28VxCdITDJw_p1FXVuBp9mtOutnHzv0cQ4,15120
 isa_model/inference/adapter/unified_api.py,sha256=67_Ok8W20m6Otf6r9WyOEVpnxondP4UAxOASk9ozDk4,8668
-isa_model/inference/backends/__init__.py,sha256=zNu9tlQlET5Jpr8kRGHV0vVW7XEyISeyNTxfkeEuYk4,1254
-isa_model/inference/backends/base_backend_client.py,sha256=aDlHnStvpxD8whX9E1TZ-8yh2SBfxHD_uzBNj84p1dE,648
-isa_model/inference/backends/container_services.py,sha256=BMa32QuFY19AOlhW4kFsPPrYDxiU5xbAPkf-l5cCCMo,4000
-isa_model/inference/backends/local_services.py,sha256=hReD3NimF5-TfrRl2gibHRs_TNF8TQ70IeDAQU4Xw1Q,2625
-isa_model/inference/backends/openai_client.py,sha256=gwB2VE-NfDtYaSM2ILh4uEp-i0X8SHf-fHPv1skF9WA,4703
-isa_model/inference/backends/replicate_client.py,sha256=kmcTvhyv09TWb-mx8As8GsjIJezI9Hsc4MZMinVqQo0,7062
-isa_model/inference/backends/third_party_services.py,sha256=jyvOoXulmIowcvbk5XzAUjUgUm2dn1ox3F1nPLI4fBQ,9471
-isa_model/inference/backends/triton_client.py,sha256=HuZB_FY4PhI-u6vpZMOzMjALFO9Jds1Vzyw8PMaTuxg,3712
-isa_model/inference/backends/Pytorch/bge_embed_backend.py,sha256=UNZbOYDzPvaxi8_8jRs881v-xpwGK1omB8uDWjL-N_s,5917
-isa_model/inference/backends/Pytorch/gemma_backend.py,sha256=i8W58H4iVfDvEHc6m5VZymNPTgexVGPDZ1rDn5s4ae0,5410
-isa_model/inference/backends/Pytorch/llama_backend.py,sha256=tRpAs9DdoqH1pjzDMg5T60sIYMOjtaSlLJ-Roxcl1aU,5248
-isa_model/inference/backends/Pytorch/whisper_backend.py,sha256=oMJ3Fg6O7zaURDg21IdM3HCdnyJiF-iyxIvNOuFFc8k,6218
-isa_model/inference/client_sdk/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-isa_model/inference/client_sdk/client.py,sha256=pvKNwnTGcPX-5Q3ACfiftXfghUaIksFfd-zqEi-ze0g,5049
-isa_model/inference/client_sdk/client_data_std.py,sha256=tFBMb2F6pqNeq49fKkRSJW656qpO0BB1rs_wqYJGCS4,1817
-isa_model/inference/client_sdk/client_sdk_schema.py,sha256=Kq5pKrvEzCs2ZYJ44PaMTimHyyCttI-fE1MES-qkGFc,544
-isa_model/inference/client_sdk/exceptions.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-isa_model/inference/engine/triton/model_repository/bge/1/model.py,sha256=43MuLQ_nNl64VTRPLmxe7SzkRJl-cZ3A_wnlgQMl_B8,6004
-isa_model/inference/engine/triton/model_repository/gemma/1/model.py,sha256=1aR7UG6W-Dv1PyOTRTmnKIerogricl2DI_4p__hfSt4,9481
-isa_model/inference/engine/triton/model_repository/llama/1/model.py,sha256=4m9_IorEeAPMve-93AECo3pRjK6Swhs38RbCfCn3WKo,3744
-isa_model/inference/engine/triton/model_repository/whisper/1/model.py,sha256=0hugV7MZYj4EwiF1JZzYjFSuj-HK7KVumwtPL2Dg8-w,7943
 isa_model/inference/providers/__init__.py,sha256=a83q-LMFv8u47wf0XtxvqOw_mlVgA_90wtuwy02qdDE,581
 isa_model/inference/providers/base_provider.py,sha256=btkSXE7o1IfOpv22hMM6_DNlm05tbLMszsP1J4T26KE,924
 isa_model/inference/providers/model_cache_manager.py,sha256=dLRpx7OJweQ5LcSAkU7D0DQRfLtIhG6nGvg4W_gau80,15315
 isa_model/inference/providers/ollama_provider.py,sha256=BLkWp4gmCw6Fwf1yNRY90VftMqwca9YOGOHf6DqVEKs,2692
-isa_model/inference/providers/openai_provider.py,sha256=Gwg7JALDs2xTEIWVX0foFue7PlSTjES3I-OLD9cnXOA,3280
-isa_model/inference/providers/replicate_provider.py,sha256=m4FzCd2BTtlPr11gUBDs6L4g4jTNHiPXrp2aoQ5bChs,3414
-isa_model/inference/providers/triton_provider.py,sha256=JRzj15a3HtuaZpLbgPxGfjDubVXzZCecUwfqnjHHa-g,15251
-isa_model/inference/providers/vllm_provider.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-isa_model/inference/providers/yyds_provider.py,sha256=h0rAtEvsq4B1x94WAZkUY6hhbnQ1XycW1zV440Zio7w,3028
+isa_model/inference/providers/openai_provider.py,sha256=8ywUsrvlvC7VY3LNOVJP1IcRwBMi1NvG0PoI0lYo4jM,3881
+isa_model/inference/providers/replicate_provider.py,sha256=qXnK3Yzy5-gaduVJVY8asrIIi-97m4WGUkG963_4ifk,3948
+isa_model/inference/providers/triton_provider.py,sha256=GKlth7cTOx6ERbsXXJ0gDNby3kVGQNULBDt098BXBSU,15258
 isa_model/inference/services/__init__.py,sha256=p-UlEGMnadGUD6zzwfAjf367S2QQ-z1sD6TP-K4EjEM,353
 isa_model/inference/services/base_service.py,sha256=PB6eZp-PynUdo9a0QofvHgrrJLUFYM_FSafTg7fvWrY,3083
-isa_model/inference/services/base_tts_service.py,sha256=UqfcjS9aE5eMURc0bU2nSmUTyn8QxeKEqU5kUwK-W5E,1934
-isa_model/inference/services/audio/runpod_tts_fish_service.py,sha256=CLeV8O68Y_L-ipaSj9aq348HavTpYAFE5yBDfZ_gfA0,7831
-isa_model/inference/services/audio/triton_speech_service.py,sha256=X3P8YsQmuOER7G7-8HaGlvhbuDAmMisV8M7S-ai3cuc,5033
-isa_model/inference/services/audio/whisper_service.py,sha256=fBc1z7YmvZTqn_CPkSDGsJj4emdDnomIBBwOQzHg2EM,6109
-isa_model/inference/services/audio/yyds_audio_service.py,sha256=mitm6o4a6N4wZAWyCl5_1B4-LMzlGDfVT87OP9mso30,2553
-isa_model/inference/services/audio/fish_speech/handler.py,sha256=YuFfxJiu6VvrsYbAzH_hQI1iwTWD6bTgTk8pcKwKWJ4,6673
-isa_model/inference/services/embedding/bge_service.py,sha256=Bx7jScA9RYaQD-9t6QgKeLIY9pmd99JnZCYJgXSrTcQ,6058
-isa_model/inference/services/embedding/ollama_embed_service.py,sha256=zoTHH8Z1IRkDMNciNJghjbV7uzxalIbWc1FYB6-nNoI,3168
-isa_model/inference/services/embedding/ollama_rerank_service.py,sha256=NdlH2fDGbFUdTVtmRLTEcer-f7PcmTDmf0bDkSCTPdI,4276
-isa_model/inference/services/embedding/onnx_rerank_service.py,sha256=GPxezAyZoDpkAdaxuGZ_Fjx3EPpuvSd9b0cQMk_4_8w,2698
-isa_model/inference/services/llm/__init__.py,sha256=hV0WaIb_-fbzzxPgqFihZN5-OcZYVpxYt3bhCJCZl3k,424
-isa_model/inference/services/llm/gemma_service.py,sha256=P8zh-FEYxpiRQJIal3TtZeplxs_GUqMa6C8FvwkQgp8,4396
-isa_model/inference/services/llm/llama_service.py,sha256=XlqVxG_THjNRrQ4cbSeLv3L-Mln5XVqp6gWQF0GtGlo,4396
-isa_model/inference/services/llm/ollama_llm_service.py,sha256=H2_m83taVFQCgIXtiYGfBrCo9YOuKcikzwHmHSf-_HI,4290
-isa_model/inference/services/llm/openai_llm_service.py,sha256=WE9YtjRJepZG756EoluJSr1NLtPTBjV1vqRs3EqufkM,4960
-isa_model/inference/services/llm/replicate_llm_service.py,sha256=ZNAsGrIrTYvj6cguVmqAGtAhW9_FTO8aJj8Xh11kwrQ,6962
-isa_model/inference/services/llm/triton_llm_service.py,sha256=V8XgJ1e9NLenX0SICvoJdGYsqAG7HnK2G_Pqqv5ON68,8102
+isa_model/inference/services/audio/base_stt_service.py,sha256=tIfdRLEppcFEyTEmI8zi8OwMd7wVP423MQDN4iYDEcE,2800
+isa_model/inference/services/audio/base_tts_service.py,sha256=BzZ3JrrLpm4COthNyNrIO2QgP7RZkXDNPEELEKHzIbA,4164
+isa_model/inference/services/audio/openai_tts_service.py,sha256=0R3-AFSAU0sOCx9iXmRSLxgAh6Tm1n887mPK4_MGTgY,2560
+isa_model/inference/services/embedding/ollama_embed_service.py,sha256=qspgGDcLPakG0yirdKDT0r7asgUkMO-soM2J1OaqE6g,3700
+isa_model/inference/services/embedding/openai_embed_service.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+isa_model/inference/services/llm/__init__.py,sha256=Yf6zMjcHs-eGLzl9mRGRf75S_5oBuNxxpc2r3mDw-CE,269
+isa_model/inference/services/llm/base_llm_service.py,sha256=HtlTArjeCywvkzlAp4R4iWkoaOEQg1RdltOZdbeRYFQ,3982
+isa_model/inference/services/llm/ollama_llm_service.py,sha256=WYCuJG16x9RtQm0vFJNxQWSVKFtNnCk8kc3_HZB4UKs,3875
+isa_model/inference/services/llm/openai_llm_service.py,sha256=EuduDfZ-10PEoFrjRr7KmZvxew2B-GQSYlvmqKQcVXA,5394
 isa_model/inference/services/others/table_transformer_service.py,sha256=r74h6QUSwSj6jTt-gRProz9SgwBwKWDe50NR0uqW0ZI,2367
-isa_model/inference/services/vision/__init__.py,sha256=ddHlbtZ_P2LaQHP2LiJc-yOqkXwPVRv6_q3qCjwrkng,274
-isa_model/inference/services/vision/ollama_vision_service.py,sha256=zPe9pRSP82K95WAaikQYDhzCcjKUrxioi3Qsltf9SLI,1997
-isa_model/inference/services/vision/replicate_vision_service.py,sha256=kfjzOIWK7S4FccEzLxFM77EVVkK9V4Rwh1w4EplfL5w,8405
-isa_model/inference/services/vision/triton_vision_service.py,sha256=XUs8bqZ-FN300ECyiw-C-fg1AbvhoespkJhawQkzEzo,7220
-isa_model/inference/services/vision/yyds_vision_service.py,sha256=hiBy_4s1L7k_4p6VX1Hu2GOgdTSheYf7ZgrRoy3Kpmc,2911
+isa_model/inference/services/vision/__init__.py,sha256=t06-E1Fo89MTLJweHx3ai892HHbvnwh5G0ovj0Y-2wk,277
+isa_model/inference/services/vision/ollama_vision_service.py,sha256=aGWMF11YZ-4-6kSkX5af0m1u704OYutO0wwmfWszhBE,2004
+isa_model/inference/services/vision/openai_vision_service.py,sha256=5M182cV-wKCnV_U0CGWu4uFrggo--3YLD_0_FpNW9Ak,2920
+isa_model/inference/services/vision/replicate_image_gen_service.py,sha256=03jhK31C_4p0Xj5V9GiCRlgF-UpNw7aHjCYiCCiqWNw,7826
 isa_model/inference/services/vision/helpers/image_utils.py,sha256=hTZi4MLktETupPIbE-TXMSi1kix6h8UfLiyEIDt2rzA,1751
 isa_model/inference/services/vision/helpers/text_splitter.py,sha256=6AbvcQ7H6MS54B9d9T1XBGg4GhvmKfZqp00lKp9pF-U,1635
 isa_model/inference/utils/conversion/bge_rerank_convert.py,sha256=1dvtxe5-PPCe2Au6SO8F2XaD-xdIoeA4zDTcid2L9FU,2691
@@ -81,6 +54,8 @@ isa_model/scripts/mlflow_manager.py,sha256=7xMN0_wELr1jcALuTW9WeWirRkPZPlE2LlFfZ
 isa_model/scripts/model_registry.py,sha256=7rycPkVk8WHUO3LJaHfdyy5Yq8qmd_4WkGk4wKan-2w,14279
 isa_model/scripts/start_mlflow.py,sha256=3AGKBzByjzbZ56I8w0IOfYnp3V6EU2Lv9NtX9maSqL8,2571
 isa_model/scripts/training_tracker.py,sha256=cnXPi8ip2OK76-aWAOgC-dKx90PqZLEnP6UbHso7Fwc,8080
+isa_model/training/__init__.py,sha256=RQDQ0m8p9YXBXgyyFxADeRA_-m18-wgNyWpjJhJfudU,950
+isa_model/training/factory.py,sha256=iX-OkKRud09F2VfGXKKKj3w9d26kh9Po4FKvxTqmFiI,12581
 isa_model/training/engine/llama_factory/__init__.py,sha256=WCqmUHTidASN4owGDOPSnKeLdG1gbK1MXQrRAzjP0z4,969
 isa_model/training/engine/llama_factory/config.py,sha256=3OvjuXs9IyfcY52pB1SpXSOe0VwmKZvsmy8VK9Ig6Ss,3178
 isa_model/training/engine/llama_factory/data_adapter.py,sha256=krqLp6Jy-IFQ6_M8O3FCtU-qqzUFJ65aNHpVq9C4Zyk,8865
@@ -110,8 +85,8 @@ isa_model/training/llm_model/annotation/tests/test_annotation_flow.py,sha256=DXY
 isa_model/training/llm_model/annotation/tests/test_minio copy.py,sha256=EI-PlH5xttAZF14Z_xn6LjgIJBkvP2qjLcvbX2hc0RM,3946
 isa_model/training/llm_model/annotation/tests/test_minio_upload.py,sha256=fL1eMubwR6L9lYc3zEwlWU9yjJuTsIYi93i0l9QUjm0,1109
 isa_model/training/llm_model/annotation/views/annotation_controller.py,sha256=3VzJ52yI-YIpcaAAXy2qac7sr4hTnFdtn-ZEKTt4IkM,5792
-isa_model-0.1.0.dist-info/licenses/LICENSE,sha256=nNPdMBBVrQz3f7AgKFZuyQgdar9d90Vdw51es-P72Dw,1084
-isa_model-0.1.0.dist-info/METADATA,sha256=qKxBtPmgD-U5QhkbO0LDAbVB0KQb9fxUXH6Hskfkk6g,3004
-isa_model-0.1.0.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
-isa_model-0.1.0.dist-info/top_level.txt,sha256=eHSy_Xb3kNkh2kK11mi1mZh0Wz91AQ5b8k2KFYO-rE8,10
-isa_model-0.1.0.dist-info/RECORD,,
+isa_model-0.1.1.dist-info/licenses/LICENSE,sha256=nNPdMBBVrQz3f7AgKFZuyQgdar9d90Vdw51es-P72Dw,1084
+isa_model-0.1.1.dist-info/METADATA,sha256=hTYSsOkklHerhi4whQn44KV0TOrbrmmNLpqVnVf6Cz4,8105
+isa_model-0.1.1.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+isa_model-0.1.1.dist-info/top_level.txt,sha256=eHSy_Xb3kNkh2kK11mi1mZh0Wz91AQ5b8k2KFYO-rE8,10
+isa_model-0.1.1.dist-info/RECORD,,

isa_model/deployment/mlflow_gateway/__init__.py DELETED Viewed

@@ -1,8 +0,0 @@
-"""
-MLflow Gateway module for IsA Model.
-Replaces the custom adapter with industry-standard MLflow Gateway.
-"""
-from .start_gateway import start_mlflow_gateway
-__all__ = ["start_mlflow_gateway"]

isa_model/deployment/mlflow_gateway/start_gateway.py DELETED Viewed

@@ -1,65 +0,0 @@
-#!/usr/bin/env python3
-"""
-MLflow Gateway starter script.
-Replaces the custom adapter with industry-standard MLflow Gateway.
-Usage:
-    python -m isa_model.deployment.mlflow_gateway.start_gateway
-"""
-import os
-import sys
-import logging
-import subprocess
-from pathlib import Path
-# Configure logging
-logging.basicConfig(
-    level=logging.INFO,
-    format='%(asctime)s - %(name)s - %(levelname)s - %(message)s'
-)
-logger = logging.getLogger(__name__)
-def start_mlflow_gateway():
-    """Start MLflow Gateway with our configuration."""
-    # Get the directory containing this script
-    script_dir = Path(__file__).parent
-    config_file = script_dir / "gateway_config.yaml"
-    if not config_file.exists():
-        logger.error(f"Gateway config file not found: {config_file}")
-        sys.exit(1)
-    # Set environment variables
-    os.environ["MLFLOW_GATEWAY_CONFIG_PATH"] = str(config_file)
-    # MLflow Gateway command
-    cmd = [
-        "mlflow", "gateway", "start",
-        "--config-path", str(config_file),
-        "--host", "0.0.0.0",
-        "--port", "8000"
-    ]
-    logger.info("🚀 Starting MLflow Gateway...")
-    logger.info(f"📁 Config file: {config_file}")
-    logger.info(f"🌐 Server: http://localhost:8000")
-    logger.info(f"📚 Docs: http://localhost:8000/docs")
-    try:
-        # Start the gateway
-        subprocess.run(cmd, check=True)
-    except KeyboardInterrupt:
-        logger.info("MLflow Gateway stopped by user")
-    except subprocess.CalledProcessError as e:
-        logger.error(f"MLflow Gateway failed to start: {e}")
-        sys.exit(1)
-    except Exception as e:
-        logger.error(f"Unexpected error: {e}")
-        sys.exit(1)
-if __name__ == "__main__":
-    start_mlflow_gateway()

isa-model 0.1.0__py3-none-any.whl → 0.1.1__py3-none-any.whl

isa-model 0.1.0__py3-none-any.whl → 0.1.1__py3-none-any.whl