isa-model 0.4.3__tar.gz → 0.4.5__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {isa_model-0.4.3 → isa_model-0.4.5}/PKG-INFO +6 -1
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/config.py +3 -3
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/logging/__init__.py +14 -13
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/models/model_manager.py +1 -69
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/models/model_storage.py +4 -2
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model.egg-info/PKG-INFO +6 -1
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model.egg-info/SOURCES.txt +0 -14
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model.egg-info/requires.txt +6 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/pyproject.toml +9 -1
- isa_model-0.4.3/isa_model/core/logging/influx_logger.py +0 -523
- isa_model-0.4.3/isa_model/core/security/secrets.py +0 -358
- isa_model-0.4.3/isa_model/core/storage/hf_storage.py +0 -419
- isa_model-0.4.3/isa_model/deployment/local/__init__.py +0 -31
- isa_model-0.4.3/isa_model/deployment/local/config.py +0 -248
- isa_model-0.4.3/isa_model/deployment/local/gpu_gateway.py +0 -607
- isa_model-0.4.3/isa_model/deployment/local/health_checker.py +0 -428
- isa_model-0.4.3/isa_model/deployment/local/provider.py +0 -586
- isa_model-0.4.3/isa_model/deployment/local/tensorrt_service.py +0 -621
- isa_model-0.4.3/isa_model/deployment/local/transformers_service.py +0 -644
- isa_model-0.4.3/isa_model/deployment/local/vllm_service.py +0 -527
- isa_model-0.4.3/isa_model/inference/services/custom_model_manager.py +0 -277
- isa_model-0.4.3/isa_model/inference/services/llm/local_llm_service.py +0 -747
- isa_model-0.4.3/isa_model/inference/services/vision/blip_vision_service.py +0 -359
- {isa_model-0.4.3 → isa_model-0.4.5}/MANIFEST.in +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/README.md +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/client.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/cache/redis_cache.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/config/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/config/config_manager.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/database/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/database/direct_db_client.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/database/migration_manager.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/database/migrations.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/database/supabase_client.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/dependencies.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/discovery/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/discovery/consul_discovery.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/logging/loki_logger.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/models/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/models/config_models.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/models/deployment_billing_tracker.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/models/model_billing_tracker.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/models/model_metadata.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/models/model_repo.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/models/model_statistics_tracker.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/models/model_version_manager.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/models/system_models.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/pricing_manager.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/repositories/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/repositories/config_repository.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/resilience/circuit_breaker.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/services/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/services/intelligent_model_selector.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/storage/local_storage.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/types.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/core/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/core/deployment_manager.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/config.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/deployer.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/audio/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/audio/isa_audio_chatTTS_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/audio/isa_audio_fish_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/audio/isa_audio_openvoice_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/audio/isa_audio_service_v2.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/embedding/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/embedding/isa_embed_rerank_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/llm/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/llm/isa_llm_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/video/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/video/isa_video_hunyuan_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/vision/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/vision/isa_vision_ocr_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/vision/isa_vision_qwen25_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/vision/isa_vision_table_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/vision/isa_vision_ui_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/vision/isa_vision_ui_service_optimized.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/vision/simple_auto_deploy_vision_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/models/org-org-acme-corp-tenant-a-service-llm-20250825-225822/tenant-a-service_modal_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/models/org-test-org-123-prefix-test-service-llm-20250825-225822/prefix-test-service_modal_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/models/test-llm-service-llm-20250825-204442/test-llm-service_modal_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/models/test-monitoring-gpt2-llm-20250825-212906/test-monitoring-gpt2_modal_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/models/test-monitoring-gpt2-llm-20250825-213009/test-monitoring-gpt2_modal_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/storage/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/storage/deployment_repository.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/triton/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/triton/config.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/triton/configs/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/triton/provider.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/triton/scripts/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/triton/templates/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/ai_factory.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/base.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/legacy_services/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/legacy_services/model_evaluation.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/legacy_services/model_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/legacy_services/model_serving.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/legacy_services/model_training.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/models/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/models/inference_config.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/models/inference_record.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/models/performance_models.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/repositories/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/repositories/inference_repository.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/audio/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/audio/base_realtime_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/audio/base_stt_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/audio/base_tts_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/audio/isa_tts_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/audio/openai_realtime_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/audio/openai_stt_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/audio/openai_tts_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/audio/replicate_tts_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/base_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/embedding/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/embedding/base_embed_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/embedding/helpers/text_splitter.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/embedding/isa_embed_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/embedding/ollama_embed_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/embedding/openai_embed_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/embedding/resilient_embed_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/embedding/tests/test_embedding.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/img/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/img/base_image_gen_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/img/replicate_image_gen_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/img/services/replicate_face_swap.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/img/services/replicate_flux.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/img/services/replicate_flux_kontext.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/img/services/replicate_sticker_maker.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/img/tests/test_img_client.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/llm/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/llm/base_llm_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/llm/cerebras_llm_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/llm/helpers/llm_adapter.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/llm/helpers/llm_prompts.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/llm/helpers/llm_utils.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/llm/huggingface_llm_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/llm/ollama_llm_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/llm/openai_llm_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/llm/yyds_llm_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/ml/base_ml_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/ml/sklearn_ml_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/vision/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/vision/base_vision_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/vision/disabled/isA_vision_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/vision/helpers/image_utils.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/vision/helpers/vision_prompts.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/vision/isa_vision_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/vision/openai_vision_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/vision/replicate_vision_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/vision/tests/test_ocr_client.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/vision/vgg16_vision_service.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/utils/conversion/bge_rerank_convert.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/utils/conversion/onnx_converter.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/utils/conversion/torch_converter.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/cache_manager.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/dependencies/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/dependencies/auth.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/dependencies/database.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/error_handlers.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/fastapi_server.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/middleware/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/middleware/auth.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/middleware/request_logger.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/middleware/security.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/middleware/tenant_context.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/analytics.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/config.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/deployment_billing.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/deployments.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/gpu_gateway.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/health.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/inference_monitoring.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/llm.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/local_deployments.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/logs.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/settings.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/tenants.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/ui_analysis.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/unified.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/vision.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/webhooks.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/schemas/__init__.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/schemas/common.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/schemas/ui_analysis.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/startup.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/modal_proxy_server.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/utils/gpu_utils.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model.egg-info/dependency_links.txt +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/isa_model.egg-info/top_level.txt +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/setup.cfg +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/setup.py +0 -0
- {isa_model-0.4.3 → isa_model-0.4.5}/tests/test_inference_service.py +0 -0
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: isa_model
|
3
|
-
Version: 0.4.3
|
3
|
+
Version: 0.4.5
|
4
4
|
Summary: Unified AI model serving framework
|
5
5
|
Author: isA_Model Contributors
|
6
6
|
Classifier: Development Status :: 3 - Alpha
|
@@ -89,6 +89,11 @@ Requires-Dist: isa-model[cloud,k8s,monitoring,storage]; extra == "production"
|
|
89
89
|
Provides-Extra: staging
|
90
90
|
Requires-Dist: isa-model[cloud,langchain,monitoring,storage]; extra == "staging"
|
91
91
|
Requires-Dist: python-consul>=1.1.0; extra == "staging"
|
92
|
+
Provides-Extra: staging-minimal
|
93
|
+
Requires-Dist: isa-model[cloud,langchain,storage]; extra == "staging-minimal"
|
94
|
+
Requires-Dist: influxdb-client>=1.36.0; extra == "staging-minimal"
|
95
|
+
Requires-Dist: python-logging-loki>=0.3.1; extra == "staging-minimal"
|
96
|
+
Requires-Dist: python-consul>=1.1.0; extra == "staging-minimal"
|
92
97
|
Provides-Extra: all
|
93
98
|
Requires-Dist: isa-model[audio,cloud,gpu-cloud,k8s,langchain,local,monitoring,storage,training,vision]; extra == "all"
|
94
99
|
|
@@ -54,7 +54,7 @@ class LocalGPUGlobalConfig:
|
|
54
54
|
enable_local_gpu: bool = True
|
55
55
|
auto_detect_gpu: bool = True
|
56
56
|
workspace_dir: str = "./local_deployments"
|
57
|
-
preferred_backend: str = "
|
57
|
+
preferred_backend: str = "api" # cloud api only
|
58
58
|
|
59
59
|
# Default resource settings
|
60
60
|
default_gpu_memory_fraction: float = 0.9
|
@@ -114,7 +114,7 @@ class GlobalConfig:
|
|
114
114
|
local_gpu_memory_fraction: float = 0.9
|
115
115
|
local_workspace_dir: str = "./local_deployments"
|
116
116
|
auto_detect_gpu: bool = True
|
117
|
-
preferred_local_backend: str = "
|
117
|
+
preferred_local_backend: str = "api" # cloud api only
|
118
118
|
|
119
119
|
# Local service defaults
|
120
120
|
local_health_check_interval: int = 30 # seconds
|
@@ -263,7 +263,7 @@ class ConfigManager:
|
|
263
263
|
"enable_local_gpu": os.getenv("ISA_ENABLE_LOCAL_GPU", "true").lower() == "true",
|
264
264
|
"auto_detect_gpu": os.getenv("ISA_AUTO_DETECT_GPU", "true").lower() == "true",
|
265
265
|
"workspace_dir": os.getenv("ISA_LOCAL_WORKSPACE_DIR", "./local_deployments"),
|
266
|
-
"preferred_backend": os.getenv("ISA_PREFERRED_LOCAL_BACKEND", "
|
266
|
+
"preferred_backend": os.getenv("ISA_PREFERRED_LOCAL_BACKEND", "api"),
|
267
267
|
"default_gpu_memory_fraction": float(os.getenv("ISA_GPU_MEMORY_FRACTION", "0.9")),
|
268
268
|
"health_check_interval": int(os.getenv("ISA_LOCAL_HEALTH_CHECK_INTERVAL", "30")),
|
269
269
|
"max_concurrent_services": int(os.getenv("ISA_MAX_CONCURRENT_SERVICES", "3")),
|
@@ -3,21 +3,24 @@ Logging module for ISA Model
|
|
3
3
|
|
4
4
|
Provides comprehensive logging capabilities including:
|
5
5
|
- Loki-based centralized application logging (via loki_logger)
|
6
|
-
-
|
7
|
-
- Real-time monitoring and alerting
|
6
|
+
- Basic inference logging with request tracking
|
8
7
|
|
9
8
|
Architecture:
|
10
9
|
- Loki: General application logs (INFO, WARNING, ERROR, DEBUG)
|
11
|
-
-
|
10
|
+
- Basic logging: Simple request tracking and basic metrics
|
12
11
|
"""
|
13
12
|
|
14
|
-
#
|
15
|
-
|
16
|
-
|
17
|
-
|
18
|
-
|
19
|
-
|
20
|
-
)
|
13
|
+
# Basic inference logging (no external dependencies)
|
14
|
+
import uuid
|
15
|
+
import logging
|
16
|
+
|
17
|
+
def generate_request_id():
|
18
|
+
"""Generate unique request ID for tracking"""
|
19
|
+
return str(uuid.uuid4())
|
20
|
+
|
21
|
+
def get_inference_logger():
|
22
|
+
"""Get basic inference logger"""
|
23
|
+
return logging.getLogger("isa_model.inference")
|
21
24
|
|
22
25
|
# Loki centralized application logging
|
23
26
|
from .loki_logger import (
|
@@ -34,9 +37,7 @@ from .loki_logger import (
|
|
34
37
|
)
|
35
38
|
|
36
39
|
__all__ = [
|
37
|
-
#
|
38
|
-
'InfluxInferenceLogger',
|
39
|
-
'InferenceLogEntry',
|
40
|
+
# Basic inference logging
|
40
41
|
'get_inference_logger',
|
41
42
|
'generate_request_id',
|
42
43
|
|
@@ -2,8 +2,6 @@ from typing import Dict, Optional, List, Any
|
|
2
2
|
import logging
|
3
3
|
from pathlib import Path
|
4
4
|
from datetime import datetime
|
5
|
-
from huggingface_hub import hf_hub_download, snapshot_download
|
6
|
-
from huggingface_hub.errors import HfHubHTTPError
|
7
5
|
from .model_storage import ModelStorage, LocalModelStorage
|
8
6
|
from .model_repo import ModelRegistry, ModelType, ModelCapability
|
9
7
|
from .model_billing_tracker import ModelBillingTracker, ModelOperationType
|
@@ -102,73 +100,7 @@ class ModelManager:
|
|
102
100
|
logger.warning(f"Failed to find cheapest model for {provider}: {e}")
|
103
101
|
return None
|
104
102
|
|
105
|
-
|
106
|
-
model_id: str,
|
107
|
-
repo_id: str,
|
108
|
-
model_type: ModelType,
|
109
|
-
capabilities: List[ModelCapability],
|
110
|
-
revision: Optional[str] = None,
|
111
|
-
force_download: bool = False) -> Optional[Path]:
|
112
|
-
"""
|
113
|
-
Get model files, downloading if necessary
|
114
|
-
|
115
|
-
Args:
|
116
|
-
model_id: Unique identifier for the model
|
117
|
-
repo_id: Hugging Face repository ID
|
118
|
-
model_type: Type of model (LLM, embedding, etc.)
|
119
|
-
capabilities: List of model capabilities
|
120
|
-
revision: Specific model version/tag
|
121
|
-
force_download: Force re-download even if cached
|
122
|
-
|
123
|
-
Returns:
|
124
|
-
Path to the model files or None if failed
|
125
|
-
"""
|
126
|
-
# Check if model is already downloaded
|
127
|
-
if not force_download:
|
128
|
-
model_path = await self.storage.load_model(model_id)
|
129
|
-
if model_path:
|
130
|
-
logger.info(f"Using cached model {model_id}")
|
131
|
-
return model_path
|
132
|
-
|
133
|
-
try:
|
134
|
-
# Download model files
|
135
|
-
logger.info(f"Downloading model {model_id} from {repo_id}")
|
136
|
-
model_dir = Path(f"./models/temp/{model_id}")
|
137
|
-
model_dir.mkdir(parents=True, exist_ok=True)
|
138
|
-
|
139
|
-
snapshot_download(
|
140
|
-
repo_id=repo_id,
|
141
|
-
revision=revision,
|
142
|
-
local_dir=model_dir,
|
143
|
-
local_dir_use_symlinks=False
|
144
|
-
)
|
145
|
-
|
146
|
-
# Save model and metadata
|
147
|
-
metadata = {
|
148
|
-
"repo_id": repo_id,
|
149
|
-
"revision": revision,
|
150
|
-
"downloaded_at": str(Path(model_dir).stat().st_mtime)
|
151
|
-
}
|
152
|
-
|
153
|
-
# Register model
|
154
|
-
self.registry.register_model(
|
155
|
-
model_id=model_id,
|
156
|
-
model_type=model_type,
|
157
|
-
capabilities=capabilities,
|
158
|
-
metadata=metadata
|
159
|
-
)
|
160
|
-
|
161
|
-
# Save model files
|
162
|
-
await self.storage.save_model(model_id, str(model_dir), metadata)
|
163
|
-
|
164
|
-
return await self.storage.load_model(model_id)
|
165
|
-
|
166
|
-
except HfHubHTTPError as e:
|
167
|
-
logger.error(f"Failed to download model {model_id}: {e}")
|
168
|
-
return None
|
169
|
-
except Exception as e:
|
170
|
-
logger.error(f"Unexpected error downloading model {model_id}: {e}")
|
171
|
-
return None
|
103
|
+
# Local model download functionality removed - use cloud API services only
|
172
104
|
|
173
105
|
async def list_models(self) -> List[Dict[str, Any]]:
|
174
106
|
"""List all downloaded models with their metadata"""
|
@@ -39,11 +39,13 @@ class ModelStorage(ABC):
|
|
39
39
|
class LocalModelStorage(ModelStorage):
|
40
40
|
"""Local file system based model storage"""
|
41
41
|
|
42
|
-
def __init__(self, base_dir: str = "./models"):
|
42
|
+
def __init__(self, base_dir: str = "./models", auto_create: bool = False):
|
43
43
|
self.base_dir = Path(base_dir)
|
44
44
|
self.models_dir = self.base_dir / "models"
|
45
45
|
self.metadata_file = self.base_dir / "model_metadata.json"
|
46
|
-
self._ensure_directories()
|
46
|
+
self.auto_create = auto_create
|
47
|
+
if auto_create:
|
48
|
+
self._ensure_directories()
|
47
49
|
self._load_metadata()
|
48
50
|
|
49
51
|
def _ensure_directories(self):
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: isa_model
|
3
|
-
Version: 0.4.3
|
3
|
+
Version: 0.4.5
|
4
4
|
Summary: Unified AI model serving framework
|
5
5
|
Author: isA_Model Contributors
|
6
6
|
Classifier: Development Status :: 3 - Alpha
|
@@ -89,6 +89,11 @@ Requires-Dist: isa-model[cloud,k8s,monitoring,storage]; extra == "production"
|
|
89
89
|
Provides-Extra: staging
|
90
90
|
Requires-Dist: isa-model[cloud,langchain,monitoring,storage]; extra == "staging"
|
91
91
|
Requires-Dist: python-consul>=1.1.0; extra == "staging"
|
92
|
+
Provides-Extra: staging-minimal
|
93
|
+
Requires-Dist: isa-model[cloud,langchain,storage]; extra == "staging-minimal"
|
94
|
+
Requires-Dist: influxdb-client>=1.36.0; extra == "staging-minimal"
|
95
|
+
Requires-Dist: python-logging-loki>=0.3.1; extra == "staging-minimal"
|
96
|
+
Requires-Dist: python-consul>=1.1.0; extra == "staging-minimal"
|
92
97
|
Provides-Extra: all
|
93
98
|
Requires-Dist: isa-model[audio,cloud,gpu-cloud,k8s,langchain,local,monitoring,storage,training,vision]; extra == "all"
|
94
99
|
|
@@ -24,7 +24,6 @@ isa_model/core/database/supabase_client.py
|
|
24
24
|
isa_model/core/discovery/__init__.py
|
25
25
|
isa_model/core/discovery/consul_discovery.py
|
26
26
|
isa_model/core/logging/__init__.py
|
27
|
-
isa_model/core/logging/influx_logger.py
|
28
27
|
isa_model/core/logging/loki_logger.py
|
29
28
|
isa_model/core/models/__init__.py
|
30
29
|
isa_model/core/models/config_models.py
|
@@ -40,22 +39,12 @@ isa_model/core/models/system_models.py
|
|
40
39
|
isa_model/core/repositories/__init__.py
|
41
40
|
isa_model/core/repositories/config_repository.py
|
42
41
|
isa_model/core/resilience/circuit_breaker.py
|
43
|
-
isa_model/core/security/secrets.py
|
44
42
|
isa_model/core/services/__init__.py
|
45
43
|
isa_model/core/services/intelligent_model_selector.py
|
46
|
-
isa_model/core/storage/hf_storage.py
|
47
44
|
isa_model/core/storage/local_storage.py
|
48
45
|
isa_model/deployment/__init__.py
|
49
46
|
isa_model/deployment/core/__init__.py
|
50
47
|
isa_model/deployment/core/deployment_manager.py
|
51
|
-
isa_model/deployment/local/__init__.py
|
52
|
-
isa_model/deployment/local/config.py
|
53
|
-
isa_model/deployment/local/gpu_gateway.py
|
54
|
-
isa_model/deployment/local/health_checker.py
|
55
|
-
isa_model/deployment/local/provider.py
|
56
|
-
isa_model/deployment/local/tensorrt_service.py
|
57
|
-
isa_model/deployment/local/transformers_service.py
|
58
|
-
isa_model/deployment/local/vllm_service.py
|
59
48
|
isa_model/deployment/modal/__init__.py
|
60
49
|
isa_model/deployment/modal/config.py
|
61
50
|
isa_model/deployment/modal/deployer.py
|
@@ -107,7 +96,6 @@ isa_model/inference/repositories/__init__.py
|
|
107
96
|
isa_model/inference/repositories/inference_repository.py
|
108
97
|
isa_model/inference/services/__init__.py
|
109
98
|
isa_model/inference/services/base_service.py
|
110
|
-
isa_model/inference/services/custom_model_manager.py
|
111
99
|
isa_model/inference/services/audio/__init__.py
|
112
100
|
isa_model/inference/services/audio/base_realtime_service.py
|
113
101
|
isa_model/inference/services/audio/base_stt_service.py
|
@@ -137,7 +125,6 @@ isa_model/inference/services/llm/__init__.py
|
|
137
125
|
isa_model/inference/services/llm/base_llm_service.py
|
138
126
|
isa_model/inference/services/llm/cerebras_llm_service.py
|
139
127
|
isa_model/inference/services/llm/huggingface_llm_service.py
|
140
|
-
isa_model/inference/services/llm/local_llm_service.py
|
141
128
|
isa_model/inference/services/llm/ollama_llm_service.py
|
142
129
|
isa_model/inference/services/llm/openai_llm_service.py
|
143
130
|
isa_model/inference/services/llm/yyds_llm_service.py
|
@@ -148,7 +135,6 @@ isa_model/inference/services/ml/base_ml_service.py
|
|
148
135
|
isa_model/inference/services/ml/sklearn_ml_service.py
|
149
136
|
isa_model/inference/services/vision/__init__.py
|
150
137
|
isa_model/inference/services/vision/base_vision_service.py
|
151
|
-
isa_model/inference/services/vision/blip_vision_service.py
|
152
138
|
isa_model/inference/services/vision/isa_vision_service.py
|
153
139
|
isa_model/inference/services/vision/openai_vision_service.py
|
154
140
|
isa_model/inference/services/vision/replicate_vision_service.py
|
@@ -83,6 +83,12 @@ isa-model[cloud,k8s,monitoring,storage]
|
|
83
83
|
isa-model[cloud,langchain,monitoring,storage]
|
84
84
|
python-consul>=1.1.0
|
85
85
|
|
86
|
+
[staging-minimal]
|
87
|
+
isa-model[cloud,langchain,storage]
|
88
|
+
influxdb-client>=1.36.0
|
89
|
+
python-logging-loki>=0.3.1
|
90
|
+
python-consul>=1.1.0
|
91
|
+
|
86
92
|
[storage]
|
87
93
|
boto3>=1.26.0
|
88
94
|
google-cloud-storage>=2.7.0
|
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
4
4
|
|
5
5
|
[project]
|
6
6
|
name = "isa_model"
|
7
|
-
version = "0.4.3"
|
7
|
+
version = "0.4.5"
|
8
8
|
description = "Unified AI model serving framework"
|
9
9
|
authors = [{name = "isA_Model Contributors"}]
|
10
10
|
readme = "README.md"
|
@@ -152,6 +152,14 @@ staging = [
|
|
152
152
|
"python-consul>=1.1.0", # Service discovery
|
153
153
|
]
|
154
154
|
|
155
|
+
# Ultra-lightweight staging (no MLflow monitoring)
|
156
|
+
staging-minimal = [
|
157
|
+
"isa-model[cloud,storage,langchain]",
|
158
|
+
"influxdb-client>=1.36.0", # Basic logging only
|
159
|
+
"python-logging-loki>=0.3.1", # Centralized logging
|
160
|
+
"python-consul>=1.1.0", # Service discovery
|
161
|
+
]
|
162
|
+
|
155
163
|
all = [
|
156
164
|
"isa-model[cloud,local,training,audio,vision,langchain,storage,monitoring,k8s,gpu-cloud]",
|
157
165
|
]
|