isa-model 0.4.3__tar.gz → 0.4.5__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (201)
  1. {isa_model-0.4.3 → isa_model-0.4.5}/PKG-INFO +6 -1
  2. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/config.py +3 -3
  3. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/logging/__init__.py +14 -13
  4. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/models/model_manager.py +1 -69
  5. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/models/model_storage.py +4 -2
  6. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model.egg-info/PKG-INFO +6 -1
  7. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model.egg-info/SOURCES.txt +0 -14
  8. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model.egg-info/requires.txt +6 -0
  9. {isa_model-0.4.3 → isa_model-0.4.5}/pyproject.toml +9 -1
  10. isa_model-0.4.3/isa_model/core/logging/influx_logger.py +0 -523
  11. isa_model-0.4.3/isa_model/core/security/secrets.py +0 -358
  12. isa_model-0.4.3/isa_model/core/storage/hf_storage.py +0 -419
  13. isa_model-0.4.3/isa_model/deployment/local/__init__.py +0 -31
  14. isa_model-0.4.3/isa_model/deployment/local/config.py +0 -248
  15. isa_model-0.4.3/isa_model/deployment/local/gpu_gateway.py +0 -607
  16. isa_model-0.4.3/isa_model/deployment/local/health_checker.py +0 -428
  17. isa_model-0.4.3/isa_model/deployment/local/provider.py +0 -586
  18. isa_model-0.4.3/isa_model/deployment/local/tensorrt_service.py +0 -621
  19. isa_model-0.4.3/isa_model/deployment/local/transformers_service.py +0 -644
  20. isa_model-0.4.3/isa_model/deployment/local/vllm_service.py +0 -527
  21. isa_model-0.4.3/isa_model/inference/services/custom_model_manager.py +0 -277
  22. isa_model-0.4.3/isa_model/inference/services/llm/local_llm_service.py +0 -747
  23. isa_model-0.4.3/isa_model/inference/services/vision/blip_vision_service.py +0 -359
  24. {isa_model-0.4.3 → isa_model-0.4.5}/MANIFEST.in +0 -0
  25. {isa_model-0.4.3 → isa_model-0.4.5}/README.md +0 -0
  26. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/__init__.py +0 -0
  27. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/client.py +0 -0
  28. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/cache/redis_cache.py +0 -0
  29. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/config/__init__.py +0 -0
  30. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/config/config_manager.py +0 -0
  31. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/database/__init__.py +0 -0
  32. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/database/direct_db_client.py +0 -0
  33. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/database/migration_manager.py +0 -0
  34. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/database/migrations.py +0 -0
  35. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/database/supabase_client.py +0 -0
  36. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/dependencies.py +0 -0
  37. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/discovery/__init__.py +0 -0
  38. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/discovery/consul_discovery.py +0 -0
  39. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/logging/loki_logger.py +0 -0
  40. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/models/__init__.py +0 -0
  41. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/models/config_models.py +0 -0
  42. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/models/deployment_billing_tracker.py +0 -0
  43. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/models/model_billing_tracker.py +0 -0
  44. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/models/model_metadata.py +0 -0
  45. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/models/model_repo.py +0 -0
  46. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/models/model_statistics_tracker.py +0 -0
  47. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/models/model_version_manager.py +0 -0
  48. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/models/system_models.py +0 -0
  49. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/pricing_manager.py +0 -0
  50. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/repositories/__init__.py +0 -0
  51. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/repositories/config_repository.py +0 -0
  52. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/resilience/circuit_breaker.py +0 -0
  53. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/services/__init__.py +0 -0
  54. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/services/intelligent_model_selector.py +0 -0
  55. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/storage/local_storage.py +0 -0
  56. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/core/types.py +0 -0
  57. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/__init__.py +0 -0
  58. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/core/__init__.py +0 -0
  59. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/core/deployment_manager.py +0 -0
  60. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/__init__.py +0 -0
  61. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/config.py +0 -0
  62. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/deployer.py +0 -0
  63. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/__init__.py +0 -0
  64. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/audio/__init__.py +0 -0
  65. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/audio/isa_audio_chatTTS_service.py +0 -0
  66. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/audio/isa_audio_fish_service.py +0 -0
  67. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/audio/isa_audio_openvoice_service.py +0 -0
  68. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/audio/isa_audio_service_v2.py +0 -0
  69. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/embedding/__init__.py +0 -0
  70. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/embedding/isa_embed_rerank_service.py +0 -0
  71. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/llm/__init__.py +0 -0
  72. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/llm/isa_llm_service.py +0 -0
  73. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/video/__init__.py +0 -0
  74. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/video/isa_video_hunyuan_service.py +0 -0
  75. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/vision/__init__.py +0 -0
  76. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/vision/isa_vision_ocr_service.py +0 -0
  77. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/vision/isa_vision_qwen25_service.py +0 -0
  78. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/vision/isa_vision_table_service.py +0 -0
  79. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/vision/isa_vision_ui_service.py +0 -0
  80. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/vision/isa_vision_ui_service_optimized.py +0 -0
  81. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/modal/services/vision/simple_auto_deploy_vision_service.py +0 -0
  82. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/models/org-org-acme-corp-tenant-a-service-llm-20250825-225822/tenant-a-service_modal_service.py +0 -0
  83. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/models/org-test-org-123-prefix-test-service-llm-20250825-225822/prefix-test-service_modal_service.py +0 -0
  84. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/models/test-llm-service-llm-20250825-204442/test-llm-service_modal_service.py +0 -0
  85. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/models/test-monitoring-gpt2-llm-20250825-212906/test-monitoring-gpt2_modal_service.py +0 -0
  86. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/models/test-monitoring-gpt2-llm-20250825-213009/test-monitoring-gpt2_modal_service.py +0 -0
  87. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/storage/__init__.py +0 -0
  88. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/storage/deployment_repository.py +0 -0
  89. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/triton/__init__.py +0 -0
  90. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/triton/config.py +0 -0
  91. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/triton/configs/__init__.py +0 -0
  92. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/triton/provider.py +0 -0
  93. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/triton/scripts/__init__.py +0 -0
  94. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/deployment/triton/templates/__init__.py +0 -0
  95. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/__init__.py +0 -0
  96. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/ai_factory.py +0 -0
  97. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/base.py +0 -0
  98. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/legacy_services/__init__.py +0 -0
  99. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/legacy_services/model_evaluation.py +0 -0
  100. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/legacy_services/model_service.py +0 -0
  101. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/legacy_services/model_serving.py +0 -0
  102. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/legacy_services/model_training.py +0 -0
  103. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/models/__init__.py +0 -0
  104. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/models/inference_config.py +0 -0
  105. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/models/inference_record.py +0 -0
  106. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/models/performance_models.py +0 -0
  107. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/repositories/__init__.py +0 -0
  108. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/repositories/inference_repository.py +0 -0
  109. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/__init__.py +0 -0
  110. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/audio/__init__.py +0 -0
  111. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/audio/base_realtime_service.py +0 -0
  112. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/audio/base_stt_service.py +0 -0
  113. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/audio/base_tts_service.py +0 -0
  114. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/audio/isa_tts_service.py +0 -0
  115. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/audio/openai_realtime_service.py +0 -0
  116. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/audio/openai_stt_service.py +0 -0
  117. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/audio/openai_tts_service.py +0 -0
  118. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/audio/replicate_tts_service.py +0 -0
  119. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/base_service.py +0 -0
  120. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/embedding/__init__.py +0 -0
  121. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/embedding/base_embed_service.py +0 -0
  122. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/embedding/helpers/text_splitter.py +0 -0
  123. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/embedding/isa_embed_service.py +0 -0
  124. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/embedding/ollama_embed_service.py +0 -0
  125. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/embedding/openai_embed_service.py +0 -0
  126. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/embedding/resilient_embed_service.py +0 -0
  127. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/embedding/tests/test_embedding.py +0 -0
  128. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/img/__init__.py +0 -0
  129. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/img/base_image_gen_service.py +0 -0
  130. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/img/replicate_image_gen_service.py +0 -0
  131. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/img/services/replicate_face_swap.py +0 -0
  132. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/img/services/replicate_flux.py +0 -0
  133. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/img/services/replicate_flux_kontext.py +0 -0
  134. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/img/services/replicate_sticker_maker.py +0 -0
  135. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/img/tests/test_img_client.py +0 -0
  136. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/llm/__init__.py +0 -0
  137. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/llm/base_llm_service.py +0 -0
  138. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/llm/cerebras_llm_service.py +0 -0
  139. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/llm/helpers/llm_adapter.py +0 -0
  140. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/llm/helpers/llm_prompts.py +0 -0
  141. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/llm/helpers/llm_utils.py +0 -0
  142. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/llm/huggingface_llm_service.py +0 -0
  143. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/llm/ollama_llm_service.py +0 -0
  144. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/llm/openai_llm_service.py +0 -0
  145. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/llm/yyds_llm_service.py +0 -0
  146. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/ml/base_ml_service.py +0 -0
  147. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/ml/sklearn_ml_service.py +0 -0
  148. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/vision/__init__.py +0 -0
  149. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/vision/base_vision_service.py +0 -0
  150. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/vision/disabled/isA_vision_service.py +0 -0
  151. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/vision/helpers/image_utils.py +0 -0
  152. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/vision/helpers/vision_prompts.py +0 -0
  153. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/vision/isa_vision_service.py +0 -0
  154. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/vision/openai_vision_service.py +0 -0
  155. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/vision/replicate_vision_service.py +0 -0
  156. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/vision/tests/test_ocr_client.py +0 -0
  157. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/services/vision/vgg16_vision_service.py +0 -0
  158. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/utils/conversion/bge_rerank_convert.py +0 -0
  159. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/utils/conversion/onnx_converter.py +0 -0
  160. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/inference/utils/conversion/torch_converter.py +0 -0
  161. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/__init__.py +0 -0
  162. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/__init__.py +0 -0
  163. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/cache_manager.py +0 -0
  164. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/dependencies/__init__.py +0 -0
  165. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/dependencies/auth.py +0 -0
  166. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/dependencies/database.py +0 -0
  167. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/error_handlers.py +0 -0
  168. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/fastapi_server.py +0 -0
  169. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/middleware/__init__.py +0 -0
  170. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/middleware/auth.py +0 -0
  171. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/middleware/request_logger.py +0 -0
  172. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/middleware/security.py +0 -0
  173. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/middleware/tenant_context.py +0 -0
  174. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/__init__.py +0 -0
  175. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/analytics.py +0 -0
  176. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/config.py +0 -0
  177. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/deployment_billing.py +0 -0
  178. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/deployments.py +0 -0
  179. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/gpu_gateway.py +0 -0
  180. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/health.py +0 -0
  181. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/inference_monitoring.py +0 -0
  182. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/llm.py +0 -0
  183. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/local_deployments.py +0 -0
  184. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/logs.py +0 -0
  185. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/settings.py +0 -0
  186. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/tenants.py +0 -0
  187. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/ui_analysis.py +0 -0
  188. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/unified.py +0 -0
  189. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/vision.py +0 -0
  190. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/routes/webhooks.py +0 -0
  191. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/schemas/__init__.py +0 -0
  192. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/schemas/common.py +0 -0
  193. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/schemas/ui_analysis.py +0 -0
  194. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/api/startup.py +0 -0
  195. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/serving/modal_proxy_server.py +0 -0
  196. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model/utils/gpu_utils.py +0 -0
  197. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model.egg-info/dependency_links.txt +0 -0
  198. {isa_model-0.4.3 → isa_model-0.4.5}/isa_model.egg-info/top_level.txt +0 -0
  199. {isa_model-0.4.3 → isa_model-0.4.5}/setup.cfg +0 -0
  200. {isa_model-0.4.3 → isa_model-0.4.5}/setup.py +0 -0
  201. {isa_model-0.4.3 → isa_model-0.4.5}/tests/test_inference_service.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: isa_model
3
- Version: 0.4.3
3
+ Version: 0.4.5
4
4
  Summary: Unified AI model serving framework
5
5
  Author: isA_Model Contributors
6
6
  Classifier: Development Status :: 3 - Alpha
@@ -89,6 +89,11 @@ Requires-Dist: isa-model[cloud,k8s,monitoring,storage]; extra == "production"
89
89
  Provides-Extra: staging
90
90
  Requires-Dist: isa-model[cloud,langchain,monitoring,storage]; extra == "staging"
91
91
  Requires-Dist: python-consul>=1.1.0; extra == "staging"
92
+ Provides-Extra: staging-minimal
93
+ Requires-Dist: isa-model[cloud,langchain,storage]; extra == "staging-minimal"
94
+ Requires-Dist: influxdb-client>=1.36.0; extra == "staging-minimal"
95
+ Requires-Dist: python-logging-loki>=0.3.1; extra == "staging-minimal"
96
+ Requires-Dist: python-consul>=1.1.0; extra == "staging-minimal"
92
97
  Provides-Extra: all
93
98
  Requires-Dist: isa-model[audio,cloud,gpu-cloud,k8s,langchain,local,monitoring,storage,training,vision]; extra == "all"
94
99
 
@@ -54,7 +54,7 @@ class LocalGPUGlobalConfig:
54
54
  enable_local_gpu: bool = True
55
55
  auto_detect_gpu: bool = True
56
56
  workspace_dir: str = "./local_deployments"
57
- preferred_backend: str = "transformers" # vllm, tensorrt_llm, transformers
57
+ preferred_backend: str = "api" # cloud api only
58
58
 
59
59
  # Default resource settings
60
60
  default_gpu_memory_fraction: float = 0.9
@@ -114,7 +114,7 @@ class GlobalConfig:
114
114
  local_gpu_memory_fraction: float = 0.9
115
115
  local_workspace_dir: str = "./local_deployments"
116
116
  auto_detect_gpu: bool = True
117
- preferred_local_backend: str = "transformers" # vllm, tensorrt_llm, transformers
117
+ preferred_local_backend: str = "api" # cloud api only
118
118
 
119
119
  # Local service defaults
120
120
  local_health_check_interval: int = 30 # seconds
@@ -263,7 +263,7 @@ class ConfigManager:
263
263
  "enable_local_gpu": os.getenv("ISA_ENABLE_LOCAL_GPU", "true").lower() == "true",
264
264
  "auto_detect_gpu": os.getenv("ISA_AUTO_DETECT_GPU", "true").lower() == "true",
265
265
  "workspace_dir": os.getenv("ISA_LOCAL_WORKSPACE_DIR", "./local_deployments"),
266
- "preferred_backend": os.getenv("ISA_PREFERRED_LOCAL_BACKEND", "transformers"),
266
+ "preferred_backend": os.getenv("ISA_PREFERRED_LOCAL_BACKEND", "api"),
267
267
  "default_gpu_memory_fraction": float(os.getenv("ISA_GPU_MEMORY_FRACTION", "0.9")),
268
268
  "health_check_interval": int(os.getenv("ISA_LOCAL_HEALTH_CHECK_INTERVAL", "30")),
269
269
  "max_concurrent_services": int(os.getenv("ISA_MAX_CONCURRENT_SERVICES", "3")),
@@ -3,21 +3,24 @@ Logging module for ISA Model
3
3
 
4
4
  Provides comprehensive logging capabilities including:
5
5
  - Loki-based centralized application logging (via loki_logger)
6
- - InfluxDB-based inference metrics logging (via influx_logger)
7
- - Real-time monitoring and alerting
6
+ - Basic inference logging with request tracking
8
7
 
9
8
  Architecture:
10
9
  - Loki: General application logs (INFO, WARNING, ERROR, DEBUG)
11
- - InfluxDB: Inference metrics (tokens, costs, performance data)
10
+ - Basic logging: Simple request tracking and basic metrics
12
11
  """
13
12
 
14
- # InfluxDB inference metrics logging
15
- from .influx_logger import (
16
- InfluxInferenceLogger,
17
- InferenceLogEntry,
18
- get_inference_logger,
19
- generate_request_id
20
- )
13
+ # Basic inference logging (no external dependencies)
14
+ import uuid
15
+ import logging
16
+
17
+ def generate_request_id():
18
+ """Generate unique request ID for tracking"""
19
+ return str(uuid.uuid4())
20
+
21
+ def get_inference_logger():
22
+ """Get basic inference logger"""
23
+ return logging.getLogger("isa_model.inference")
21
24
 
22
25
  # Loki centralized application logging
23
26
  from .loki_logger import (
@@ -34,9 +37,7 @@ from .loki_logger import (
34
37
  )
35
38
 
36
39
  __all__ = [
37
- # InfluxDB inference logging
38
- 'InfluxInferenceLogger',
39
- 'InferenceLogEntry',
40
+ # Basic inference logging
40
41
  'get_inference_logger',
41
42
  'generate_request_id',
42
43
 
@@ -2,8 +2,6 @@ from typing import Dict, Optional, List, Any
2
2
  import logging
3
3
  from pathlib import Path
4
4
  from datetime import datetime
5
- from huggingface_hub import hf_hub_download, snapshot_download
6
- from huggingface_hub.errors import HfHubHTTPError
7
5
  from .model_storage import ModelStorage, LocalModelStorage
8
6
  from .model_repo import ModelRegistry, ModelType, ModelCapability
9
7
  from .model_billing_tracker import ModelBillingTracker, ModelOperationType
@@ -102,73 +100,7 @@ class ModelManager:
102
100
  logger.warning(f"Failed to find cheapest model for {provider}: {e}")
103
101
  return None
104
102
 
105
- async def get_model(self,
106
- model_id: str,
107
- repo_id: str,
108
- model_type: ModelType,
109
- capabilities: List[ModelCapability],
110
- revision: Optional[str] = None,
111
- force_download: bool = False) -> Optional[Path]:
112
- """
113
- Get model files, downloading if necessary
114
-
115
- Args:
116
- model_id: Unique identifier for the model
117
- repo_id: Hugging Face repository ID
118
- model_type: Type of model (LLM, embedding, etc.)
119
- capabilities: List of model capabilities
120
- revision: Specific model version/tag
121
- force_download: Force re-download even if cached
122
-
123
- Returns:
124
- Path to the model files or None if failed
125
- """
126
- # Check if model is already downloaded
127
- if not force_download:
128
- model_path = await self.storage.load_model(model_id)
129
- if model_path:
130
- logger.info(f"Using cached model {model_id}")
131
- return model_path
132
-
133
- try:
134
- # Download model files
135
- logger.info(f"Downloading model {model_id} from {repo_id}")
136
- model_dir = Path(f"./models/temp/{model_id}")
137
- model_dir.mkdir(parents=True, exist_ok=True)
138
-
139
- snapshot_download(
140
- repo_id=repo_id,
141
- revision=revision,
142
- local_dir=model_dir,
143
- local_dir_use_symlinks=False
144
- )
145
-
146
- # Save model and metadata
147
- metadata = {
148
- "repo_id": repo_id,
149
- "revision": revision,
150
- "downloaded_at": str(Path(model_dir).stat().st_mtime)
151
- }
152
-
153
- # Register model
154
- self.registry.register_model(
155
- model_id=model_id,
156
- model_type=model_type,
157
- capabilities=capabilities,
158
- metadata=metadata
159
- )
160
-
161
- # Save model files
162
- await self.storage.save_model(model_id, str(model_dir), metadata)
163
-
164
- return await self.storage.load_model(model_id)
165
-
166
- except HfHubHTTPError as e:
167
- logger.error(f"Failed to download model {model_id}: {e}")
168
- return None
169
- except Exception as e:
170
- logger.error(f"Unexpected error downloading model {model_id}: {e}")
171
- return None
103
+ # Local model download functionality removed - use cloud API services only
172
104
 
173
105
  async def list_models(self) -> List[Dict[str, Any]]:
174
106
  """List all downloaded models with their metadata"""
@@ -39,11 +39,13 @@ class ModelStorage(ABC):
39
39
  class LocalModelStorage(ModelStorage):
40
40
  """Local file system based model storage"""
41
41
 
42
- def __init__(self, base_dir: str = "./models"):
42
+ def __init__(self, base_dir: str = "./models", auto_create: bool = False):
43
43
  self.base_dir = Path(base_dir)
44
44
  self.models_dir = self.base_dir / "models"
45
45
  self.metadata_file = self.base_dir / "model_metadata.json"
46
- self._ensure_directories()
46
+ self.auto_create = auto_create
47
+ if auto_create:
48
+ self._ensure_directories()
47
49
  self._load_metadata()
48
50
 
49
51
  def _ensure_directories(self):
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: isa_model
3
- Version: 0.4.3
3
+ Version: 0.4.5
4
4
  Summary: Unified AI model serving framework
5
5
  Author: isA_Model Contributors
6
6
  Classifier: Development Status :: 3 - Alpha
@@ -89,6 +89,11 @@ Requires-Dist: isa-model[cloud,k8s,monitoring,storage]; extra == "production"
89
89
  Provides-Extra: staging
90
90
  Requires-Dist: isa-model[cloud,langchain,monitoring,storage]; extra == "staging"
91
91
  Requires-Dist: python-consul>=1.1.0; extra == "staging"
92
+ Provides-Extra: staging-minimal
93
+ Requires-Dist: isa-model[cloud,langchain,storage]; extra == "staging-minimal"
94
+ Requires-Dist: influxdb-client>=1.36.0; extra == "staging-minimal"
95
+ Requires-Dist: python-logging-loki>=0.3.1; extra == "staging-minimal"
96
+ Requires-Dist: python-consul>=1.1.0; extra == "staging-minimal"
92
97
  Provides-Extra: all
93
98
  Requires-Dist: isa-model[audio,cloud,gpu-cloud,k8s,langchain,local,monitoring,storage,training,vision]; extra == "all"
94
99
 
@@ -24,7 +24,6 @@ isa_model/core/database/supabase_client.py
24
24
  isa_model/core/discovery/__init__.py
25
25
  isa_model/core/discovery/consul_discovery.py
26
26
  isa_model/core/logging/__init__.py
27
- isa_model/core/logging/influx_logger.py
28
27
  isa_model/core/logging/loki_logger.py
29
28
  isa_model/core/models/__init__.py
30
29
  isa_model/core/models/config_models.py
@@ -40,22 +39,12 @@ isa_model/core/models/system_models.py
40
39
  isa_model/core/repositories/__init__.py
41
40
  isa_model/core/repositories/config_repository.py
42
41
  isa_model/core/resilience/circuit_breaker.py
43
- isa_model/core/security/secrets.py
44
42
  isa_model/core/services/__init__.py
45
43
  isa_model/core/services/intelligent_model_selector.py
46
- isa_model/core/storage/hf_storage.py
47
44
  isa_model/core/storage/local_storage.py
48
45
  isa_model/deployment/__init__.py
49
46
  isa_model/deployment/core/__init__.py
50
47
  isa_model/deployment/core/deployment_manager.py
51
- isa_model/deployment/local/__init__.py
52
- isa_model/deployment/local/config.py
53
- isa_model/deployment/local/gpu_gateway.py
54
- isa_model/deployment/local/health_checker.py
55
- isa_model/deployment/local/provider.py
56
- isa_model/deployment/local/tensorrt_service.py
57
- isa_model/deployment/local/transformers_service.py
58
- isa_model/deployment/local/vllm_service.py
59
48
  isa_model/deployment/modal/__init__.py
60
49
  isa_model/deployment/modal/config.py
61
50
  isa_model/deployment/modal/deployer.py
@@ -107,7 +96,6 @@ isa_model/inference/repositories/__init__.py
107
96
  isa_model/inference/repositories/inference_repository.py
108
97
  isa_model/inference/services/__init__.py
109
98
  isa_model/inference/services/base_service.py
110
- isa_model/inference/services/custom_model_manager.py
111
99
  isa_model/inference/services/audio/__init__.py
112
100
  isa_model/inference/services/audio/base_realtime_service.py
113
101
  isa_model/inference/services/audio/base_stt_service.py
@@ -137,7 +125,6 @@ isa_model/inference/services/llm/__init__.py
137
125
  isa_model/inference/services/llm/base_llm_service.py
138
126
  isa_model/inference/services/llm/cerebras_llm_service.py
139
127
  isa_model/inference/services/llm/huggingface_llm_service.py
140
- isa_model/inference/services/llm/local_llm_service.py
141
128
  isa_model/inference/services/llm/ollama_llm_service.py
142
129
  isa_model/inference/services/llm/openai_llm_service.py
143
130
  isa_model/inference/services/llm/yyds_llm_service.py
@@ -148,7 +135,6 @@ isa_model/inference/services/ml/base_ml_service.py
148
135
  isa_model/inference/services/ml/sklearn_ml_service.py
149
136
  isa_model/inference/services/vision/__init__.py
150
137
  isa_model/inference/services/vision/base_vision_service.py
151
- isa_model/inference/services/vision/blip_vision_service.py
152
138
  isa_model/inference/services/vision/isa_vision_service.py
153
139
  isa_model/inference/services/vision/openai_vision_service.py
154
140
  isa_model/inference/services/vision/replicate_vision_service.py
@@ -83,6 +83,12 @@ isa-model[cloud,k8s,monitoring,storage]
83
83
  isa-model[cloud,langchain,monitoring,storage]
84
84
  python-consul>=1.1.0
85
85
 
86
+ [staging-minimal]
87
+ isa-model[cloud,langchain,storage]
88
+ influxdb-client>=1.36.0
89
+ python-logging-loki>=0.3.1
90
+ python-consul>=1.1.0
91
+
86
92
  [storage]
87
93
  boto3>=1.26.0
88
94
  google-cloud-storage>=2.7.0
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
4
4
 
5
5
  [project]
6
6
  name = "isa_model"
7
- version = "0.4.3"
7
+ version = "0.4.5"
8
8
  description = "Unified AI model serving framework"
9
9
  authors = [{name = "isA_Model Contributors"}]
10
10
  readme = "README.md"
@@ -152,6 +152,14 @@ staging = [
152
152
  "python-consul>=1.1.0", # Service discovery
153
153
  ]
154
154
 
155
+ # Ultra-lightweight staging (no MLflow monitoring)
156
+ staging-minimal = [
157
+ "isa-model[cloud,storage,langchain]",
158
+ "influxdb-client>=1.36.0", # Basic logging only
159
+ "python-logging-loki>=0.3.1", # Centralized logging
160
+ "python-consul>=1.1.0", # Service discovery
161
+ ]
162
+
155
163
  all = [
156
164
  "isa-model[cloud,local,training,audio,vision,langchain,storage,monitoring,k8s,gpu-cloud]",
157
165
  ]