sie-server 0.6.0__tar.gz → 0.6.2__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (439)
  1. {sie_server-0.6.0 → sie_server-0.6.2}/Dockerfile.cuda12 +2 -0
  2. {sie_server-0.6.0 → sie_server-0.6.2}/PKG-INFO +1 -1
  3. sie_server-0.6.2/models/Snowflake__snowflake-arctic-embed-l-v2.0.yaml +28 -0
  4. sie_server-0.6.2/models/mixedbread-ai__mxbai-embed-large-v1.yaml +28 -0
  5. sie_server-0.6.2/models/nomic-ai__modernbert-embed-base.yaml +28 -0
  6. {sie_server-0.6.0 → sie_server-0.6.2}/openapi.json +1 -1
  7. {sie_server-0.6.0 → sie_server-0.6.2}/pyproject.toml +1 -1
  8. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/qwen3_vl_embedding/__init__.py +16 -4
  9. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/cli.py +17 -2
  10. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/logging.py +18 -4
  11. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/main.py +9 -1
  12. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_loader.py +14 -0
  13. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_logging.py +33 -0
  14. {sie_server-0.6.0 → sie_server-0.6.2}/.gitignore +0 -0
  15. {sie_server-0.6.0 → sie_server-0.6.2}/CONTRIBUTING.md +0 -0
  16. {sie_server-0.6.0 → sie_server-0.6.2}/Dockerfile.cpu +0 -0
  17. {sie_server-0.6.0 → sie_server-0.6.2}/LICENSE +0 -0
  18. {sie_server-0.6.0 → sie_server-0.6.2}/README.md +0 -0
  19. {sie_server-0.6.0 → sie_server-0.6.2}/bundles/default.yaml +0 -0
  20. {sie_server-0.6.0 → sie_server-0.6.2}/bundles/sglang-embedding.yaml +0 -0
  21. {sie_server-0.6.0 → sie_server-0.6.2}/bundles/sglang.yaml +0 -0
  22. {sie_server-0.6.0 → sie_server-0.6.2}/bundles/transformers5.yaml +0 -0
  23. {sie_server-0.6.0 → sie_server-0.6.2}/models/Alibaba-NLP__gte-Qwen2-1.5B-instruct.yaml +0 -0
  24. {sie_server-0.6.0 → sie_server-0.6.2}/models/Alibaba-NLP__gte-Qwen2-7B-instruct.yaml +0 -0
  25. {sie_server-0.6.0 → sie_server-0.6.2}/models/Alibaba-NLP__gte-modernbert-base.yaml +0 -0
  26. {sie_server-0.6.0 → sie_server-0.6.2}/models/Alibaba-NLP__gte-multilingual-base.yaml +0 -0
  27. {sie_server-0.6.0 → sie_server-0.6.2}/models/Alibaba-NLP__gte-reranker-modernbert-base.yaml +0 -0
  28. {sie_server-0.6.0 → sie_server-0.6.2}/models/BAAI__bge-m3.yaml +0 -0
  29. {sie_server-0.6.0 → sie_server-0.6.2}/models/BAAI__bge-reranker-base.yaml +0 -0
  30. {sie_server-0.6.0 → sie_server-0.6.2}/models/BAAI__bge-reranker-large.yaml +0 -0
  31. {sie_server-0.6.0 → sie_server-0.6.2}/models/BAAI__bge-reranker-v2-m3.yaml +0 -0
  32. {sie_server-0.6.0 → sie_server-0.6.2}/models/EmergentMethods__gliner_large_news-v2.1.yaml +0 -0
  33. {sie_server-0.6.0 → sie_server-0.6.2}/models/GritLM__GritLM-7B.yaml +0 -0
  34. {sie_server-0.6.0 → sie_server-0.6.2}/models/IDEA-Research__grounding-dino-base.yaml +0 -0
  35. {sie_server-0.6.0 → sie_server-0.6.2}/models/IDEA-Research__grounding-dino-tiny.yaml +0 -0
  36. {sie_server-0.6.0 → sie_server-0.6.2}/models/Ihor__gliner-biomed-large-v1.0.yaml +0 -0
  37. {sie_server-0.6.0 → sie_server-0.6.2}/models/Linq-AI-Research__Linq-Embed-Mistral.yaml +0 -0
  38. {sie_server-0.6.0 → sie_server-0.6.2}/models/Marqo__marqo-ecommerce-embeddings-B.yaml +0 -0
  39. {sie_server-0.6.0 → sie_server-0.6.2}/models/Marqo__marqo-fashionSigLIP.yaml +0 -0
  40. {sie_server-0.6.0 → sie_server-0.6.2}/models/MoritzLaurer__deberta-v3-base-zeroshot-v2.0.yaml +0 -0
  41. {sie_server-0.6.0 → sie_server-0.6.2}/models/MoritzLaurer__deberta-v3-large-zeroshot-v2.0.yaml +0 -0
  42. {sie_server-0.6.0 → sie_server-0.6.2}/models/NeuML__gliner-bert-tiny.yaml +0 -0
  43. {sie_server-0.6.0 → sie_server-0.6.2}/models/NovaSearch__stella_en_1.5B_v5.yaml +0 -0
  44. {sie_server-0.6.0 → sie_server-0.6.2}/models/NovaSearch__stella_en_400M_v5.yaml +0 -0
  45. {sie_server-0.6.0 → sie_server-0.6.2}/models/PaddlePaddle__PaddleOCR-VL-1.5.yaml +0 -0
  46. {sie_server-0.6.0 → sie_server-0.6.2}/models/Qwen__Qwen3-0.6B.yaml +0 -0
  47. {sie_server-0.6.0 → sie_server-0.6.2}/models/Qwen__Qwen3-4B-Instruct-2507.yaml +0 -0
  48. {sie_server-0.6.0 → sie_server-0.6.2}/models/Qwen__Qwen3-Embedding-0.6B.yaml +0 -0
  49. {sie_server-0.6.0 → sie_server-0.6.2}/models/Qwen__Qwen3-Embedding-4B.yaml +0 -0
  50. {sie_server-0.6.0 → sie_server-0.6.2}/models/Qwen__Qwen3-Reranker-0.6B.yaml +0 -0
  51. {sie_server-0.6.0 → sie_server-0.6.2}/models/Qwen__Qwen3-Reranker-4B.yaml +0 -0
  52. {sie_server-0.6.0 → sie_server-0.6.2}/models/Qwen__Qwen3-VL-Embedding-2B.yaml +0 -0
  53. {sie_server-0.6.0 → sie_server-0.6.2}/models/Qwen__Qwen3-VL-Reranker-2B.yaml +0 -0
  54. {sie_server-0.6.0 → sie_server-0.6.2}/models/Qwen__Qwen3.5-4B.yaml +0 -0
  55. {sie_server-0.6.0 → sie_server-0.6.2}/models/Qwen__Qwen3.6-27B.yaml +0 -0
  56. {sie_server-0.6.0 → sie_server-0.6.2}/models/Salesforce__SFR-Embedding-2_R.yaml +0 -0
  57. {sie_server-0.6.0 → sie_server-0.6.2}/models/Salesforce__SFR-Embedding-Mistral.yaml +0 -0
  58. {sie_server-0.6.0 → sie_server-0.6.2}/models/Snowflake__snowflake-arctic-embed-m-v2.0.yaml +0 -0
  59. {sie_server-0.6.0 → sie_server-0.6.2}/models/TomoroAI__tomoro-colqwen3-embed-4b.yaml +0 -0
  60. {sie_server-0.6.0 → sie_server-0.6.2}/models/answerdotai__ModernBERT-base.yaml +0 -0
  61. {sie_server-0.6.0 → sie_server-0.6.2}/models/answerdotai__answerai-colbert-small-v1.yaml +0 -0
  62. {sie_server-0.6.0 → sie_server-0.6.2}/models/colbert-ir__colbertv2.0.yaml +0 -0
  63. {sie_server-0.6.0 → sie_server-0.6.2}/models/cross-encoder__ms-marco-MiniLM-L-12-v2.yaml +0 -0
  64. {sie_server-0.6.0 → sie_server-0.6.2}/models/cross-encoder__ms-marco-MiniLM-L-6-v2.yaml +0 -0
  65. {sie_server-0.6.0 → sie_server-0.6.2}/models/cross-encoder__nli-deberta-v3-base.yaml +0 -0
  66. {sie_server-0.6.0 → sie_server-0.6.2}/models/defog__sqlcoder-7b-2.yaml +0 -0
  67. {sie_server-0.6.0 → sie_server-0.6.2}/models/docling.yaml +0 -0
  68. {sie_server-0.6.0 → sie_server-0.6.2}/models/fastino__gliner2-base-v1.yaml +0 -0
  69. {sie_server-0.6.0 → sie_server-0.6.2}/models/gliner-community__gliner_large-v2.5.yaml +0 -0
  70. {sie_server-0.6.0 → sie_server-0.6.2}/models/gliner-community__gliner_medium-v2.5.yaml +0 -0
  71. {sie_server-0.6.0 → sie_server-0.6.2}/models/gliner-community__gliner_small-v2.5.yaml +0 -0
  72. {sie_server-0.6.0 → sie_server-0.6.2}/models/google__embeddinggemma-300m.yaml +0 -0
  73. {sie_server-0.6.0 → sie_server-0.6.2}/models/google__owlv2-base-patch16-ensemble.yaml +0 -0
  74. {sie_server-0.6.0 → sie_server-0.6.2}/models/google__siglip-so400m-patch14-224.yaml +0 -0
  75. {sie_server-0.6.0 → sie_server-0.6.2}/models/google__siglip-so400m-patch14-384.yaml +0 -0
  76. {sie_server-0.6.0 → sie_server-0.6.2}/models/google__siglip2-base-patch16-224.yaml +0 -0
  77. {sie_server-0.6.0 → sie_server-0.6.2}/models/ibm-granite__granite-embedding-30m-sparse.yaml +0 -0
  78. {sie_server-0.6.0 → sie_server-0.6.2}/models/ibm-granite__granite-embedding-english-r2.yaml +0 -0
  79. {sie_server-0.6.0 → sie_server-0.6.2}/models/ibm-granite__granite-embedding-small-english-r2.yaml +0 -0
  80. {sie_server-0.6.0 → sie_server-0.6.2}/models/ibm-granite__granite-guardian-3.0-2b.yaml +0 -0
  81. {sie_server-0.6.0 → sie_server-0.6.2}/models/intfloat__e5-base-v2.yaml +0 -0
  82. {sie_server-0.6.0 → sie_server-0.6.2}/models/intfloat__e5-large-v2.yaml +0 -0
  83. {sie_server-0.6.0 → sie_server-0.6.2}/models/intfloat__e5-mistral-7b-instruct.yaml +0 -0
  84. {sie_server-0.6.0 → sie_server-0.6.2}/models/intfloat__e5-small-v2.yaml +0 -0
  85. {sie_server-0.6.0 → sie_server-0.6.2}/models/intfloat__multilingual-e5-large-instruct.yaml +0 -0
  86. {sie_server-0.6.0 → sie_server-0.6.2}/models/intfloat__multilingual-e5-large.yaml +0 -0
  87. {sie_server-0.6.0 → sie_server-0.6.2}/models/jackboyla__glirel-large-v0.yaml +0 -0
  88. {sie_server-0.6.0 → sie_server-0.6.2}/models/jinaai__jina-colbert-v2.yaml +0 -0
  89. {sie_server-0.6.0 → sie_server-0.6.2}/models/jinaai__jina-reranker-v2-base-multilingual.yaml +0 -0
  90. {sie_server-0.6.0 → sie_server-0.6.2}/models/knowledgator__gliclass-base-v1.0.yaml +0 -0
  91. {sie_server-0.6.0 → sie_server-0.6.2}/models/knowledgator__gliclass-large-v1.0.yaml +0 -0
  92. {sie_server-0.6.0 → sie_server-0.6.2}/models/knowledgator__gliclass-large-v3.0.yaml +0 -0
  93. {sie_server-0.6.0 → sie_server-0.6.2}/models/knowledgator__gliclass-small-v1.0.yaml +0 -0
  94. {sie_server-0.6.0 → sie_server-0.6.2}/models/knowledgator__gliner-bi-base-v2.0.yaml +0 -0
  95. {sie_server-0.6.0 → sie_server-0.6.2}/models/knowledgator__modern-gliner-bi-base-v1.0.yaml +0 -0
  96. {sie_server-0.6.0 → sie_server-0.6.2}/models/laion__CLIP-ViT-B-32-laion2B-s34B-b79K.yaml +0 -0
  97. {sie_server-0.6.0 → sie_server-0.6.2}/models/laion__CLIP-ViT-H-14-laion2B-s32B-b79K.yaml +0 -0
  98. {sie_server-0.6.0 → sie_server-0.6.2}/models/lightonai__GTE-ModernColBERT-v1.yaml +0 -0
  99. {sie_server-0.6.0 → sie_server-0.6.2}/models/lightonai__LightOnOCR-2-1B.yaml +0 -0
  100. {sie_server-0.6.0 → sie_server-0.6.2}/models/lightonai__Reason-ModernColBERT.yaml +0 -0
  101. {sie_server-0.6.0 → sie_server-0.6.2}/models/microsoft__Florence-2-base-ft.yaml +0 -0
  102. {sie_server-0.6.0 → sie_server-0.6.2}/models/microsoft__Florence-2-base.yaml +0 -0
  103. {sie_server-0.6.0 → sie_server-0.6.2}/models/microsoft__Florence-2-large.yaml +0 -0
  104. {sie_server-0.6.0 → sie_server-0.6.2}/models/mixedbread-ai__mxbai-colbert-large-v1.yaml +0 -0
  105. {sie_server-0.6.0 → sie_server-0.6.2}/models/mixedbread-ai__mxbai-edge-colbert-v0-32m.yaml +0 -0
  106. {sie_server-0.6.0 → sie_server-0.6.2}/models/mixedbread-ai__mxbai-rerank-base-v2.yaml +0 -0
  107. {sie_server-0.6.0 → sie_server-0.6.2}/models/mixedbread-ai__mxbai-rerank-large-v2.yaml +0 -0
  108. {sie_server-0.6.0 → sie_server-0.6.2}/models/mynkchaudhry__Florence-2-FT-DocVQA.yaml +0 -0
  109. {sie_server-0.6.0 → sie_server-0.6.2}/models/naver-clova-ix__donut-base-finetuned-cord-v2.yaml +0 -0
  110. {sie_server-0.6.0 → sie_server-0.6.2}/models/naver-clova-ix__donut-base-finetuned-docvqa.yaml +0 -0
  111. {sie_server-0.6.0 → sie_server-0.6.2}/models/naver-clova-ix__donut-base-finetuned-rvlcdip.yaml +0 -0
  112. {sie_server-0.6.0 → sie_server-0.6.2}/models/naver__splade-cocondenser-selfdistil.yaml +0 -0
  113. {sie_server-0.6.0 → sie_server-0.6.2}/models/naver__splade-v3.yaml +0 -0
  114. {sie_server-0.6.0 → sie_server-0.6.2}/models/nomic-ai__nomic-embed-text-v2-moe.yaml +0 -0
  115. {sie_server-0.6.0 → sie_server-0.6.2}/models/numind__NuNER_Zero-span.yaml +0 -0
  116. {sie_server-0.6.0 → sie_server-0.6.2}/models/numind__NuNER_Zero.yaml +0 -0
  117. {sie_server-0.6.0 → sie_server-0.6.2}/models/nvidia__NV-Embed-v2.yaml +0 -0
  118. {sie_server-0.6.0 → sie_server-0.6.2}/models/nvidia__llama-embed-nemotron-8b.yaml +0 -0
  119. {sie_server-0.6.0 → sie_server-0.6.2}/models/nvidia__llama-nemoretriever-colembed-3b-v1.yaml +0 -0
  120. {sie_server-0.6.0 → sie_server-0.6.2}/models/nvidia__nemotron-colembed-vl-4b-v2.yaml +0 -0
  121. {sie_server-0.6.0 → sie_server-0.6.2}/models/openai__clip-vit-base-patch32.yaml +0 -0
  122. {sie_server-0.6.0 → sie_server-0.6.2}/models/openai__clip-vit-large-patch14.yaml +0 -0
  123. {sie_server-0.6.0 → sie_server-0.6.2}/models/opendatalab__MinerU2.5-Pro-2604-1.2B.yaml +0 -0
  124. {sie_server-0.6.0 → sie_server-0.6.2}/models/opensearch-project__opensearch-neural-sparse-encoding-doc-v2-distill.yaml +0 -0
  125. {sie_server-0.6.0 → sie_server-0.6.2}/models/opensearch-project__opensearch-neural-sparse-encoding-doc-v2-mini.yaml +0 -0
  126. {sie_server-0.6.0 → sie_server-0.6.2}/models/opensearch-project__opensearch-neural-sparse-encoding-doc-v3-distill.yaml +0 -0
  127. {sie_server-0.6.0 → sie_server-0.6.2}/models/opensearch-project__opensearch-neural-sparse-encoding-doc-v3-gte.yaml +0 -0
  128. {sie_server-0.6.0 → sie_server-0.6.2}/models/opensearch-project__opensearch-neural-sparse-encoding-v1.yaml +0 -0
  129. {sie_server-0.6.0 → sie_server-0.6.2}/models/opensearch-project__opensearch-neural-sparse-encoding-v2-distill.yaml +0 -0
  130. {sie_server-0.6.0 → sie_server-0.6.2}/models/prithivida__Splade_PP_en_v2.yaml +0 -0
  131. {sie_server-0.6.0 → sie_server-0.6.2}/models/rasyosef__splade-mini.yaml +0 -0
  132. {sie_server-0.6.0 → sie_server-0.6.2}/models/sentence-transformers__all-MiniLM-L6-v2.yaml +0 -0
  133. {sie_server-0.6.0 → sie_server-0.6.2}/models/sugiv__stablebridge-pruner-highlighter.yaml +0 -0
  134. {sie_server-0.6.0 → sie_server-0.6.2}/models/urchade__gliner_large-v2.1.yaml +0 -0
  135. {sie_server-0.6.0 → sie_server-0.6.2}/models/urchade__gliner_medium-v2.1.yaml +0 -0
  136. {sie_server-0.6.0 → sie_server-0.6.2}/models/urchade__gliner_multi-v2.1.yaml +0 -0
  137. {sie_server-0.6.0 → sie_server-0.6.2}/models/urchade__gliner_multi_pii-v1.yaml +0 -0
  138. {sie_server-0.6.0 → sie_server-0.6.2}/models/urchade__gliner_small-v2.1.yaml +0 -0
  139. {sie_server-0.6.0 → sie_server-0.6.2}/models/vidore__colpali-v1.3-hf.yaml +0 -0
  140. {sie_server-0.6.0 → sie_server-0.6.2}/models/vidore__colqwen2.5-v0.2.yaml +0 -0
  141. {sie_server-0.6.0 → sie_server-0.6.2}/models/zai-org__GLM-OCR.yaml +0 -0
  142. {sie_server-0.6.0 → sie_server-0.6.2}/scripts/generate_tokenize_fixture.py +0 -0
  143. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/__init__.py +0 -0
  144. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/_ipc_test_harness.py +0 -0
  145. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapter_call_loop.py +0 -0
  146. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/__init__.py +0 -0
  147. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/_base_adapter.py +0 -0
  148. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/_flash_base.py +0 -0
  149. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/_generation_base.py +0 -0
  150. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/_spec.py +0 -0
  151. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/_types.py +0 -0
  152. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/_utils.py +0 -0
  153. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/base.py +0 -0
  154. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/bert_flash/__init__.py +0 -0
  155. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/bert_flash_cross_encoder/__init__.py +0 -0
  156. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/bge_m3/__init__.py +0 -0
  157. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/bge_m3_flag/__init__.py +0 -0
  158. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/bge_m3_flash/__init__.py +0 -0
  159. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/bge_m3_score_mixin.py +0 -0
  160. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/clip/__init__.py +0 -0
  161. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/colbert/__init__.py +0 -0
  162. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/colbert_modernbert_flash/__init__.py +0 -0
  163. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/colbert_rotary_flash/__init__.py +0 -0
  164. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/colpali/__init__.py +0 -0
  165. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/colqwen2/__init__.py +0 -0
  166. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/colqwen3/__init__.py +0 -0
  167. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/cross_encoder/__init__.py +0 -0
  168. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/docling/__init__.py +0 -0
  169. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/donut/__init__.py +0 -0
  170. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/errors.py +0 -0
  171. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/florence2/__init__.py +0 -0
  172. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/gliclass/__init__.py +0 -0
  173. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/gliner/__init__.py +0 -0
  174. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/gliner2/__init__.py +0 -0
  175. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/gliner_bi/__init__.py +0 -0
  176. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/glirel/__init__.py +0 -0
  177. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/glm_ocr/__init__.py +0 -0
  178. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/grounding_dino/__init__.py +0 -0
  179. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/gte_sparse_flash/__init__.py +0 -0
  180. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/jina_flash_cross_encoder/__init__.py +0 -0
  181. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/lighton_ocr/__init__.py +0 -0
  182. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/mineru_vl/__init__.py +0 -0
  183. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/modernbert_flash/__init__.py +0 -0
  184. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/modernbert_flash_cross_encoder/__init__.py +0 -0
  185. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/nemo_colembed/__init__.py +0 -0
  186. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/nli_classification/__init__.py +0 -0
  187. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/nli_classification_flash/__init__.py +0 -0
  188. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/nomic_flash/__init__.py +0 -0
  189. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/owlv2/__init__.py +0 -0
  190. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/paddleocr_vl/__init__.py +0 -0
  191. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/peft_lora_mixin.py +0 -0
  192. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/pytorch_embedding/__init__.py +0 -0
  193. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/qwen2_flash/__init__.py +0 -0
  194. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/qwen2_flash_cross_encoder/__init__.py +0 -0
  195. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/qwen3_vl_reranker/__init__.py +0 -0
  196. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/rope_flash/__init__.py +0 -0
  197. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/sentence_transformer/__init__.py +0 -0
  198. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/sglang/__init__.py +0 -0
  199. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/sglang/_server.py +0 -0
  200. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/sglang/embedding.py +0 -0
  201. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/sglang/generation.py +0 -0
  202. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/siglip/__init__.py +0 -0
  203. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/splade_flash/__init__.py +0 -0
  204. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/stablebridge_pruner/__init__.py +0 -0
  205. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/adapters/xlm_roberta_flash/__init__.py +0 -0
  206. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/api/__init__.py +0 -0
  207. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/api/encode.py +0 -0
  208. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/api/extract.py +0 -0
  209. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/api/generate.py +0 -0
  210. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/api/health.py +0 -0
  211. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/api/helpers.py +0 -0
  212. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/api/metrics.py +0 -0
  213. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/api/models.py +0 -0
  214. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/api/openai_compat.py +0 -0
  215. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/api/openapi.py +0 -0
  216. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/api/options.py +0 -0
  217. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/api/root.py +0 -0
  218. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/api/score.py +0 -0
  219. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/api/serialization.py +0 -0
  220. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/api/validation.py +0 -0
  221. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/api/ws.py +0 -0
  222. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/app/__init__.py +0 -0
  223. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/app/app_factory.py +0 -0
  224. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/app/app_state_config.py +0 -0
  225. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/config/__init__.py +0 -0
  226. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/config/engine.py +0 -0
  227. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/config/model.py +0 -0
  228. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/__init__.py +0 -0
  229. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/adaptive_batching.py +0 -0
  230. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/batcher.py +0 -0
  231. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/deps.py +0 -0
  232. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/disk_cache.py +0 -0
  233. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/encode_pipeline.py +0 -0
  234. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/extract_cost.py +0 -0
  235. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/gpu_health.py +0 -0
  236. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/hf_env.py +0 -0
  237. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/hot_reload.py +0 -0
  238. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/inference.py +0 -0
  239. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/inference_output.py +0 -0
  240. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/load_errors.py +0 -0
  241. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/loader.py +0 -0
  242. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/memory.py +0 -0
  243. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/model_loader.py +0 -0
  244. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/oom.py +0 -0
  245. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/pool_isolation.py +0 -0
  246. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/postprocessor.py +0 -0
  247. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/postprocessor_registry.py +0 -0
  248. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/prepared.py +0 -0
  249. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/preprocessor/__init__.py +0 -0
  250. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/preprocessor/base.py +0 -0
  251. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/preprocessor/image.py +0 -0
  252. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/preprocessor/text.py +0 -0
  253. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/preprocessor/vision.py +0 -0
  254. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/preprocessor_registry.py +0 -0
  255. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/readiness.py +0 -0
  256. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/registry.py +0 -0
  257. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/shutdown.py +0 -0
  258. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/text_tokens.py +0 -0
  259. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/timing.py +0 -0
  260. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/tokenizer.py +0 -0
  261. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/watcher.py +0 -0
  262. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/worker/__init__.py +0 -0
  263. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/worker/handlers/__init__.py +0 -0
  264. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/worker/handlers/base.py +0 -0
  265. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/worker/handlers/encode.py +0 -0
  266. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/worker/handlers/extract.py +0 -0
  267. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/worker/handlers/score.py +0 -0
  268. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/worker/model_worker.py +0 -0
  269. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/worker/oom_recovery.py +0 -0
  270. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/core/worker/types.py +0 -0
  271. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/health/__init__.py +0 -0
  272. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/health/nats_publisher.py +0 -0
  273. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/health/saturation.py +0 -0
  274. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/ipc_server.py +0 -0
  275. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/ipc_types.py +0 -0
  276. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/observability/__init__.py +0 -0
  277. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/observability/gpu.py +0 -0
  278. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/observability/metrics.py +0 -0
  279. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/observability/prometheus.py +0 -0
  280. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/observability/telemetry.py +0 -0
  281. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/observability/tracing.py +0 -0
  282. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/processors/__init__.py +0 -0
  283. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/processors/admission.py +0 -0
  284. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/processors/base.py +0 -0
  285. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/processors/grammar_cache.py +0 -0
  286. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/processors/grammar_compile.py +0 -0
  287. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/processors/streaming.py +0 -0
  288. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/processors/tool_call_grammar.py +0 -0
  289. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/processors/tool_call_parser.py +0 -0
  290. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/processors/work_class_scheduler.py +0 -0
  291. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/queue_executor.py +0 -0
  292. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/static/__init__.py +0 -0
  293. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/static/index.html +0 -0
  294. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/types/__init__.py +0 -0
  295. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/types/grammar.py +0 -0
  296. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/types/inputs.py +0 -0
  297. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/types/openapi.py +0 -0
  298. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/types/outputs.py +0 -0
  299. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/types/overflow_policy.py +0 -0
  300. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/types/requests.py +0 -0
  301. {sie_server-0.6.0 → sie_server-0.6.2}/src/sie_server/types/responses.py +0 -0
  302. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/__init__.py +0 -0
  303. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_base.py +0 -0
  304. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_bge_m3.py +0 -0
  305. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_bge_m3_flash.py +0 -0
  306. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_clip.py +0 -0
  307. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_colbert.py +0 -0
  308. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_docling.py +0 -0
  309. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_docling_smoke.py +0 -0
  310. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_donut.py +0 -0
  311. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_factory_integration.py +0 -0
  312. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_flash_base.py +0 -0
  313. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_florence2.py +0 -0
  314. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_gliclass_overflow_policy.py +0 -0
  315. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_glirel.py +0 -0
  316. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_glm_ocr.py +0 -0
  317. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_grounding_dino.py +0 -0
  318. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_gte_sparse.py +0 -0
  319. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_jina_flash_cross_encoder.py +0 -0
  320. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_lighton_ocr.py +0 -0
  321. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_lora.py +0 -0
  322. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_lora_integration.py +0 -0
  323. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_mineru_vl.py +0 -0
  324. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_paddleocr_vl.py +0 -0
  325. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_pytorch_embedding_revision.py +0 -0
  326. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_runtime_options.py +0 -0
  327. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_sentence_transformer.py +0 -0
  328. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_sglang.py +0 -0
  329. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_sglang_generation.py +0 -0
  330. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_siglip.py +0 -0
  331. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_sparse_aggregation.py +0 -0
  332. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_stablebridge_integration.py +0 -0
  333. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_stablebridge_pruner.py +0 -0
  334. {sie_server-0.6.0 → sie_server-0.6.2}/tests/adapters/test_visual_document.py +0 -0
  335. {sie_server-0.6.0 → sie_server-0.6.2}/tests/api/__init__.py +0 -0
  336. {sie_server-0.6.0 → sie_server-0.6.2}/tests/api/test_encode_dtype.py +0 -0
  337. {sie_server-0.6.0 → sie_server-0.6.2}/tests/api/test_encode_endpoint.py +0 -0
  338. {sie_server-0.6.0 → sie_server-0.6.2}/tests/api/test_encode_json_schema.py +0 -0
  339. {sie_server-0.6.0 → sie_server-0.6.2}/tests/api/test_encode_timing.py +0 -0
  340. {sie_server-0.6.0 → sie_server-0.6.2}/tests/api/test_encode_validation.py +0 -0
  341. {sie_server-0.6.0 → sie_server-0.6.2}/tests/api/test_extract.py +0 -0
  342. {sie_server-0.6.0 → sie_server-0.6.2}/tests/api/test_extract_integration.py +0 -0
  343. {sie_server-0.6.0 → sie_server-0.6.2}/tests/api/test_extract_oom.py +0 -0
  344. {sie_server-0.6.0 → sie_server-0.6.2}/tests/api/test_generate.py +0 -0
  345. {sie_server-0.6.0 → sie_server-0.6.2}/tests/api/test_health.py +0 -0
  346. {sie_server-0.6.0 → sie_server-0.6.2}/tests/api/test_models.py +0 -0
  347. {sie_server-0.6.0 → sie_server-0.6.2}/tests/api/test_openai_compat.py +0 -0
  348. {sie_server-0.6.0 → sie_server-0.6.2}/tests/api/test_score.py +0 -0
  349. {sie_server-0.6.0 → sie_server-0.6.2}/tests/api/test_version_header.py +0 -0
  350. {sie_server-0.6.0 → sie_server-0.6.2}/tests/api/test_ws.py +0 -0
  351. {sie_server-0.6.0 → sie_server-0.6.2}/tests/app/__init__.py +0 -0
  352. {sie_server-0.6.0 → sie_server-0.6.2}/tests/app/test_app_factory.py +0 -0
  353. {sie_server-0.6.0 → sie_server-0.6.2}/tests/config/__init__.py +0 -0
  354. {sie_server-0.6.0 → sie_server-0.6.2}/tests/config/test_bundle_coverage.py +0 -0
  355. {sie_server-0.6.0 → sie_server-0.6.2}/tests/config/test_config.py +0 -0
  356. {sie_server-0.6.0 → sie_server-0.6.2}/tests/config/test_model_prewarm_grammars.py +0 -0
  357. {sie_server-0.6.0 → sie_server-0.6.2}/tests/config/test_profile_backend_consistency.py +0 -0
  358. {sie_server-0.6.0 → sie_server-0.6.2}/tests/conftest.py +0 -0
  359. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/__init__.py +0 -0
  360. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_adaptive_batching.py +0 -0
  361. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_batcher.py +0 -0
  362. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_disk_cache.py +0 -0
  363. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_gpu_health.py +0 -0
  364. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_hot_reload.py +0 -0
  365. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_idle_evict.py +0 -0
  366. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_inference.py +0 -0
  367. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_lora_generation_exclusion.py +0 -0
  368. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_memory.py +0 -0
  369. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_model_load_timeout.py +0 -0
  370. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_oom_detection.py +0 -0
  371. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_pool_isolation.py +0 -0
  372. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_postprocessor.py +0 -0
  373. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_postprocessor_registry.py +0 -0
  374. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_prepared.py +0 -0
  375. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_preprocessor.py +0 -0
  376. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_preprocessor_registry.py +0 -0
  377. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_quantization.py +0 -0
  378. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_readiness.py +0 -0
  379. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_registry_async.py +0 -0
  380. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_registry_core.py +0 -0
  381. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_registry_deps.py +0 -0
  382. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_registry_failed_state.py +0 -0
  383. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_registry_memory.py +0 -0
  384. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_registry_multi_model.py +0 -0
  385. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_shutdown.py +0 -0
  386. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_timing.py +0 -0
  387. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_watcher.py +0 -0
  388. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_worker_backpressure.py +0 -0
  389. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_worker_core.py +0 -0
  390. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_worker_extract.py +0 -0
  391. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_worker_lora.py +0 -0
  392. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_worker_options.py +0 -0
  393. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_worker_passthrough.py +0 -0
  394. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/test_worker_score.py +0 -0
  395. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/worker/__init__.py +0 -0
  396. {sie_server-0.6.0 → sie_server-0.6.2}/tests/core/worker/test_oom_recovery.py +0 -0
  397. {sie_server-0.6.0 → sie_server-0.6.2}/tests/health/__init__.py +0 -0
  398. {sie_server-0.6.0 → sie_server-0.6.2}/tests/health/test_nats_publisher.py +0 -0
  399. {sie_server-0.6.0 → sie_server-0.6.2}/tests/health/test_saturation.py +0 -0
  400. {sie_server-0.6.0 → sie_server-0.6.2}/tests/health/test_worker_id_consistency.py +0 -0
  401. {sie_server-0.6.0 → sie_server-0.6.2}/tests/integration/__init__.py +0 -0
  402. {sie_server-0.6.0 → sie_server-0.6.2}/tests/integration/test_chat_completions.py +0 -0
  403. {sie_server-0.6.0 → sie_server-0.6.2}/tests/integration/test_grammar_generate.py +0 -0
  404. {sie_server-0.6.0 → sie_server-0.6.2}/tests/observability/__init__.py +0 -0
  405. {sie_server-0.6.0 → sie_server-0.6.2}/tests/observability/test_generation_metrics.py +0 -0
  406. {sie_server-0.6.0 → sie_server-0.6.2}/tests/observability/test_metrics.py +0 -0
  407. {sie_server-0.6.0 → sie_server-0.6.2}/tests/observability/test_telemetry.py +0 -0
  408. {sie_server-0.6.0 → sie_server-0.6.2}/tests/observability/test_trace_propagation.py +0 -0
  409. {sie_server-0.6.0 → sie_server-0.6.2}/tests/observability/test_tracing.py +0 -0
  410. {sie_server-0.6.0 → sie_server-0.6.2}/tests/processors/__init__.py +0 -0
  411. {sie_server-0.6.0 → sie_server-0.6.2}/tests/processors/test_grammar_cache.py +0 -0
  412. {sie_server-0.6.0 → sie_server-0.6.2}/tests/processors/test_grammar_compile.py +0 -0
  413. {sie_server-0.6.0 → sie_server-0.6.2}/tests/processors/test_grammar_prewarm.py +0 -0
  414. {sie_server-0.6.0 → sie_server-0.6.2}/tests/processors/test_streaming.py +0 -0
  415. {sie_server-0.6.0 → sie_server-0.6.2}/tests/processors/test_streaming_admission.py +0 -0
  416. {sie_server-0.6.0 → sie_server-0.6.2}/tests/processors/test_streaming_integration.py +0 -0
  417. {sie_server-0.6.0 → sie_server-0.6.2}/tests/processors/test_tool_call_grammar.py +0 -0
  418. {sie_server-0.6.0 → sie_server-0.6.2}/tests/processors/test_tool_call_parser.py +0 -0
  419. {sie_server-0.6.0 → sie_server-0.6.2}/tests/processors/test_work_class_scheduler.py +0 -0
  420. {sie_server-0.6.0 → sie_server-0.6.2}/tests/test_adapter_call_loop.py +0 -0
  421. {sie_server-0.6.0 → sie_server-0.6.2}/tests/test_all_models.py +0 -0
  422. {sie_server-0.6.0 → sie_server-0.6.2}/tests/test_docker_integration.py +0 -0
  423. {sie_server-0.6.0 → sie_server-0.6.2}/tests/test_ipc_server.py +0 -0
  424. {sie_server-0.6.0 → sie_server-0.6.2}/tests/test_ipc_types_raw_output.py +0 -0
  425. {sie_server-0.6.0 → sie_server-0.6.2}/tests/test_model_yaml_filenames.py +0 -0
  426. {sie_server-0.6.0 → sie_server-0.6.2}/tests/test_openapi_export.py +0 -0
  427. {sie_server-0.6.0 → sie_server-0.6.2}/tests/test_parity_run_batch.py +0 -0
  428. {sie_server-0.6.0 → sie_server-0.6.2}/tests/test_queue_executor.py +0 -0
  429. {sie_server-0.6.0 → sie_server-0.6.2}/tests/test_queue_executor_stage1d.py +0 -0
  430. {sie_server-0.6.0 → sie_server-0.6.2}/tests/test_readiness.py +0 -0
  431. {sie_server-0.6.0 → sie_server-0.6.2}/tests/test_sdk_integration.py +0 -0
  432. {sie_server-0.6.0 → sie_server-0.6.2}/tests/test_server_smoke.py +0 -0
  433. {sie_server-0.6.0 → sie_server-0.6.2}/tests/test_sparse_integration.py +0 -0
  434. {sie_server-0.6.0 → sie_server-0.6.2}/tests/test_stage1d_byte_identity.py +0 -0
  435. {sie_server-0.6.0 → sie_server-0.6.2}/tests/type_defs/__init__.py +0 -0
  436. {sie_server-0.6.0 → sie_server-0.6.2}/tests/type_defs/test_inputs.py +0 -0
  437. {sie_server-0.6.0 → sie_server-0.6.2}/tests/type_defs/test_inputs_json_decode.py +0 -0
  438. {sie_server-0.6.0 → sie_server-0.6.2}/tests/type_defs/test_media_bytes.py +0 -0
  439. {sie_server-0.6.0 → sie_server-0.6.2}/tests/type_defs/test_types.py +0 -0
@@ -200,6 +200,7 @@ ENV DEBIAN_FRONTEND=noninteractive
200
200
  # opencv-python wheel unconditionally dlopens an X11 + libGL + glib chain at
201
201
  # import even in headless usage. Without these, every docling extract crashes
202
202
  # with "ImportError: libxcb.so.1: cannot open shared object file" (issue #1028).
203
+ # ninja-build: flashinfer invokes ninja during first-use SGLang kernel JIT.
203
204
  RUN --mount=type=cache,target=/var/cache/apt,sharing=locked \
204
205
  --mount=type=cache,target=/var/lib/apt/lists,sharing=locked \
205
206
  apt-get update && apt-get install -y --no-install-recommends \
@@ -213,6 +214,7 @@ RUN --mount=type=cache,target=/var/cache/apt,sharing=locked \
213
214
  libnuma1 \
214
215
  libsm6 \
215
216
  libspatialindex-c6 \
217
+ ninja-build \
216
218
  libx11-6 \
217
219
  libxcb1 \
218
220
  libxext6
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: sie-server
3
- Version: 0.6.0
3
+ Version: 0.6.2
4
4
  Summary: Search Inference Engine - GPU inference server for search workloads
5
5
  License: Apache-2.0
6
6
  License-File: LICENSE
@@ -0,0 +1,28 @@
1
+ sie_id: Snowflake/snowflake-arctic-embed-l-v2.0
2
+ hf_id: Snowflake/snowflake-arctic-embed-l-v2.0
3
+ inputs:
4
+ text: true
5
+ image: false
6
+ audio: false
7
+ video: false
8
+ tasks:
9
+ encode:
10
+ dense:
11
+ dim: 1024
12
+ sparse: null
13
+ multivector: null
14
+ score: null
15
+ extract: null
16
+ max_sequence_length: 8192
17
+ profiles:
18
+ default:
19
+ max_batch_tokens: 16384
20
+ compute_precision: null
21
+ adapter_path: sie_server.adapters.xlm_roberta_flash:XLMRobertaFlashAdapter
22
+ adapter_options:
23
+ loadtime: {}
24
+ runtime:
25
+ pooling: cls
26
+ normalize: true
27
+ query_template: 'query: {text}'
28
+ doc_template: '{text}'
@@ -0,0 +1,28 @@
1
+ sie_id: mixedbread-ai/mxbai-embed-large-v1
2
+ hf_id: mixedbread-ai/mxbai-embed-large-v1
3
+ inputs:
4
+ text: true
5
+ image: false
6
+ audio: false
7
+ video: false
8
+ tasks:
9
+ encode:
10
+ dense:
11
+ dim: 1024
12
+ sparse: null
13
+ multivector: null
14
+ score: null
15
+ extract: null
16
+ max_sequence_length: 512
17
+ profiles:
18
+ default:
19
+ max_batch_tokens: 16384
20
+ compute_precision: null
21
+ adapter_path: sie_server.adapters.bert_flash:BertFlashAdapter
22
+ adapter_options:
23
+ loadtime: {}
24
+ runtime:
25
+ pooling: cls
26
+ normalize: true
27
+ query_template: 'Represent this sentence for searching relevant passages: {text}'
28
+ doc_template: '{text}'
@@ -0,0 +1,28 @@
1
+ sie_id: nomic-ai/modernbert-embed-base
2
+ hf_id: nomic-ai/modernbert-embed-base
3
+ inputs:
4
+ text: true
5
+ image: false
6
+ audio: false
7
+ video: false
8
+ tasks:
9
+ encode:
10
+ dense:
11
+ dim: 768
12
+ sparse: null
13
+ multivector: null
14
+ score: null
15
+ extract: null
16
+ max_sequence_length: 8192
17
+ profiles:
18
+ default:
19
+ max_batch_tokens: 16384
20
+ compute_precision: bfloat16
21
+ adapter_path: sie_server.adapters.modernbert_flash:ModernBERTFlashAdapter
22
+ adapter_options:
23
+ loadtime: {}
24
+ runtime:
25
+ pooling: mean
26
+ normalize: true
27
+ query_template: 'search_query: {text}'
28
+ doc_template: 'search_document: {text}'
@@ -3,7 +3,7 @@
3
3
  "info": {
4
4
  "title": "SIE Server",
5
5
  "description": "Search Inference Engine - GPU inference server for search workloads",
6
- "version": "0.6.0"
6
+ "version": "0.6.2"
7
7
  },
8
8
  "paths": {
9
9
  "/": {
@@ -1,6 +1,6 @@
1
1
  [project]
2
2
  name = "sie-server"
3
- version = "0.6.0"
3
+ version = "0.6.2"
4
4
  description = "Search Inference Engine - GPU inference server for search workloads"
5
5
  requires-python = ">=3.12,<3.13"
6
6
  license = { text = "Apache-2.0" }
@@ -98,6 +98,7 @@ class Qwen3VLEmbeddingAdapter(BaseAdapter):
98
98
  max_seq_length: int | None = None,
99
99
  pooling: str = "last",
100
100
  default_instruction: str = _DEFAULT_INSTRUCTION,
101
+ dense_dim: int | None = None,
101
102
  ) -> None:
102
103
  if pooling not in _SUPPORTED_POOLING:
103
104
  msg = f"Unsupported pooling '{pooling}', must be one of {_SUPPORTED_POOLING}"
@@ -110,11 +111,12 @@ class Qwen3VLEmbeddingAdapter(BaseAdapter):
110
111
  self._max_seq_length = max_seq_length
111
112
  self._pooling = pooling
112
113
  self._default_instruction = default_instruction
114
+ self._configured_dense_dim = dense_dim
113
115
 
114
116
  self._model: Qwen3VLForConditionalGeneration | None = None
115
117
  self._processor: AutoProcessor | None = None
116
118
  self._device: str | None = None
117
- self._dense_dim: int | None = 2048
119
+ self._dense_dim: int | None = dense_dim or 2048
118
120
 
119
121
  def load(self, device: str) -> None:
120
122
  from transformers import AutoProcessor, Qwen3VLForConditionalGeneration
@@ -162,12 +164,22 @@ class Qwen3VLEmbeddingAdapter(BaseAdapter):
162
164
  # Qwen3VLConfig stores the text model hidden size under text_config
163
165
  cfg = self._model.config
164
166
  if hasattr(cfg, "hidden_size"):
165
- self._dense_dim = cfg.hidden_size
167
+ self._dense_dim = self._validate_or_set_dense_dim(cfg.hidden_size)
166
168
  elif hasattr(cfg, "text_config") and hasattr(cfg.text_config, "hidden_size"):
167
- self._dense_dim = cfg.text_config.hidden_size
169
+ self._dense_dim = self._validate_or_set_dense_dim(cfg.text_config.hidden_size)
168
170
  else:
169
171
  logger.warning("Could not determine hidden_size from config, defaulting to 2048")
170
- self._dense_dim = 2048
172
+ self._dense_dim = self._validate_or_set_dense_dim(2048)
173
+
174
+ def _validate_or_set_dense_dim(self, observed_dim: int) -> int:
175
+ """Validate observed model width against configured dense_dim."""
176
+ if self._configured_dense_dim is not None and observed_dim != self._configured_dense_dim:
177
+ msg = (
178
+ "Qwen3-VL embedding dimension mismatch: "
179
+ f"configured dense_dim={self._configured_dense_dim}, model hidden_size={observed_dim}"
180
+ )
181
+ raise ValueError(msg)
182
+ return observed_dim
171
183
 
172
184
  def _resolve_dtype(self) -> torch.dtype:
173
185
  if not self._device or not str(self._device).startswith("cuda"):
@@ -16,6 +16,7 @@ os.environ.setdefault("HF_HUB_ETAG_TIMEOUT", "30")
16
16
  import hashlib
17
17
  import logging
18
18
  from pathlib import Path
19
+ from typing import Annotated
19
20
 
20
21
  import typer
21
22
  from sie_sdk.bundle_utils import find_bundle_for_models, match_bundle_models
@@ -230,6 +231,15 @@ def serve(
230
231
  tracing: bool = typer.Option(default=False, help="Enable OpenTelemetry tracing (exports to localhost:4317)"),
231
232
  instrumentation: bool = typer.Option(False, "--instrumentation", "-i", help="Enable batch instrumentation logging"),
232
233
  verbose: bool = typer.Option(False, "--verbose", "-v", help="Enable verbose logging"),
234
+ log_level: Annotated[
235
+ str,
236
+ typer.Option(
237
+ "--log-level",
238
+ "-l",
239
+ envvar="SIE_LOG_LEVEL",
240
+ help="Log level (DEBUG, INFO, WARNING, ERROR). Helm sets SIE_LOG_LEVEL for workers.",
241
+ ),
242
+ ] = "info",
233
243
  preload: str | None = typer.Option(None, "--preload", help="Comma-separated model names to preload at startup"),
234
244
  json_logs: bool = typer.Option(False, "--json-logs", help="Enable structured JSON logging (for Loki)"),
235
245
  ) -> None:
@@ -239,7 +249,7 @@ def serve(
239
249
  from sie_server.core.logging import configure_logging
240
250
 
241
251
  # Configure logging (supports JSON format for Loki compatibility)
242
- configure_logging(verbose=verbose, json_format=json_logs or None)
252
+ configure_logging(verbose=verbose, json_format=json_logs or None, level_name=log_level)
243
253
 
244
254
  # Handle models directory - cloud URLs pass through, local paths resolve
245
255
  if is_cloud_path(models_dir):
@@ -334,6 +344,7 @@ def serve(
334
344
  typer.echo("Start Jaeger with: mise run jaeger")
335
345
 
336
346
  typer.echo(f"Starting SIE server on {host}:{port}")
347
+
337
348
  typer.echo(f"Models directory: {models_dir_resolved}")
338
349
  typer.echo(f"Device: {resolved_device}")
339
350
  if cluster_cache:
@@ -370,7 +381,11 @@ def serve(
370
381
  preload_models=preload_models,
371
382
  )
372
383
 
373
- run_server(host=host, port=port, reload=reload, config=config)
384
+ uvicorn_log = "debug" if verbose else log_level.strip().lower()
385
+ if uvicorn_log not in ("critical", "error", "warning", "info", "debug", "trace"):
386
+ uvicorn_log = "info"
387
+
388
+ run_server(host=host, port=port, reload=reload, config=config, uvicorn_log_level=uvicorn_log)
374
389
 
375
390
 
376
391
  if __name__ == "__main__":
@@ -69,15 +69,29 @@ class TextFormatter(logging.Formatter):
69
69
  )
70
70
 
71
71
 
72
- def configure_logging(*, verbose: bool = False, json_format: bool | None = None) -> None:
72
+ def _resolve_log_level(*, verbose: bool, level_name: str | None) -> int:
73
+ """Pick root log level: ``--verbose`` wins, then explicit name, then ``SIE_LOG_LEVEL`` env."""
74
+ if verbose:
75
+ return logging.DEBUG
76
+ raw = (level_name or os.environ.get("SIE_LOG_LEVEL") or "INFO").strip()
77
+ mapping = logging.getLevelNamesMapping()
78
+ return mapping.get(raw.upper(), logging.INFO)
79
+
80
+
81
+ def configure_logging(
82
+ *,
83
+ verbose: bool = False,
84
+ json_format: bool | None = None,
85
+ level_name: str | None = None,
86
+ ) -> None:
73
87
  """Configure logging for SIE server.
74
88
 
75
89
  Args:
76
- verbose: Enable DEBUG level logging.
90
+ verbose: Enable DEBUG level logging (overrides ``level_name`` / ``SIE_LOG_LEVEL``).
77
91
  json_format: Use JSON format. If None, reads from SIE_LOG_JSON env var.
92
+ level_name: Log level name (e.g. ``DEBUG``, ``INFO``). When None, uses ``SIE_LOG_LEVEL``.
78
93
  """
79
- # Determine log level
80
- log_level = logging.DEBUG if verbose else logging.INFO
94
+ log_level = _resolve_log_level(verbose=verbose, level_name=level_name)
81
95
 
82
96
  # Determine format (env var takes precedence if json_format not explicitly set)
83
97
  if json_format is None:
@@ -28,7 +28,14 @@ def _create_app_from_env() -> FastAPI:
28
28
  return AppFactory.create_app(config)
29
29
 
30
30
 
31
- def run_server(host: str, port: int, reload: bool, config: AppStateConfig) -> None:
31
+ def run_server(
32
+ host: str,
33
+ port: int,
34
+ reload: bool,
35
+ config: AppStateConfig,
36
+ *,
37
+ uvicorn_log_level: str = "info",
38
+ ) -> None:
32
39
  config.save_to_env_vars()
33
40
  uvicorn.run(
34
41
  "sie_server.main:_create_app_from_env",
@@ -38,4 +45,5 @@ def run_server(host: str, port: int, reload: bool, config: AppStateConfig) -> No
38
45
  factory=True,
39
46
  loop="uvloop",
40
47
  timeout_keep_alive=120,
48
+ log_level=uvicorn_log_level,
41
49
  )
@@ -311,6 +311,20 @@ class TestLoadAdapter:
311
311
 
312
312
  assert type(adapter).__name__ == "BGEM3FlagAdapter"
313
313
 
314
+ def test_load_qwen3_vl_embedding_accepts_dense_dim(self, tmp_path: Path) -> None:
315
+ """Qwen3 VL embedding adapter accepts dense_dim supplied by loader."""
316
+ config = _make_config(
317
+ sie_id="Qwen/Qwen3-VL-Embedding-2B",
318
+ hf_id="Qwen/Qwen3-VL-Embedding-2B",
319
+ adapter_path="sie_server.adapters.qwen3_vl_embedding:Qwen3VLEmbeddingAdapter",
320
+ dense_dim=2048,
321
+ )
322
+
323
+ adapter = load_adapter(config, tmp_path, device="cpu")
324
+
325
+ assert type(adapter).__name__ == "Qwen3VLEmbeddingAdapter"
326
+ assert adapter.dims.dense == 2048
327
+
314
328
  def test_load_custom_adapter(self, tmp_path: Path) -> None:
315
329
  """Can load a custom adapter from file."""
316
330
  # Create custom adapter file
@@ -113,6 +113,7 @@ class TestConfigureLogging:
113
113
  def test_json_format_explicit(self, monkeypatch: pytest.MonkeyPatch) -> None:
114
114
  """Test explicit JSON format configuration."""
115
115
  monkeypatch.delenv("SIE_LOG_JSON", raising=False)
116
+ monkeypatch.delenv("SIE_LOG_LEVEL", raising=False)
116
117
 
117
118
  configure_logging(json_format=True)
118
119
 
@@ -123,6 +124,7 @@ class TestConfigureLogging:
123
124
  def test_text_format_explicit(self, monkeypatch: pytest.MonkeyPatch) -> None:
124
125
  """Test explicit text format configuration."""
125
126
  monkeypatch.delenv("SIE_LOG_JSON", raising=False)
127
+ monkeypatch.delenv("SIE_LOG_LEVEL", raising=False)
126
128
 
127
129
  configure_logging(json_format=False)
128
130
 
@@ -133,6 +135,7 @@ class TestConfigureLogging:
133
135
  def test_json_format_from_env(self, monkeypatch: pytest.MonkeyPatch) -> None:
134
136
  """Test JSON format from environment variable."""
135
137
  monkeypatch.setenv("SIE_LOG_JSON", "true")
138
+ monkeypatch.delenv("SIE_LOG_LEVEL", raising=False)
136
139
 
137
140
  configure_logging()
138
141
 
@@ -143,8 +146,38 @@ class TestConfigureLogging:
143
146
  def test_verbose_sets_debug_level(self, monkeypatch: pytest.MonkeyPatch) -> None:
144
147
  """Test verbose flag sets DEBUG level."""
145
148
  monkeypatch.delenv("SIE_LOG_JSON", raising=False)
149
+ monkeypatch.setenv("SIE_LOG_LEVEL", "INFO")
146
150
 
147
151
  configure_logging(verbose=True, json_format=False)
148
152
 
149
153
  root = logging.getLogger()
150
154
  assert root.level == logging.DEBUG
155
+
156
+ def test_sie_log_level_from_env(self, monkeypatch: pytest.MonkeyPatch) -> None:
157
+ """SIE_LOG_LEVEL controls root level when not verbose."""
158
+ monkeypatch.delenv("SIE_LOG_JSON", raising=False)
159
+ monkeypatch.setenv("SIE_LOG_LEVEL", "DEBUG")
160
+
161
+ configure_logging(json_format=False)
162
+
163
+ root = logging.getLogger()
164
+ assert root.level == logging.DEBUG
165
+
166
+ def test_level_name_param_over_env(self, monkeypatch: pytest.MonkeyPatch) -> None:
167
+ """Explicit level_name wins over SIE_LOG_LEVEL."""
168
+ monkeypatch.delenv("SIE_LOG_JSON", raising=False)
169
+ monkeypatch.setenv("SIE_LOG_LEVEL", "DEBUG")
170
+
171
+ configure_logging(json_format=False, level_name="WARNING")
172
+
173
+ root = logging.getLogger()
174
+ assert root.level == logging.WARNING
175
+
176
+ def test_invalid_log_level_falls_back_to_info(self, monkeypatch: pytest.MonkeyPatch) -> None:
177
+ monkeypatch.delenv("SIE_LOG_JSON", raising=False)
178
+ monkeypatch.setenv("SIE_LOG_LEVEL", "not-a-real-level")
179
+
180
+ configure_logging(json_format=False)
181
+
182
+ root = logging.getLogger()
183
+ assert root.level == logging.INFO
File without changes
File without changes
File without changes
File without changes
File without changes