isagellm-core 0.4.0.17__py2.py3-none-any.whl → 0.4.0.19__py2.py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (168) hide show
  1. isagellm_core-0.4.0.19.dist-info/METADATA +718 -0
  2. isagellm_core-0.4.0.19.dist-info/RECORD +174 -0
  3. {isagellm_core-0.4.0.17.dist-info → isagellm_core-0.4.0.19.dist-info}/WHEEL +1 -1
  4. sagellm_core/__init__.py +4 -22
  5. sagellm_core/__init__.pyc +0 -0
  6. sagellm_core/__main__.pyc +0 -0
  7. sagellm_core/__pycache__/__init__.cpython-311.pyc +0 -0
  8. sagellm_core/__pycache__/config.cpython-311.pyc +0 -0
  9. sagellm_core/__pycache__/demo.cpython-311.pyc +0 -0
  10. sagellm_core/__pycache__/engine.cpython-311.pyc +0 -0
  11. sagellm_core/__pycache__/engine_factory.cpython-311.pyc +0 -0
  12. sagellm_core/__pycache__/engine_server.cpython-311.pyc +0 -0
  13. sagellm_core/__pycache__/factory.cpython-311.pyc +0 -0
  14. sagellm_core/__pycache__/health.cpython-311.pyc +0 -0
  15. sagellm_core/__pycache__/llm_engine.cpython-311.pyc +0 -0
  16. sagellm_core/__pycache__/pd_executor.cpython-311.pyc +0 -0
  17. sagellm_core/__pycache__/plugins.cpython-311.pyc +0 -0
  18. sagellm_core/__pycache__/runner.cpython-311.pyc +0 -0
  19. sagellm_core/__pycache__/runtime.cpython-311.pyc +0 -0
  20. sagellm_core/__pycache__/workload.cpython-311.pyc +0 -0
  21. sagellm_core/config.pyc +0 -0
  22. sagellm_core/decoding/__init__.pyc +0 -0
  23. sagellm_core/decoding/__pycache__/__init__.cpython-311.pyc +0 -0
  24. sagellm_core/decoding/__pycache__/base.cpython-311.pyc +0 -0
  25. sagellm_core/decoding/__pycache__/beam_search.cpython-311.pyc +0 -0
  26. sagellm_core/decoding/__pycache__/contrastive.cpython-311.pyc +0 -0
  27. sagellm_core/decoding/__pycache__/greedy.cpython-311.pyc +0 -0
  28. sagellm_core/decoding/__pycache__/sampling.cpython-311.pyc +0 -0
  29. sagellm_core/decoding/base.pyc +0 -0
  30. sagellm_core/decoding/beam_search.pyc +0 -0
  31. sagellm_core/decoding/contrastive.pyc +0 -0
  32. sagellm_core/decoding/greedy.pyc +0 -0
  33. sagellm_core/decoding/sampling.pyc +0 -0
  34. sagellm_core/demo.pyc +0 -0
  35. sagellm_core/distributed/__init__.pyc +0 -0
  36. sagellm_core/distributed/__pycache__/__init__.cpython-311.pyc +0 -0
  37. sagellm_core/distributed/__pycache__/strategies.cpython-311.pyc +0 -0
  38. sagellm_core/distributed/strategies.pyc +0 -0
  39. sagellm_core/engine.pyc +0 -0
  40. sagellm_core/engine_core/__init__.pyc +0 -0
  41. sagellm_core/engine_core/__pycache__/__init__.cpython-311.pyc +0 -0
  42. sagellm_core/engine_core/__pycache__/engine_core.cpython-311.pyc +0 -0
  43. sagellm_core/engine_core/engine_core.pyc +0 -0
  44. sagellm_core/engine_core/scheduler/__init__.py +31 -3
  45. sagellm_core/engine_core/scheduler/__init__.pyc +0 -0
  46. sagellm_core/engine_core/scheduler/__pycache__/__init__.cpython-311.pyc +0 -0
  47. sagellm_core/engine_core/scheduler/__pycache__/base.cpython-311.pyc +0 -0
  48. sagellm_core/engine_core/scheduler/__pycache__/batch.cpython-311.pyc +0 -0
  49. sagellm_core/engine_core/scheduler/__pycache__/metrics.cpython-311.pyc +0 -0
  50. sagellm_core/engine_core/scheduler/__pycache__/scheduler.cpython-311.pyc +0 -0
  51. sagellm_core/engine_core/scheduler/__pycache__/scheduler_kv_bridge.cpython-311.pyc +0 -0
  52. sagellm_core/engine_core/scheduler/base.pyc +0 -0
  53. sagellm_core/engine_core/scheduler/batch.pyc +0 -0
  54. sagellm_core/engine_core/scheduler/metrics.pyc +0 -0
  55. sagellm_core/engine_core/scheduler/policy/__init__.py +6 -0
  56. sagellm_core/engine_core/scheduler/policy/__init__.pyc +0 -0
  57. sagellm_core/engine_core/scheduler/policy/__pycache__/__init__.cpython-311.pyc +0 -0
  58. sagellm_core/engine_core/scheduler/policy/__pycache__/fcfs.cpython-311.pyc +0 -0
  59. sagellm_core/engine_core/scheduler/policy/__pycache__/priority.cpython-311.pyc +0 -0
  60. sagellm_core/engine_core/scheduler/policy/fcfs.pyc +0 -0
  61. sagellm_core/engine_core/scheduler/policy/priority.pyc +0 -0
  62. sagellm_core/engine_core/scheduler/scheduler.pyc +0 -0
  63. sagellm_core/engine_core/scheduler/scheduler_kv_bridge.pyc +0 -0
  64. sagellm_core/engine_factory.pyc +0 -0
  65. sagellm_core/engine_server.pyc +0 -0
  66. sagellm_core/engines/__init__.pyc +0 -0
  67. sagellm_core/engines/__pycache__/__init__.cpython-311.pyc +0 -0
  68. sagellm_core/engines/__pycache__/ascend.cpython-311.pyc +0 -0
  69. sagellm_core/engines/__pycache__/cpu.cpython-311.pyc +0 -0
  70. sagellm_core/engines/__pycache__/embedding.cpython-311.pyc +0 -0
  71. sagellm_core/engines/__pycache__/hf_cuda.cpython-311.pyc +0 -0
  72. sagellm_core/engines/__pycache__/pytorch.cpython-311.pyc +0 -0
  73. sagellm_core/engines/__pycache__/pytorch_engine.cpython-311.pyc +0 -0
  74. sagellm_core/engines/embedding.pyc +0 -0
  75. sagellm_core/executor/__init__.pyc +0 -0
  76. sagellm_core/executor/__pycache__/__init__.cpython-311.pyc +0 -0
  77. sagellm_core/executor/__pycache__/executor_base.cpython-311.pyc +0 -0
  78. sagellm_core/executor/__pycache__/uniproc_executor.cpython-311.pyc +0 -0
  79. sagellm_core/executor/executor_base.pyc +0 -0
  80. sagellm_core/executor/uniproc_executor.pyc +0 -0
  81. sagellm_core/factory.pyc +0 -0
  82. sagellm_core/health.pyc +0 -0
  83. sagellm_core/inputs/__init__.pyc +0 -0
  84. sagellm_core/inputs/__pycache__/__init__.cpython-311.pyc +0 -0
  85. sagellm_core/inputs/__pycache__/processor.cpython-311.pyc +0 -0
  86. sagellm_core/inputs/__pycache__/tokenizer_utils.cpython-311.pyc +0 -0
  87. sagellm_core/inputs/processor.pyc +0 -0
  88. sagellm_core/inputs/tokenizer_utils.pyc +0 -0
  89. sagellm_core/layers/__init__.py +30 -0
  90. sagellm_core/layers/__init__.pyc +0 -0
  91. sagellm_core/layers/__pycache__/__init__.cpython-311.pyc +0 -0
  92. sagellm_core/layers/__pycache__/activation.cpython-311.pyc +0 -0
  93. sagellm_core/layers/__pycache__/base.cpython-311.pyc +0 -0
  94. sagellm_core/layers/__pycache__/embedding.cpython-311.pyc +0 -0
  95. sagellm_core/layers/__pycache__/linear.cpython-311.pyc +0 -0
  96. sagellm_core/layers/__pycache__/normalization.cpython-311.pyc +0 -0
  97. sagellm_core/layers/activation.pyc +0 -0
  98. sagellm_core/layers/base.pyc +0 -0
  99. sagellm_core/layers/embedding.pyc +0 -0
  100. sagellm_core/layers/linear.pyc +0 -0
  101. sagellm_core/layers/normalization.pyc +0 -0
  102. sagellm_core/llm_engine.pyc +0 -0
  103. sagellm_core/model/__init__.py +131 -5
  104. sagellm_core/model/__init__.pyc +0 -0
  105. sagellm_core/model/__pycache__/__init__.cpython-311.pyc +0 -0
  106. sagellm_core/model/__pycache__/base.cpython-311.pyc +0 -0
  107. sagellm_core/model/__pycache__/factory.cpython-311.pyc +0 -0
  108. sagellm_core/model/__pycache__/gpt2.cpython-311.pyc +0 -0
  109. sagellm_core/model/__pycache__/llama.cpython-311.pyc +0 -0
  110. sagellm_core/model/__pycache__/mixtral.cpython-311.pyc +0 -0
  111. sagellm_core/model/__pycache__/model_loader.cpython-311.pyc +0 -0
  112. sagellm_core/model/__pycache__/quantization.cpython-311.pyc +0 -0
  113. sagellm_core/model/__pycache__/qwen2.cpython-311.pyc +0 -0
  114. sagellm_core/model/__pycache__/registry.cpython-311.pyc +0 -0
  115. sagellm_core/model/__pycache__/weight_utils.cpython-311.pyc +0 -0
  116. sagellm_core/model/base.pyc +0 -0
  117. sagellm_core/model/factory.pyc +0 -0
  118. sagellm_core/model/gpt2.pyc +0 -0
  119. sagellm_core/model/llama.pyc +0 -0
  120. sagellm_core/model/mixtral.pyc +0 -0
  121. sagellm_core/model/model_loader.pyc +0 -0
  122. sagellm_core/model/quantization.pyc +0 -0
  123. sagellm_core/model/qwen2.pyc +0 -0
  124. sagellm_core/model/registry.pyc +0 -0
  125. sagellm_core/model/weight_loader/__init__.py +54 -0
  126. sagellm_core/model/weight_loader/__init__.pyc +0 -0
  127. sagellm_core/model/weight_loader/__pycache__/__init__.cpython-311.pyc +0 -0
  128. sagellm_core/model/weight_loader/__pycache__/base.cpython-311.pyc +0 -0
  129. sagellm_core/model/weight_loader/__pycache__/pytorch.cpython-311.pyc +0 -0
  130. sagellm_core/model/weight_loader/__pycache__/quantized.cpython-311.pyc +0 -0
  131. sagellm_core/model/weight_loader/__pycache__/safetensors.cpython-311.pyc +0 -0
  132. sagellm_core/model/weight_loader/base.pyc +0 -0
  133. sagellm_core/model/weight_loader/pytorch.pyc +0 -0
  134. sagellm_core/model/weight_loader/quantized.pyc +0 -0
  135. sagellm_core/model/weight_loader/safetensors.pyc +0 -0
  136. sagellm_core/model/weight_utils.pyc +0 -0
  137. sagellm_core/observability/__init__.pyc +0 -0
  138. sagellm_core/observability/__pycache__/__init__.cpython-311.pyc +0 -0
  139. sagellm_core/observability/__pycache__/logger.cpython-311.pyc +0 -0
  140. sagellm_core/observability/__pycache__/metrics.cpython-311.pyc +0 -0
  141. sagellm_core/observability/logger.pyc +0 -0
  142. sagellm_core/observability/metrics.pyc +0 -0
  143. sagellm_core/pd_executor.pyc +0 -0
  144. sagellm_core/plugins.pyc +0 -0
  145. sagellm_core/runner.pyc +0 -0
  146. sagellm_core/runtime.pyc +0 -0
  147. sagellm_core/sampling/__init__.pyc +0 -0
  148. sagellm_core/sampling/__pycache__/__init__.cpython-311.pyc +0 -0
  149. sagellm_core/sampling/__pycache__/params.cpython-311.pyc +0 -0
  150. sagellm_core/sampling/__pycache__/sampler.cpython-311.pyc +0 -0
  151. sagellm_core/sampling/params.pyc +0 -0
  152. sagellm_core/sampling/sampler.pyc +0 -0
  153. sagellm_core/worker/__init__.pyc +0 -0
  154. sagellm_core/worker/__pycache__/__init__.cpython-311.pyc +0 -0
  155. sagellm_core/worker/__pycache__/worker.cpython-311.pyc +0 -0
  156. sagellm_core/worker/model_runner/__init__.pyc +0 -0
  157. sagellm_core/worker/model_runner/__pycache__/__init__.cpython-311.pyc +0 -0
  158. sagellm_core/worker/model_runner/__pycache__/model_runner.cpython-311.pyc +0 -0
  159. sagellm_core/worker/model_runner/model_runner.pyc +0 -0
  160. sagellm_core/worker/worker.pyc +0 -0
  161. sagellm_core/workload.pyc +0 -0
  162. isagellm_core-0.4.0.17.dist-info/METADATA +0 -308
  163. isagellm_core-0.4.0.17.dist-info/RECORD +0 -122
  164. sagellm_core/__pycache__/base_engine.cpython-311.pyc +0 -0
  165. sagellm_core/__pycache__/mock_engine.cpython-311.pyc +0 -0
  166. sagellm_core/engines/__pycache__/mock.cpython-311.pyc +0 -0
  167. {isagellm_core-0.4.0.17.dist-info → isagellm_core-0.4.0.19.dist-info}/entry_points.txt +0 -0
  168. {isagellm_core-0.4.0.17.dist-info → isagellm_core-0.4.0.19.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,174 @@
1
+ sagellm_core/__init__.py,sha256=lXJheNgD5o1-7-EfOlGwCXs91Yomaxy4ZTNrSL7PmJ0,6355
2
+ sagellm_core/__init__.pyc,sha256=R60LStNbkJYjkw9Ok480ebMKjaeOBhNrpQn3Z-UQ1zM,4020
3
+ sagellm_core/__main__.pyc,sha256=_81UAvEI2ABP1lWBb048OKWxM4W95lobVNDFgz98wSg,384
4
+ sagellm_core/config.pyc,sha256=ktdBhyhAf9YrBrvCG1QziS4Y5l9YTXID79CjMtEw4Tw,8453
5
+ sagellm_core/demo.pyc,sha256=Lo_YBnu_k9qlC57vFwKQ2YcNNigTqLOB6-vlQB33zi0,6028
6
+ sagellm_core/engine.pyc,sha256=8ZhJNTvsl4BksUykALGZ8_SbUWr7UBIcd-dVzXHCW_k,12258
7
+ sagellm_core/engine_factory.pyc,sha256=FZoayMoeWtzvIVewzUd8EKRwOMxhkTo_w5LD7j9Ti5Q,14886
8
+ sagellm_core/engine_server.pyc,sha256=6566zyCwKgoTd0nLjOaA5q2EPBE6EyGU3jCkeaskHfo,19273
9
+ sagellm_core/factory.pyc,sha256=gu4m3nWOLPOL3Xd3q9C2X5zA_z2ggRqv5ldrSmMzqpo,2737
10
+ sagellm_core/health.pyc,sha256=G2MEAQSK8CC1TEuonKlAYisiYrUd1QxRC8QpiSiAiQI,684
11
+ sagellm_core/llm_engine.pyc,sha256=b8_1eymY_uvg9PJK97RbhjDuWn_7Y16BoGwr2MGcgNI,32483
12
+ sagellm_core/pd_executor.pyc,sha256=n7gvfeYAQA1PZdYCHIj90kdHUi2cPbtPMjExvBEmTHU,17970
13
+ sagellm_core/plugins.pyc,sha256=dpgURpeNuhdnle1Ui8xSb9kCWhdlE3BI7F3tq2_tG4U,2617
14
+ sagellm_core/py.typed,sha256=ixa8YukDZ3kLo0WsFJRGohLMyHzbMur1ALmmASML2cs,64
15
+ sagellm_core/runner.pyc,sha256=_sRztiSFepLu5Wl2DQsBNsCCtfcRC8GDZjDk2YZCTbc,14180
16
+ sagellm_core/runtime.pyc,sha256=SK4ZzkKQAK3efQokaIKb5ha30DZ3e42HLnhTwMJNRG0,10018
17
+ sagellm_core/workload.pyc,sha256=oXLJNnjbAI8oTgVFvhFzRysTno5-xabyLZiE2wVkUdQ,4127
18
+ sagellm_core/__pycache__/__init__.cpython-311.pyc,sha256=tLS8QIreF81JH9tkRIxARZKRwecRklEkA1-VSTw0-b0,4064
19
+ sagellm_core/__pycache__/config.cpython-311.pyc,sha256=4KZjBCv_6xE1yTw5rhddE1QeUdHsAOA4pjm-J3zyEx4,8497
20
+ sagellm_core/__pycache__/demo.cpython-311.pyc,sha256=ObO59vU-p7ryKr4B8R0dtnlJNHmQtQ80htb6DWurgpM,6072
21
+ sagellm_core/__pycache__/engine.cpython-311.pyc,sha256=lJG2v0M8nQiSeMhp9hJ7jTYM5_j4W1zlC2hyKbOTeFY,12302
22
+ sagellm_core/__pycache__/engine_factory.cpython-311.pyc,sha256=xUAN2_eFMySJT8KEaOHYFDDSpgcDUXNW581Bj5S5Jkk,14930
23
+ sagellm_core/__pycache__/engine_server.cpython-311.pyc,sha256=oYG5-hZKVgTpVly1T1khhX_tyIzrbF0TUTX02JwmD8s,19317
24
+ sagellm_core/__pycache__/factory.cpython-311.pyc,sha256=UeONZctwWSrRyIcAeR2wQWc0cGUNIgu4vYSMVdtokos,2781
25
+ sagellm_core/__pycache__/health.cpython-311.pyc,sha256=6v3mRLjfqNaCVb0xoyoQCzriPkDEKweV98hmKcE1A64,728
26
+ sagellm_core/__pycache__/llm_engine.cpython-311.pyc,sha256=K6MBHMV880RuCimXLEn_pKrKgOh1bObIgV8Bf6xRA8g,32527
27
+ sagellm_core/__pycache__/pd_executor.cpython-311.pyc,sha256=YuY1Y4D-2MZaz99_Id6hB67PDHyKMqujVXItaOPHiuw,18014
28
+ sagellm_core/__pycache__/plugins.cpython-311.pyc,sha256=n9qa5tqPUcoAOxzBIhs1JiU1-F_2hxT06yymA7RSbhM,2661
29
+ sagellm_core/__pycache__/runner.cpython-311.pyc,sha256=CyHAg_u0xHq3QKNxEbunK78Gd1klAYDKZlnAuscl_t8,14224
30
+ sagellm_core/__pycache__/runtime.cpython-311.pyc,sha256=wBRGFV3TRmtNz9nuc8IDa-E7xMgGQe6MQ3oWZH4hHRY,10062
31
+ sagellm_core/__pycache__/workload.cpython-311.pyc,sha256=xkb7dQAy-4soQ9KjrYLud4WGcaPKpT0gzk9Otp_A_5I,4171
32
+ sagellm_core/decoding/__init__.py,sha256=P9u4AgMYaPlhcgIfvT0V8JZ_51Vn58Js52QiNHfYgYE,1386
33
+ sagellm_core/decoding/__init__.pyc,sha256=_L9S72b85H7UVNLP5odDBhrHV20-z8SvDlde53vznUs,1837
34
+ sagellm_core/decoding/base.pyc,sha256=vocBsZUgYMxl9zaREJF4ETf_iSyM2bdI8WaogrUrFsg,1685
35
+ sagellm_core/decoding/beam_search.pyc,sha256=mRi2S8IwqAwg4K4GfvV8cRtpsEPzRfMjr2HwfeTubrc,1396
36
+ sagellm_core/decoding/contrastive.pyc,sha256=E3BcEZ_ZfkMCLV6KPvJj-GKmxLNTQnd5qvmx9hoAM2w,1373
37
+ sagellm_core/decoding/greedy.pyc,sha256=i1vUrviyddpCNPyhKR_wXhMCs8-W5KE2Z6aY2f-WV4I,1203
38
+ sagellm_core/decoding/sampling.pyc,sha256=rOQMdm1otppsQobImKaa4Qy52QGrgo72iRJ7NspLkZM,1712
39
+ sagellm_core/decoding/__pycache__/__init__.cpython-311.pyc,sha256=tMwO6gxnmWHKfziP2_XyonOqC3lE2lNFXge2SWuLDrk,1881
40
+ sagellm_core/decoding/__pycache__/base.cpython-311.pyc,sha256=InA-thn6n7iC5MVFgnnVndoqBBO1vAJcvaeAE9EENwo,1729
41
+ sagellm_core/decoding/__pycache__/beam_search.cpython-311.pyc,sha256=gj0q4Ww6fteei0tNXjaZyRSYo6E-0I9erUg9M2VTNfo,1440
42
+ sagellm_core/decoding/__pycache__/contrastive.cpython-311.pyc,sha256=cC2XMgtpt6idxhLUjvawQl9RuTa6Ik_efywf-dsfF20,1417
43
+ sagellm_core/decoding/__pycache__/greedy.cpython-311.pyc,sha256=pHAZg7gRPq2rrv2J_NGONeIvkGE08gvb2jTEzafxBPc,1247
44
+ sagellm_core/decoding/__pycache__/sampling.cpython-311.pyc,sha256=hx9rkhbkPUnoUU_i_cIRgoe7RbR5y4nP9mM044in_Og,1756
45
+ sagellm_core/distributed/__init__.py,sha256=8WTrKkZmYGrV7pj3L083496LskHAv3BOULEIZflgBTc,328
46
+ sagellm_core/distributed/__init__.pyc,sha256=AO5IqU7iT0QdxM-aM5Qto4x3J0ZUTG3pkAlHbCobIy8,498
47
+ sagellm_core/distributed/strategies.pyc,sha256=J2S7SkIt9MStA5hgm1zOLe4hm5RIO8eFAIKzd1vXLFY,6061
48
+ sagellm_core/distributed/__pycache__/__init__.cpython-311.pyc,sha256=Q1D9T2ERrFnXz8GnW0qjPGwP_vAVkSJTMvBwN8Szcn8,542
49
+ sagellm_core/distributed/__pycache__/strategies.cpython-311.pyc,sha256=oVq8fDQ7qMBtDFD1U5qF4gyndHifmqnwXVlShLf4P4Q,6105
50
+ sagellm_core/engine_core/__init__.py,sha256=wG6ONHCRWk4ScU6WwW8f-qL3xITF5OcqbxBHGKAAwd4,314
51
+ sagellm_core/engine_core/__init__.pyc,sha256=evEMExxwDoRFpVkyAGhlaqxeHQP4XFgMHsIYniaTUCI,502
52
+ sagellm_core/engine_core/engine_core.pyc,sha256=tVKyU4xLpy4WX0na6Fa_sCjVGUY7e686XXd9edCidCM,8790
53
+ sagellm_core/engine_core/__pycache__/__init__.cpython-311.pyc,sha256=WtEUv3r0QBw1Jop1bsxnAPDpsmyG_54zANlLh5MERW4,546
54
+ sagellm_core/engine_core/__pycache__/engine_core.cpython-311.pyc,sha256=_KFHXAO7X2qvSWCsHfGgDpJ_JQqkZw9vR0otvc2tKZs,8834
55
+ sagellm_core/engine_core/scheduler/__init__.py,sha256=QJ2cRDyc7U-WHQIX2dLtlalrYXS4-6ZSSEG5sY9r2OQ,1390
56
+ sagellm_core/engine_core/scheduler/__init__.pyc,sha256=JAYSwGjf9J1x-y0iaJ9_IDMU5R4oCktUPIC8-l7SXmg,1553
57
+ sagellm_core/engine_core/scheduler/base.pyc,sha256=4aoA1G8cPpEgZq4KpC__Kz2M3rvmYm9vdpmWmFMe-RY,5778
58
+ sagellm_core/engine_core/scheduler/batch.pyc,sha256=8agGr53XfgF71l35hHC8pIN5sOJBmAEf7QFjQeIDtx4,3856
59
+ sagellm_core/engine_core/scheduler/metrics.pyc,sha256=z3-EZnTMeJa_mCWvtnt710l82EyNEBAnlEodV_8NVNM,6183
60
+ sagellm_core/engine_core/scheduler/scheduler.pyc,sha256=CJFop1Y12B856BffdTLgqaFq-Mx-fVftNWVURO3cS7g,27116
61
+ sagellm_core/engine_core/scheduler/scheduler_kv_bridge.pyc,sha256=KU-JJaBV5I5jz5pE6INP13m_QZK-sn-bxiCuTlQakvw,12194
62
+ sagellm_core/engine_core/scheduler/__pycache__/__init__.cpython-311.pyc,sha256=3L57db_9-YkfCj1FBpKwwqBzuz1qiXWYo23HLVDqU_8,1597
63
+ sagellm_core/engine_core/scheduler/__pycache__/base.cpython-311.pyc,sha256=PGXAM6ujO8bGLK00YbD1sxMB1i8y2-IQ6eQtyCZ49S8,5822
64
+ sagellm_core/engine_core/scheduler/__pycache__/batch.cpython-311.pyc,sha256=AS5jLQeyh57kRMaDpyKgjf4_A0SiLWRHuOdbrT0unNY,3900
65
+ sagellm_core/engine_core/scheduler/__pycache__/metrics.cpython-311.pyc,sha256=4g_HimozpwLEraPEkY4F64CGxSoIOT08P1FI3f-kALk,6227
66
+ sagellm_core/engine_core/scheduler/__pycache__/scheduler.cpython-311.pyc,sha256=TCXzNw-VcLgFw2QZ9onEhxUPfGT3QV-kArjcBKr2vVo,27160
67
+ sagellm_core/engine_core/scheduler/__pycache__/scheduler_kv_bridge.cpython-311.pyc,sha256=ajexkkJfgwghsAcbdRcZLd_gH_HOvo2f2_Z4SNeuHg0,12238
68
+ sagellm_core/engine_core/scheduler/policy/__init__.py,sha256=d5w_189s0cd8fAmCRSzz1rTpYPZab3AFFwpW3Id1LTo,249
69
+ sagellm_core/engine_core/scheduler/policy/__init__.pyc,sha256=J83Agt3POsKXp7-xSyFNRoscOxUYwiukxEHQr-EKUyI,468
70
+ sagellm_core/engine_core/scheduler/policy/fcfs.pyc,sha256=sVyTOrmwOmi5q7XL3exOMk0qEPMvv5pjrigQ7zgX2Ys,6670
71
+ sagellm_core/engine_core/scheduler/policy/priority.pyc,sha256=fuT9NrJv3Bqufnzqz1QC-TR5pinVsRK0fDB8g8yp1VI,6813
72
+ sagellm_core/engine_core/scheduler/policy/__pycache__/__init__.cpython-311.pyc,sha256=bhiMfXveF2TZEfkBYozPDOA0IMgTRYD2OU8NHxJvfpo,512
73
+ sagellm_core/engine_core/scheduler/policy/__pycache__/fcfs.cpython-311.pyc,sha256=Nth8zT4rSCRFSJOg4fs2xGwWN_AJElogaG0L9NDIPso,6714
74
+ sagellm_core/engine_core/scheduler/policy/__pycache__/priority.cpython-311.pyc,sha256=ZlYzaSnSnJgCunFmQpJt7pBMOljvXdpDJlTpI3wmcbI,6857
75
+ sagellm_core/engines/__init__.py,sha256=eRxLCXebcl0DqhMh4J3yPcpmoSMtZzjWjCXNku0hcek,865
76
+ sagellm_core/engines/__init__.pyc,sha256=IvYGoZ-rasQT93EADKUxskfHjhW7hLTaMsaxf9hvmwQ,934
77
+ sagellm_core/engines/embedding.pyc,sha256=vj07-CNm1zrlmDo7RpcX3h43AWTP-r7qF1UIVWpNEdw,12189
78
+ sagellm_core/engines/__pycache__/__init__.cpython-311.pyc,sha256=EXx-tB8C1aUA1DVez3F2GRvtBzj8Qizhuf2wM5541Is,978
79
+ sagellm_core/engines/__pycache__/ascend.cpython-311.pyc,sha256=rBTOaG6tOcFm0ZjBP701UTLQudW7OdroTfycR-BfyhI,17307
80
+ sagellm_core/engines/__pycache__/cpu.cpython-311.pyc,sha256=g9GrBDXtdmJMf9LKK4NWYdLW1N-yb6HThRMp5tfH9Jg,29330
81
+ sagellm_core/engines/__pycache__/embedding.cpython-311.pyc,sha256=iYhVvD8JBZcSp4xrNYEo-f4YfaAkZxLrQ-fhtHL6xno,12233
82
+ sagellm_core/engines/__pycache__/hf_cuda.cpython-311.pyc,sha256=sIXd-cq2T__5B2uYUz3u_Fdb46EXSHSBq6LWcVGIbO0,61147
83
+ sagellm_core/engines/__pycache__/pytorch.cpython-311.pyc,sha256=Grw94kmuWI3YJiElmxDvzyM-zyV-H-o3xRtIqtODUnA,18452
84
+ sagellm_core/engines/__pycache__/pytorch_engine.cpython-311.pyc,sha256=TrwvIobQZWMPGW4GAN8H5hkydR1E3_az0fZojU5_EjM,15644
85
+ sagellm_core/executor/__init__.py,sha256=Acm1uxVigM823XnTaJ2UC_mSgTIlvtHb6uX076tMSN0,507
86
+ sagellm_core/executor/__init__.pyc,sha256=khWBYZiUBe87zjIB4H72DvD7kU1jXD1REmfnpEi-bZI,705
87
+ sagellm_core/executor/executor_base.pyc,sha256=J10pQgxDt_dYRJUIS7ht46fETgPR1S3NpgTrTdJA-aQ,4759
88
+ sagellm_core/executor/uniproc_executor.pyc,sha256=sQ4mFn2K6cNo6yDs308A1Bvi5qzK5omb6WvljF793j8,4940
89
+ sagellm_core/executor/__pycache__/__init__.cpython-311.pyc,sha256=LoHU2Z7wWw4Lvss8iiLVgTZWe35-b7SXXblwzyY5mB0,749
90
+ sagellm_core/executor/__pycache__/executor_base.cpython-311.pyc,sha256=-9h0dT5Bwra6VWjhsr3vKYCIn5ZM-HohzmNk7JeJQNU,4803
91
+ sagellm_core/executor/__pycache__/uniproc_executor.cpython-311.pyc,sha256=kJ6tDBq5yh1cmBAUPTX1lbByuhUQjUmOfL4l7FvG9WQ,4984
92
+ sagellm_core/inputs/__init__.py,sha256=t_DP0n7Cx-L9BiniDcKHBcg6IK6EVCs8J7GRbAwPbLk,301
93
+ sagellm_core/inputs/__init__.pyc,sha256=ocGa1p3NXflh1TXdOljNxry1PCd9msOO2FCg3Uzy2TU,513
94
+ sagellm_core/inputs/processor.pyc,sha256=y95MlzBEeZO1U_oNDNtCDPuhRGP0INbKEONnL-xVUPQ,3641
95
+ sagellm_core/inputs/tokenizer_utils.pyc,sha256=acCTNBubOb5NnC3oq7GhUNzI1ijM5FMTVqWkjzpxmY8,2871
96
+ sagellm_core/inputs/__pycache__/__init__.cpython-311.pyc,sha256=Sw3jm2TybH0c1wcxIZcztl1v-FpmvxffvKuH6dxPH5A,557
97
+ sagellm_core/inputs/__pycache__/processor.cpython-311.pyc,sha256=VCCNAVklX7UM4rwpHQOM_YRa2UIN7NbQarz0b42ZvZU,3685
98
+ sagellm_core/inputs/__pycache__/tokenizer_utils.cpython-311.pyc,sha256=yyyO--2Z9Dj-0iI95bdgfBP3TvIQ6RRNJ5wY1NB9ibU,2915
99
+ sagellm_core/layers/__init__.py,sha256=3Qis9XQHijuy-3k7ByX-ehUoO016EkcBXtEgCYJ5Wvo,894
100
+ sagellm_core/layers/__init__.pyc,sha256=PY9yzqCUnLbU3Jz4zvJvKopVTnuzuCTpr6f9FUdDLIY,1151
101
+ sagellm_core/layers/activation.pyc,sha256=ARmpihbwjqa6YioXajFXpeDPAfZUtGalXQuUQtuhgNQ,3998
102
+ sagellm_core/layers/base.pyc,sha256=IcmttxQtodOjEACkkp1CU6vNeWdAXS3bW95dLjtwWUk,3114
103
+ sagellm_core/layers/embedding.pyc,sha256=9hleCHHWfxMfwMfcHyFwBON3OUROAoctKd_82L8RaPQ,6610
104
+ sagellm_core/layers/linear.pyc,sha256=qLUYMsiosQasdK8aIsRNtqgIL27f3f0npW4lc83wv-s,10855
105
+ sagellm_core/layers/normalization.pyc,sha256=JVvKoFuTBmxNJ8cYZXohZpvwBuvunsc004Aw_CJ1DOA,5757
106
+ sagellm_core/layers/__pycache__/__init__.cpython-311.pyc,sha256=2ZEXCsw_KolZ6hrEXHwSUz0kNHzlNa1ELXLq16KQnrY,1195
107
+ sagellm_core/layers/__pycache__/activation.cpython-311.pyc,sha256=u3ic6THNcazgquywM5TgpZi9aRWUYJPxbdpYNrmyDcA,4042
108
+ sagellm_core/layers/__pycache__/base.cpython-311.pyc,sha256=nG8GybGx1xohSyJD6U9PK8Bk3bOvGMG8iba7YTrLEqI,3158
109
+ sagellm_core/layers/__pycache__/embedding.cpython-311.pyc,sha256=Ekfi0ERpqbKgmuRnACQ1WJUEj66QldemjSaiX172M-Q,6654
110
+ sagellm_core/layers/__pycache__/linear.cpython-311.pyc,sha256=UnMeRZhlG4gpFa_CIU0l1SE4eH5BFE0Hme1_DO9EY2Q,10899
111
+ sagellm_core/layers/__pycache__/normalization.cpython-311.pyc,sha256=hUhYUYUTHIVhm6BpZ3_33kZqcf743Ej8BTDUynjg5mE,5801
112
+ sagellm_core/model/__init__.py,sha256=P2yGYFm7AfE9jKtCusNOiAOPFw9fGZTqfyuz1cOYxqo,3452
113
+ sagellm_core/model/__init__.pyc,sha256=ZZ7JTzSp5_WTW3wiyBAWGRKVXsScNf6r5LI8Is6dFX4,3370
114
+ sagellm_core/model/base.pyc,sha256=r-DpzMx9nUYgFSl2GS0zk7R9offTEUXAf6y656xWYk0,8218
115
+ sagellm_core/model/factory.pyc,sha256=IYCm18ytcZPhO0lP4unH9feZUJGTMWCyPh6e9kVD8BE,9399
116
+ sagellm_core/model/gpt2.pyc,sha256=ePTJVNy14Pl0L44WwG5KWZj_u2MMFrz-tq8Wg_SqZMQ,9993
117
+ sagellm_core/model/llama.pyc,sha256=HHQ8hRa4HLQ_poOl382TEP9IgAE1OUhpHTma1tor4yM,24446
118
+ sagellm_core/model/mixtral.pyc,sha256=dOD5Y_zqn2y2pJlaQ4dw0-ZNg6QTb4XiuSSQoUrRVls,15955
119
+ sagellm_core/model/model_loader.pyc,sha256=WN2g_XenQTLKSngxkNSTxBIttBwK93yXTnyJe6hd-r8,5822
120
+ sagellm_core/model/quantization.pyc,sha256=kPCBC3zCYnxqyrVYiuSuaewsgmvZcuhtJWZNwE0lsKk,5478
121
+ sagellm_core/model/qwen2.pyc,sha256=9AxgiLbzp_tu8beLTLRQwn1YK7UOVKhCDbAH4ES1-Ak,17885
122
+ sagellm_core/model/registry.pyc,sha256=DVOsvbPosGiMQAk45UvWpqbCaRzxrP2f8W2F4SJ0uAM,5334
123
+ sagellm_core/model/weight_utils.pyc,sha256=mwBOldZZjyhpld__gZ651cHJYHgVhiYKQmXEFoB_3gM,1830
124
+ sagellm_core/model/__pycache__/__init__.cpython-311.pyc,sha256=UfGaLmaK5sFurKzGQs7Rv0nfBmz4yQ_G8vETIQl_Ibo,3414
125
+ sagellm_core/model/__pycache__/base.cpython-311.pyc,sha256=2xTfORrmZ61p7Nca_7QMGc4ZxOiswzpMlQ0thgArkBI,8262
126
+ sagellm_core/model/__pycache__/factory.cpython-311.pyc,sha256=wI8swBf0Tc5s8uq48jK23J0o3s9-u2et--IvbAnEN_A,9443
127
+ sagellm_core/model/__pycache__/gpt2.cpython-311.pyc,sha256=IL_inxu83zASGeo33Bp0L5xgCbooj7OnEcj7CgMI2Gs,10037
128
+ sagellm_core/model/__pycache__/llama.cpython-311.pyc,sha256=MQxAWSnOc3zifbPsS3D_L0BYM99-wkuxo6fGHG7dqc0,24490
129
+ sagellm_core/model/__pycache__/mixtral.cpython-311.pyc,sha256=K7H-DEg6Nk4ra_tnHQJs-qwoj7mv4Ow1luQIGkIX4UE,15999
130
+ sagellm_core/model/__pycache__/model_loader.cpython-311.pyc,sha256=QPEOn7LbYCHvj-G-3cSsrKnPtTcx-p_dC9tTILP91cA,5866
131
+ sagellm_core/model/__pycache__/quantization.cpython-311.pyc,sha256=96E_bn7CRIDDswyrAGn8EgipcSBC51Oc02-IL7hqCo4,5522
132
+ sagellm_core/model/__pycache__/qwen2.cpython-311.pyc,sha256=rlXcbdEemEj3OvQJv9iqLEv_npy_K-jirUgP_8erzN4,17929
133
+ sagellm_core/model/__pycache__/registry.cpython-311.pyc,sha256=tM5qGpTDp2RBrEO-b5eEeTqkQHDIcfFMPOGo-hpDoRg,5378
134
+ sagellm_core/model/__pycache__/weight_utils.cpython-311.pyc,sha256=a0Wv5tKBy9n2YNGPrkmSBSV8BGa7rOzNJnjbxEvWoIU,1874
135
+ sagellm_core/model/weight_loader/__init__.py,sha256=hKYqGfvGcZ_o9VS6GTBP_IHuN39qikPzRGo5Yu-uTec,1474
136
+ sagellm_core/model/weight_loader/__init__.pyc,sha256=xTGuqPCTmVrk63JYimNGCUUYb18SRCidmIp3IwAlTrw,1521
137
+ sagellm_core/model/weight_loader/base.pyc,sha256=ccL1XcOpKdYFDx9iPdEA0KlYD0rtiXmcY7SOYfRltYs,12850
138
+ sagellm_core/model/weight_loader/pytorch.pyc,sha256=_Jl5oVFOTx2snRWJLNcLyaNk7x40Yg5Kk3ZDbvxWohA,6945
139
+ sagellm_core/model/weight_loader/quantized.pyc,sha256=ahsXyYEVz8n4C_3NJcC8RLxbTKVGu9Q12SlLl4_BwtM,14090
140
+ sagellm_core/model/weight_loader/safetensors.pyc,sha256=_13Tblgcmaz3gSJdlXLG9krcwIDFTkz3lb5QDCYsdq4,8911
141
+ sagellm_core/model/weight_loader/__pycache__/__init__.cpython-311.pyc,sha256=vzcetCFSikIqw9q5J-59FSfMvVjmMG9t-w3KU9CGl6E,1565
142
+ sagellm_core/model/weight_loader/__pycache__/base.cpython-311.pyc,sha256=1atSyz848y72l7qfbvSgVTU1HPCv5I1Vlc5pdFtMHTA,12894
143
+ sagellm_core/model/weight_loader/__pycache__/pytorch.cpython-311.pyc,sha256=QDOq4W0KQlIS4_DB76SHZakAVBrPIoQfbP6tBghdccQ,6989
144
+ sagellm_core/model/weight_loader/__pycache__/quantized.cpython-311.pyc,sha256=_iDAjyuSyc1r7McM35_SdpOoeOE7I-l1o-aSw_KTJmY,14134
145
+ sagellm_core/model/weight_loader/__pycache__/safetensors.cpython-311.pyc,sha256=zAET47I4KzgIhYgsfRE1RguvgaLSqz-OnDoAx3RPgL0,8955
146
+ sagellm_core/observability/__init__.py,sha256=lT3qt-69vwH3KlxqN0H_hjknmaXl8Yx2Q3PrWifNvd8,378
147
+ sagellm_core/observability/__init__.pyc,sha256=AgMxpuktnXApjcskYhtZu9txYykL0zA5pxA88GFdyZ4,608
148
+ sagellm_core/observability/logger.pyc,sha256=L4plrgadkvv45aDqMkKoj49NESFixBb_Ul1dVqu1PSQ,1910
149
+ sagellm_core/observability/metrics.pyc,sha256=BPH0Cs4BozpOGEzqzQJ8WpG_uSrWMj_p2ZpfoYPiTqA,6314
150
+ sagellm_core/observability/__pycache__/__init__.cpython-311.pyc,sha256=uAvN7NoVbwrmGEv9Y-9jFEfvLyuVFxS5dw9KW3S3NnQ,652
151
+ sagellm_core/observability/__pycache__/logger.cpython-311.pyc,sha256=PGUrMdntSbemDjZ4bBvbE6T5T0ayRc9u_6EwlVPai8c,1954
152
+ sagellm_core/observability/__pycache__/metrics.cpython-311.pyc,sha256=1fDSo9sL5Lu7Ft9NnpBcaWL4e04xdN8ypfBNNofwmBY,6358
153
+ sagellm_core/sampling/__init__.py,sha256=H8b1UnwiYfMP2rODrjDJXvoI8fRTyfCoDImHRstIDGg,330
154
+ sagellm_core/sampling/__init__.pyc,sha256=SNCG-L_cGlWWNFtcRIgd5PkjPCRbcxMaCA4y7ROMfYQ,556
155
+ sagellm_core/sampling/params.pyc,sha256=y_RtIZycw1hL__9beE1kPsfHUYf9r_bnh3K8w33Pr5s,3391
156
+ sagellm_core/sampling/sampler.pyc,sha256=Q9IgFuLffD_auKmaxqkSpOvHox_1jO0vMxn9rJwhDos,6721
157
+ sagellm_core/sampling/__pycache__/__init__.cpython-311.pyc,sha256=X_CSHSW5HfR5cF6XT_QjePpVL0yNXvApBerCQ_FD2Jc,600
158
+ sagellm_core/sampling/__pycache__/params.cpython-311.pyc,sha256=OWmwd4OPH7fvtPXu52OG6EwxreoIdXG0TnSVhSkoG0k,3435
159
+ sagellm_core/sampling/__pycache__/sampler.cpython-311.pyc,sha256=P8WXBrbB7mPizwNDxKJmlrO2gzLUCSFhZsZsHt0v1aA,6765
160
+ sagellm_core/worker/__init__.py,sha256=isHAvgRYHX_HBRQsJtB72ziV4xeSDyjR1xFH3h_HEHQ,258
161
+ sagellm_core/worker/__init__.pyc,sha256=BDzN0RkdOZUdff5r5sgymVbDzH47QDBqZW8VHzWSNMw,445
162
+ sagellm_core/worker/worker.pyc,sha256=gOZqeyw33WGypXtk5yq5wkRVyZ_wZjem6_GrmhJEe2k,4772
163
+ sagellm_core/worker/__pycache__/__init__.cpython-311.pyc,sha256=82GLZqYvY4lOSFPyl4ZJd12Az0xB1YIbtvIxo2q1bOI,489
164
+ sagellm_core/worker/__pycache__/worker.cpython-311.pyc,sha256=j-Bly_YPvAlXoLcAZsFYMM9vO4EQFOcgxLylaYp44l4,4816
165
+ sagellm_core/worker/model_runner/__init__.py,sha256=w4cq2JoxfHYNUQI3jXO-XhFCoYxNg6YHkioK-S3Ayro,246
166
+ sagellm_core/worker/model_runner/__init__.pyc,sha256=56vUUVM9SnXbQLa2o34DSrmwgCIsygG5dRILepb9CFA,447
167
+ sagellm_core/worker/model_runner/model_runner.pyc,sha256=YfoP-CAE7wz5XQojKlJyb4vXmSpjzhW-z8OKBxZBndE,17056
168
+ sagellm_core/worker/model_runner/__pycache__/__init__.cpython-311.pyc,sha256=SBuQvwarzMcetpu5Cda0yrjgPXxobuCs5TlbC-K1jP0,491
169
+ sagellm_core/worker/model_runner/__pycache__/model_runner.cpython-311.pyc,sha256=Y7oUKzfUdvFCWQwyfQf1TAUWLoLtwE6dy_GJqsG1X9c,17100
170
+ isagellm_core-0.4.0.19.dist-info/METADATA,sha256=u3G4oNtrSRM8WElqF1wR_REm_hq2J2wBjcqdjNBikr8,22827
171
+ isagellm_core-0.4.0.19.dist-info/WHEEL,sha256=JNWh1Fm1UdwIQV075glCn4MVuCRs0sotJIq-J6rbxCU,109
172
+ isagellm_core-0.4.0.19.dist-info/entry_points.txt,sha256=w0kgbHe7jVNOuy785wFMEBwqoZUnfU24HCImsQII3y0,64
173
+ isagellm_core-0.4.0.19.dist-info/top_level.txt,sha256=wcgdWrvkaoYYh_dWSFI5Toi8PZsHutVqfhTB2tb0K6g,13
174
+ isagellm_core-0.4.0.19.dist-info/RECORD,,
@@ -1,5 +1,5 @@
1
1
  Wheel-Version: 1.0
2
- Generator: setuptools (80.10.2)
2
+ Generator: setuptools (80.9.0)
3
3
  Root-Is-Purelib: true
4
4
  Tag: py2-none-any
5
5
  Tag: py3-none-any
sagellm_core/__init__.py CHANGED
@@ -26,7 +26,7 @@ Architecture (vLLM v1 style):
26
26
 
27
27
  from __future__ import annotations
28
28
 
29
- __version__ = "0.4.0.16"
29
+ __version__ = "0.4.0.19"
30
30
 
31
31
  # ============================================================================
32
32
  # New Architecture (vLLM v1 style) - Hardware Agnostic
@@ -47,7 +47,8 @@ from sagellm_core.worker.model_runner import ModelRunner
47
47
  # ============================================================================
48
48
  # Legacy Architecture (still supported, being refactored)
49
49
  # ============================================================================
50
- from sagellm_core.engine import BaseEngine, EngineInstanceConfig
50
+ # NOTE: BaseEngine and EngineFactory have been removed (issue #24).
51
+ # Use LLMEngine instead - the unified hardware-agnostic engine.
51
52
  from sagellm_core.config import (
52
53
  BackendConfig,
53
54
  DemoConfig,
@@ -58,14 +59,6 @@ from sagellm_core.config import (
58
59
  load_config,
59
60
  )
60
61
  from sagellm_core.demo import main as demo_main
61
- from sagellm_core.engine_factory import EngineFactory
62
-
63
- # Only EmbeddingEngine remains from legacy engines
64
- from sagellm_core.engines import (
65
- EmbeddingEngine,
66
- EmbeddingEngineConfig,
67
- )
68
- from sagellm_core.factory import create_backend, create_engine
69
62
  from sagellm_core.health import HealthStatus
70
63
  from sagellm_core.plugins import PluginResolutionError, list_entry_points, resolve_kind
71
64
  from sagellm_core.runner import DemoRunner, RunnerContext
@@ -159,19 +152,8 @@ __all__ = [
159
152
  "WorkloadConfig",
160
153
  "WorkloadSegment",
161
154
  "load_config",
162
- # Engine abstraction
163
- "BaseEngine",
164
- "EngineInstanceConfig", # For runtime engine instantiation
155
+ # Health status
165
156
  "HealthStatus",
166
- # Engine implementations
167
- # DEPRECATED: Old engines removed, use LLMEngine instead
168
- # Only EmbeddingEngine remains for embedding-only use cases
169
- "EmbeddingEngine",
170
- "EmbeddingEngineConfig",
171
- # Factory functions
172
- "create_backend",
173
- "create_engine",
174
- "EngineFactory",
175
157
  # Plugin system
176
158
  "PluginResolutionError",
177
159
  "list_entry_points",
sagellm_core/__init__.pyc CHANGED
Binary file
sagellm_core/__main__.pyc CHANGED
Binary file
sagellm_core/config.pyc CHANGED
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
sagellm_core/demo.pyc CHANGED
Binary file
Binary file
Binary file
sagellm_core/engine.pyc CHANGED
Binary file
Binary file
Binary file
@@ -1,19 +1,47 @@
1
1
  """Scheduler - Request scheduling for Continuous Batching.
2
2
 
3
3
  The Scheduler is responsible for:
4
- 1. Selecting which requests to run in the next step
5
- 2. Managing prefill vs decode scheduling
6
- 3. Preemption decisions
4
+ 1. Selecting which requests to run in the next step (via pluggable policies)
5
+ 2. Managing KV cache allocation (via SchedulerKVBridge)
6
+ 3. Separating prefill vs decode batches
7
+ 4. Preemption decisions (future)
8
+
9
+ Key Components:
10
+ - ContinuousBatchingScheduler: Main scheduler class
11
+ - SchedulerKVBridge: Thin wrapper around sagellm-kv-cache
12
+ - SchedulerPolicy: Pluggable admission control (FCFS, Priority, etc.)
13
+ - Batch: Prefill or decode batch with block_tables
7
14
  """
8
15
 
16
+ from sagellm_core.engine_core.scheduler.base import (
17
+ SchedulerPolicy,
18
+ get_policy,
19
+ list_policies,
20
+ register_policy,
21
+ )
22
+ from sagellm_core.engine_core.scheduler.batch import Batch
23
+ from sagellm_core.engine_core.scheduler.metrics import RequestMetadata, SchedulerMetrics
9
24
  from sagellm_core.engine_core.scheduler.scheduler import (
10
25
  ContinuousBatchingScheduler,
11
26
  SchedulerConfig,
12
27
  SchedulerOutput,
13
28
  )
29
+ from sagellm_core.engine_core.scheduler.scheduler_kv_bridge import SchedulerKVBridge
14
30
 
15
31
  __all__ = [
32
+ # Main classes
16
33
  "ContinuousBatchingScheduler",
17
34
  "SchedulerConfig",
18
35
  "SchedulerOutput",
36
+ "Batch",
37
+ # KV bridge
38
+ "SchedulerKVBridge",
39
+ # Policy system
40
+ "SchedulerPolicy",
41
+ "register_policy",
42
+ "get_policy",
43
+ "list_policies",
44
+ # Metrics
45
+ "SchedulerMetrics",
46
+ "RequestMetadata",
19
47
  ]
@@ -0,0 +1,6 @@
1
+ """Policy package - pluggable scheduling strategies."""
2
+
3
+ from sagellm_core.engine_core.scheduler.policy.fcfs import FCFSPolicy
4
+ from sagellm_core.engine_core.scheduler.policy.priority import PriorityPolicy
5
+
6
+ __all__ = ["FCFSPolicy", "PriorityPolicy"]
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
sagellm_core/factory.pyc CHANGED
Binary file
sagellm_core/health.pyc CHANGED
Binary file
Binary file
Binary file
Binary file
@@ -0,0 +1,30 @@
1
+ """Model layers that use backend kernels.
2
+
3
+ This module provides PyTorch-style nn.Module layers that delegate
4
+ compute operations to BackendProvider kernels.
5
+
6
+ Key design:
7
+ - Layers are standard torch.nn.Module subclasses
8
+ - Forward passes use backend.get_kernel() instead of native ops
9
+ - Supports tensor parallelism via CommBackend
10
+ - Hardware-agnostic (CPU/CUDA/NPU/etc.)
11
+ """
12
+
13
+ from sagellm_core.layers.base import BaseLayer
14
+ from sagellm_core.layers.embedding import Embedding, LMHead
15
+ from sagellm_core.layers.linear import ColumnParallelLinear, LinearLayer, RowParallelLinear
16
+ from sagellm_core.layers.normalization import LayerNorm, RMSNorm
17
+ from sagellm_core.layers.activation import SiLU, SiLUAndMul
18
+
19
+ __all__ = [
20
+ "BaseLayer",
21
+ "LinearLayer",
22
+ "ColumnParallelLinear",
23
+ "RowParallelLinear",
24
+ "Embedding",
25
+ "LMHead",
26
+ "RMSNorm",
27
+ "LayerNorm",
28
+ "SiLU",
29
+ "SiLUAndMul",
30
+ ]
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file