isagellm-core 0.4.0.18__py2.py3-none-any.whl → 0.4.0.19__py2.py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- isagellm_core-0.4.0.19.dist-info/METADATA +718 -0
- isagellm_core-0.4.0.19.dist-info/RECORD +174 -0
- {isagellm_core-0.4.0.18.dist-info → isagellm_core-0.4.0.19.dist-info}/WHEEL +1 -1
- sagellm_core/__init__.py +4 -22
- sagellm_core/__init__.pyc +0 -0
- sagellm_core/__main__.pyc +0 -0
- sagellm_core/__pycache__/__init__.cpython-311.pyc +0 -0
- sagellm_core/__pycache__/config.cpython-311.pyc +0 -0
- sagellm_core/__pycache__/demo.cpython-311.pyc +0 -0
- sagellm_core/__pycache__/engine.cpython-311.pyc +0 -0
- sagellm_core/__pycache__/engine_factory.cpython-311.pyc +0 -0
- sagellm_core/__pycache__/engine_server.cpython-311.pyc +0 -0
- sagellm_core/__pycache__/factory.cpython-311.pyc +0 -0
- sagellm_core/__pycache__/health.cpython-311.pyc +0 -0
- sagellm_core/__pycache__/llm_engine.cpython-311.pyc +0 -0
- sagellm_core/__pycache__/pd_executor.cpython-311.pyc +0 -0
- sagellm_core/__pycache__/plugins.cpython-311.pyc +0 -0
- sagellm_core/__pycache__/runner.cpython-311.pyc +0 -0
- sagellm_core/__pycache__/runtime.cpython-311.pyc +0 -0
- sagellm_core/__pycache__/workload.cpython-311.pyc +0 -0
- sagellm_core/config.pyc +0 -0
- sagellm_core/decoding/__init__.pyc +0 -0
- sagellm_core/decoding/__pycache__/__init__.cpython-311.pyc +0 -0
- sagellm_core/decoding/__pycache__/base.cpython-311.pyc +0 -0
- sagellm_core/decoding/__pycache__/beam_search.cpython-311.pyc +0 -0
- sagellm_core/decoding/__pycache__/contrastive.cpython-311.pyc +0 -0
- sagellm_core/decoding/__pycache__/greedy.cpython-311.pyc +0 -0
- sagellm_core/decoding/__pycache__/sampling.cpython-311.pyc +0 -0
- sagellm_core/decoding/base.pyc +0 -0
- sagellm_core/decoding/beam_search.pyc +0 -0
- sagellm_core/decoding/contrastive.pyc +0 -0
- sagellm_core/decoding/greedy.pyc +0 -0
- sagellm_core/decoding/sampling.pyc +0 -0
- sagellm_core/demo.pyc +0 -0
- sagellm_core/distributed/__init__.pyc +0 -0
- sagellm_core/distributed/__pycache__/__init__.cpython-311.pyc +0 -0
- sagellm_core/distributed/__pycache__/strategies.cpython-311.pyc +0 -0
- sagellm_core/distributed/strategies.pyc +0 -0
- sagellm_core/engine.pyc +0 -0
- sagellm_core/engine_core/__init__.pyc +0 -0
- sagellm_core/engine_core/__pycache__/__init__.cpython-311.pyc +0 -0
- sagellm_core/engine_core/__pycache__/engine_core.cpython-311.pyc +0 -0
- sagellm_core/engine_core/engine_core.pyc +0 -0
- sagellm_core/engine_core/scheduler/__init__.py +31 -3
- sagellm_core/engine_core/scheduler/__init__.pyc +0 -0
- sagellm_core/engine_core/scheduler/__pycache__/__init__.cpython-311.pyc +0 -0
- sagellm_core/engine_core/scheduler/__pycache__/base.cpython-311.pyc +0 -0
- sagellm_core/engine_core/scheduler/__pycache__/batch.cpython-311.pyc +0 -0
- sagellm_core/engine_core/scheduler/__pycache__/metrics.cpython-311.pyc +0 -0
- sagellm_core/engine_core/scheduler/__pycache__/scheduler.cpython-311.pyc +0 -0
- sagellm_core/engine_core/scheduler/__pycache__/scheduler_kv_bridge.cpython-311.pyc +0 -0
- sagellm_core/engine_core/scheduler/base.pyc +0 -0
- sagellm_core/engine_core/scheduler/batch.pyc +0 -0
- sagellm_core/engine_core/scheduler/metrics.pyc +0 -0
- sagellm_core/engine_core/scheduler/policy/__init__.py +6 -0
- sagellm_core/engine_core/scheduler/policy/__init__.pyc +0 -0
- sagellm_core/engine_core/scheduler/policy/__pycache__/__init__.cpython-311.pyc +0 -0
- sagellm_core/engine_core/scheduler/policy/__pycache__/fcfs.cpython-311.pyc +0 -0
- sagellm_core/engine_core/scheduler/policy/__pycache__/priority.cpython-311.pyc +0 -0
- sagellm_core/engine_core/scheduler/policy/fcfs.pyc +0 -0
- sagellm_core/engine_core/scheduler/policy/priority.pyc +0 -0
- sagellm_core/engine_core/scheduler/scheduler.pyc +0 -0
- sagellm_core/engine_core/scheduler/scheduler_kv_bridge.pyc +0 -0
- sagellm_core/engine_factory.pyc +0 -0
- sagellm_core/engine_server.pyc +0 -0
- sagellm_core/engines/__init__.pyc +0 -0
- sagellm_core/engines/__pycache__/__init__.cpython-311.pyc +0 -0
- sagellm_core/engines/__pycache__/ascend.cpython-311.pyc +0 -0
- sagellm_core/engines/__pycache__/cpu.cpython-311.pyc +0 -0
- sagellm_core/engines/__pycache__/embedding.cpython-311.pyc +0 -0
- sagellm_core/engines/__pycache__/hf_cuda.cpython-311.pyc +0 -0
- sagellm_core/engines/__pycache__/pytorch.cpython-311.pyc +0 -0
- sagellm_core/engines/__pycache__/pytorch_engine.cpython-311.pyc +0 -0
- sagellm_core/engines/embedding.pyc +0 -0
- sagellm_core/executor/__init__.pyc +0 -0
- sagellm_core/executor/__pycache__/__init__.cpython-311.pyc +0 -0
- sagellm_core/executor/__pycache__/executor_base.cpython-311.pyc +0 -0
- sagellm_core/executor/__pycache__/uniproc_executor.cpython-311.pyc +0 -0
- sagellm_core/executor/executor_base.pyc +0 -0
- sagellm_core/executor/uniproc_executor.pyc +0 -0
- sagellm_core/factory.pyc +0 -0
- sagellm_core/health.pyc +0 -0
- sagellm_core/inputs/__init__.pyc +0 -0
- sagellm_core/inputs/__pycache__/__init__.cpython-311.pyc +0 -0
- sagellm_core/inputs/__pycache__/processor.cpython-311.pyc +0 -0
- sagellm_core/inputs/__pycache__/tokenizer_utils.cpython-311.pyc +0 -0
- sagellm_core/inputs/processor.pyc +0 -0
- sagellm_core/inputs/tokenizer_utils.pyc +0 -0
- sagellm_core/layers/__init__.py +30 -0
- sagellm_core/layers/__init__.pyc +0 -0
- sagellm_core/layers/__pycache__/__init__.cpython-311.pyc +0 -0
- sagellm_core/layers/__pycache__/activation.cpython-311.pyc +0 -0
- sagellm_core/layers/__pycache__/base.cpython-311.pyc +0 -0
- sagellm_core/layers/__pycache__/embedding.cpython-311.pyc +0 -0
- sagellm_core/layers/__pycache__/linear.cpython-311.pyc +0 -0
- sagellm_core/layers/__pycache__/normalization.cpython-311.pyc +0 -0
- sagellm_core/layers/activation.pyc +0 -0
- sagellm_core/layers/base.pyc +0 -0
- sagellm_core/layers/embedding.pyc +0 -0
- sagellm_core/layers/linear.pyc +0 -0
- sagellm_core/layers/normalization.pyc +0 -0
- sagellm_core/llm_engine.pyc +0 -0
- sagellm_core/model/__init__.py +131 -5
- sagellm_core/model/__init__.pyc +0 -0
- sagellm_core/model/__pycache__/__init__.cpython-311.pyc +0 -0
- sagellm_core/model/__pycache__/base.cpython-311.pyc +0 -0
- sagellm_core/model/__pycache__/factory.cpython-311.pyc +0 -0
- sagellm_core/model/__pycache__/gpt2.cpython-311.pyc +0 -0
- sagellm_core/model/__pycache__/llama.cpython-311.pyc +0 -0
- sagellm_core/model/__pycache__/mixtral.cpython-311.pyc +0 -0
- sagellm_core/model/__pycache__/model_loader.cpython-311.pyc +0 -0
- sagellm_core/model/__pycache__/quantization.cpython-311.pyc +0 -0
- sagellm_core/model/__pycache__/qwen2.cpython-311.pyc +0 -0
- sagellm_core/model/__pycache__/registry.cpython-311.pyc +0 -0
- sagellm_core/model/__pycache__/weight_utils.cpython-311.pyc +0 -0
- sagellm_core/model/base.pyc +0 -0
- sagellm_core/model/factory.pyc +0 -0
- sagellm_core/model/gpt2.pyc +0 -0
- sagellm_core/model/llama.pyc +0 -0
- sagellm_core/model/mixtral.pyc +0 -0
- sagellm_core/model/model_loader.pyc +0 -0
- sagellm_core/model/quantization.pyc +0 -0
- sagellm_core/model/qwen2.pyc +0 -0
- sagellm_core/model/registry.pyc +0 -0
- sagellm_core/model/weight_loader/__init__.py +54 -0
- sagellm_core/model/weight_loader/__init__.pyc +0 -0
- sagellm_core/model/weight_loader/__pycache__/__init__.cpython-311.pyc +0 -0
- sagellm_core/model/weight_loader/__pycache__/base.cpython-311.pyc +0 -0
- sagellm_core/model/weight_loader/__pycache__/pytorch.cpython-311.pyc +0 -0
- sagellm_core/model/weight_loader/__pycache__/quantized.cpython-311.pyc +0 -0
- sagellm_core/model/weight_loader/__pycache__/safetensors.cpython-311.pyc +0 -0
- sagellm_core/model/weight_loader/base.pyc +0 -0
- sagellm_core/model/weight_loader/pytorch.pyc +0 -0
- sagellm_core/model/weight_loader/quantized.pyc +0 -0
- sagellm_core/model/weight_loader/safetensors.pyc +0 -0
- sagellm_core/model/weight_utils.pyc +0 -0
- sagellm_core/observability/__init__.pyc +0 -0
- sagellm_core/observability/__pycache__/__init__.cpython-311.pyc +0 -0
- sagellm_core/observability/__pycache__/logger.cpython-311.pyc +0 -0
- sagellm_core/observability/__pycache__/metrics.cpython-311.pyc +0 -0
- sagellm_core/observability/logger.pyc +0 -0
- sagellm_core/observability/metrics.pyc +0 -0
- sagellm_core/pd_executor.pyc +0 -0
- sagellm_core/plugins.pyc +0 -0
- sagellm_core/runner.pyc +0 -0
- sagellm_core/runtime.pyc +0 -0
- sagellm_core/sampling/__init__.pyc +0 -0
- sagellm_core/sampling/__pycache__/__init__.cpython-311.pyc +0 -0
- sagellm_core/sampling/__pycache__/params.cpython-311.pyc +0 -0
- sagellm_core/sampling/__pycache__/sampler.cpython-311.pyc +0 -0
- sagellm_core/sampling/params.pyc +0 -0
- sagellm_core/sampling/sampler.pyc +0 -0
- sagellm_core/worker/__init__.pyc +0 -0
- sagellm_core/worker/__pycache__/__init__.cpython-311.pyc +0 -0
- sagellm_core/worker/__pycache__/worker.cpython-311.pyc +0 -0
- sagellm_core/worker/model_runner/__init__.pyc +0 -0
- sagellm_core/worker/model_runner/__pycache__/__init__.cpython-311.pyc +0 -0
- sagellm_core/worker/model_runner/__pycache__/model_runner.cpython-311.pyc +0 -0
- sagellm_core/worker/model_runner/model_runner.pyc +0 -0
- sagellm_core/worker/worker.pyc +0 -0
- sagellm_core/workload.pyc +0 -0
- isagellm_core-0.4.0.18.dist-info/METADATA +0 -308
- isagellm_core-0.4.0.18.dist-info/RECORD +0 -122
- sagellm_core/__pycache__/base_engine.cpython-311.pyc +0 -0
- sagellm_core/__pycache__/mock_engine.cpython-311.pyc +0 -0
- sagellm_core/engines/__pycache__/mock.cpython-311.pyc +0 -0
- {isagellm_core-0.4.0.18.dist-info → isagellm_core-0.4.0.19.dist-info}/entry_points.txt +0 -0
- {isagellm_core-0.4.0.18.dist-info → isagellm_core-0.4.0.19.dist-info}/top_level.txt +0 -0
|
@@ -0,0 +1,174 @@
|
|
|
1
|
+
sagellm_core/__init__.py,sha256=lXJheNgD5o1-7-EfOlGwCXs91Yomaxy4ZTNrSL7PmJ0,6355
|
|
2
|
+
sagellm_core/__init__.pyc,sha256=R60LStNbkJYjkw9Ok480ebMKjaeOBhNrpQn3Z-UQ1zM,4020
|
|
3
|
+
sagellm_core/__main__.pyc,sha256=_81UAvEI2ABP1lWBb048OKWxM4W95lobVNDFgz98wSg,384
|
|
4
|
+
sagellm_core/config.pyc,sha256=ktdBhyhAf9YrBrvCG1QziS4Y5l9YTXID79CjMtEw4Tw,8453
|
|
5
|
+
sagellm_core/demo.pyc,sha256=Lo_YBnu_k9qlC57vFwKQ2YcNNigTqLOB6-vlQB33zi0,6028
|
|
6
|
+
sagellm_core/engine.pyc,sha256=8ZhJNTvsl4BksUykALGZ8_SbUWr7UBIcd-dVzXHCW_k,12258
|
|
7
|
+
sagellm_core/engine_factory.pyc,sha256=FZoayMoeWtzvIVewzUd8EKRwOMxhkTo_w5LD7j9Ti5Q,14886
|
|
8
|
+
sagellm_core/engine_server.pyc,sha256=6566zyCwKgoTd0nLjOaA5q2EPBE6EyGU3jCkeaskHfo,19273
|
|
9
|
+
sagellm_core/factory.pyc,sha256=gu4m3nWOLPOL3Xd3q9C2X5zA_z2ggRqv5ldrSmMzqpo,2737
|
|
10
|
+
sagellm_core/health.pyc,sha256=G2MEAQSK8CC1TEuonKlAYisiYrUd1QxRC8QpiSiAiQI,684
|
|
11
|
+
sagellm_core/llm_engine.pyc,sha256=b8_1eymY_uvg9PJK97RbhjDuWn_7Y16BoGwr2MGcgNI,32483
|
|
12
|
+
sagellm_core/pd_executor.pyc,sha256=n7gvfeYAQA1PZdYCHIj90kdHUi2cPbtPMjExvBEmTHU,17970
|
|
13
|
+
sagellm_core/plugins.pyc,sha256=dpgURpeNuhdnle1Ui8xSb9kCWhdlE3BI7F3tq2_tG4U,2617
|
|
14
|
+
sagellm_core/py.typed,sha256=ixa8YukDZ3kLo0WsFJRGohLMyHzbMur1ALmmASML2cs,64
|
|
15
|
+
sagellm_core/runner.pyc,sha256=_sRztiSFepLu5Wl2DQsBNsCCtfcRC8GDZjDk2YZCTbc,14180
|
|
16
|
+
sagellm_core/runtime.pyc,sha256=SK4ZzkKQAK3efQokaIKb5ha30DZ3e42HLnhTwMJNRG0,10018
|
|
17
|
+
sagellm_core/workload.pyc,sha256=oXLJNnjbAI8oTgVFvhFzRysTno5-xabyLZiE2wVkUdQ,4127
|
|
18
|
+
sagellm_core/__pycache__/__init__.cpython-311.pyc,sha256=tLS8QIreF81JH9tkRIxARZKRwecRklEkA1-VSTw0-b0,4064
|
|
19
|
+
sagellm_core/__pycache__/config.cpython-311.pyc,sha256=4KZjBCv_6xE1yTw5rhddE1QeUdHsAOA4pjm-J3zyEx4,8497
|
|
20
|
+
sagellm_core/__pycache__/demo.cpython-311.pyc,sha256=ObO59vU-p7ryKr4B8R0dtnlJNHmQtQ80htb6DWurgpM,6072
|
|
21
|
+
sagellm_core/__pycache__/engine.cpython-311.pyc,sha256=lJG2v0M8nQiSeMhp9hJ7jTYM5_j4W1zlC2hyKbOTeFY,12302
|
|
22
|
+
sagellm_core/__pycache__/engine_factory.cpython-311.pyc,sha256=xUAN2_eFMySJT8KEaOHYFDDSpgcDUXNW581Bj5S5Jkk,14930
|
|
23
|
+
sagellm_core/__pycache__/engine_server.cpython-311.pyc,sha256=oYG5-hZKVgTpVly1T1khhX_tyIzrbF0TUTX02JwmD8s,19317
|
|
24
|
+
sagellm_core/__pycache__/factory.cpython-311.pyc,sha256=UeONZctwWSrRyIcAeR2wQWc0cGUNIgu4vYSMVdtokos,2781
|
|
25
|
+
sagellm_core/__pycache__/health.cpython-311.pyc,sha256=6v3mRLjfqNaCVb0xoyoQCzriPkDEKweV98hmKcE1A64,728
|
|
26
|
+
sagellm_core/__pycache__/llm_engine.cpython-311.pyc,sha256=K6MBHMV880RuCimXLEn_pKrKgOh1bObIgV8Bf6xRA8g,32527
|
|
27
|
+
sagellm_core/__pycache__/pd_executor.cpython-311.pyc,sha256=YuY1Y4D-2MZaz99_Id6hB67PDHyKMqujVXItaOPHiuw,18014
|
|
28
|
+
sagellm_core/__pycache__/plugins.cpython-311.pyc,sha256=n9qa5tqPUcoAOxzBIhs1JiU1-F_2hxT06yymA7RSbhM,2661
|
|
29
|
+
sagellm_core/__pycache__/runner.cpython-311.pyc,sha256=CyHAg_u0xHq3QKNxEbunK78Gd1klAYDKZlnAuscl_t8,14224
|
|
30
|
+
sagellm_core/__pycache__/runtime.cpython-311.pyc,sha256=wBRGFV3TRmtNz9nuc8IDa-E7xMgGQe6MQ3oWZH4hHRY,10062
|
|
31
|
+
sagellm_core/__pycache__/workload.cpython-311.pyc,sha256=xkb7dQAy-4soQ9KjrYLud4WGcaPKpT0gzk9Otp_A_5I,4171
|
|
32
|
+
sagellm_core/decoding/__init__.py,sha256=P9u4AgMYaPlhcgIfvT0V8JZ_51Vn58Js52QiNHfYgYE,1386
|
|
33
|
+
sagellm_core/decoding/__init__.pyc,sha256=_L9S72b85H7UVNLP5odDBhrHV20-z8SvDlde53vznUs,1837
|
|
34
|
+
sagellm_core/decoding/base.pyc,sha256=vocBsZUgYMxl9zaREJF4ETf_iSyM2bdI8WaogrUrFsg,1685
|
|
35
|
+
sagellm_core/decoding/beam_search.pyc,sha256=mRi2S8IwqAwg4K4GfvV8cRtpsEPzRfMjr2HwfeTubrc,1396
|
|
36
|
+
sagellm_core/decoding/contrastive.pyc,sha256=E3BcEZ_ZfkMCLV6KPvJj-GKmxLNTQnd5qvmx9hoAM2w,1373
|
|
37
|
+
sagellm_core/decoding/greedy.pyc,sha256=i1vUrviyddpCNPyhKR_wXhMCs8-W5KE2Z6aY2f-WV4I,1203
|
|
38
|
+
sagellm_core/decoding/sampling.pyc,sha256=rOQMdm1otppsQobImKaa4Qy52QGrgo72iRJ7NspLkZM,1712
|
|
39
|
+
sagellm_core/decoding/__pycache__/__init__.cpython-311.pyc,sha256=tMwO6gxnmWHKfziP2_XyonOqC3lE2lNFXge2SWuLDrk,1881
|
|
40
|
+
sagellm_core/decoding/__pycache__/base.cpython-311.pyc,sha256=InA-thn6n7iC5MVFgnnVndoqBBO1vAJcvaeAE9EENwo,1729
|
|
41
|
+
sagellm_core/decoding/__pycache__/beam_search.cpython-311.pyc,sha256=gj0q4Ww6fteei0tNXjaZyRSYo6E-0I9erUg9M2VTNfo,1440
|
|
42
|
+
sagellm_core/decoding/__pycache__/contrastive.cpython-311.pyc,sha256=cC2XMgtpt6idxhLUjvawQl9RuTa6Ik_efywf-dsfF20,1417
|
|
43
|
+
sagellm_core/decoding/__pycache__/greedy.cpython-311.pyc,sha256=pHAZg7gRPq2rrv2J_NGONeIvkGE08gvb2jTEzafxBPc,1247
|
|
44
|
+
sagellm_core/decoding/__pycache__/sampling.cpython-311.pyc,sha256=hx9rkhbkPUnoUU_i_cIRgoe7RbR5y4nP9mM044in_Og,1756
|
|
45
|
+
sagellm_core/distributed/__init__.py,sha256=8WTrKkZmYGrV7pj3L083496LskHAv3BOULEIZflgBTc,328
|
|
46
|
+
sagellm_core/distributed/__init__.pyc,sha256=AO5IqU7iT0QdxM-aM5Qto4x3J0ZUTG3pkAlHbCobIy8,498
|
|
47
|
+
sagellm_core/distributed/strategies.pyc,sha256=J2S7SkIt9MStA5hgm1zOLe4hm5RIO8eFAIKzd1vXLFY,6061
|
|
48
|
+
sagellm_core/distributed/__pycache__/__init__.cpython-311.pyc,sha256=Q1D9T2ERrFnXz8GnW0qjPGwP_vAVkSJTMvBwN8Szcn8,542
|
|
49
|
+
sagellm_core/distributed/__pycache__/strategies.cpython-311.pyc,sha256=oVq8fDQ7qMBtDFD1U5qF4gyndHifmqnwXVlShLf4P4Q,6105
|
|
50
|
+
sagellm_core/engine_core/__init__.py,sha256=wG6ONHCRWk4ScU6WwW8f-qL3xITF5OcqbxBHGKAAwd4,314
|
|
51
|
+
sagellm_core/engine_core/__init__.pyc,sha256=evEMExxwDoRFpVkyAGhlaqxeHQP4XFgMHsIYniaTUCI,502
|
|
52
|
+
sagellm_core/engine_core/engine_core.pyc,sha256=tVKyU4xLpy4WX0na6Fa_sCjVGUY7e686XXd9edCidCM,8790
|
|
53
|
+
sagellm_core/engine_core/__pycache__/__init__.cpython-311.pyc,sha256=WtEUv3r0QBw1Jop1bsxnAPDpsmyG_54zANlLh5MERW4,546
|
|
54
|
+
sagellm_core/engine_core/__pycache__/engine_core.cpython-311.pyc,sha256=_KFHXAO7X2qvSWCsHfGgDpJ_JQqkZw9vR0otvc2tKZs,8834
|
|
55
|
+
sagellm_core/engine_core/scheduler/__init__.py,sha256=QJ2cRDyc7U-WHQIX2dLtlalrYXS4-6ZSSEG5sY9r2OQ,1390
|
|
56
|
+
sagellm_core/engine_core/scheduler/__init__.pyc,sha256=JAYSwGjf9J1x-y0iaJ9_IDMU5R4oCktUPIC8-l7SXmg,1553
|
|
57
|
+
sagellm_core/engine_core/scheduler/base.pyc,sha256=4aoA1G8cPpEgZq4KpC__Kz2M3rvmYm9vdpmWmFMe-RY,5778
|
|
58
|
+
sagellm_core/engine_core/scheduler/batch.pyc,sha256=8agGr53XfgF71l35hHC8pIN5sOJBmAEf7QFjQeIDtx4,3856
|
|
59
|
+
sagellm_core/engine_core/scheduler/metrics.pyc,sha256=z3-EZnTMeJa_mCWvtnt710l82EyNEBAnlEodV_8NVNM,6183
|
|
60
|
+
sagellm_core/engine_core/scheduler/scheduler.pyc,sha256=CJFop1Y12B856BffdTLgqaFq-Mx-fVftNWVURO3cS7g,27116
|
|
61
|
+
sagellm_core/engine_core/scheduler/scheduler_kv_bridge.pyc,sha256=KU-JJaBV5I5jz5pE6INP13m_QZK-sn-bxiCuTlQakvw,12194
|
|
62
|
+
sagellm_core/engine_core/scheduler/__pycache__/__init__.cpython-311.pyc,sha256=3L57db_9-YkfCj1FBpKwwqBzuz1qiXWYo23HLVDqU_8,1597
|
|
63
|
+
sagellm_core/engine_core/scheduler/__pycache__/base.cpython-311.pyc,sha256=PGXAM6ujO8bGLK00YbD1sxMB1i8y2-IQ6eQtyCZ49S8,5822
|
|
64
|
+
sagellm_core/engine_core/scheduler/__pycache__/batch.cpython-311.pyc,sha256=AS5jLQeyh57kRMaDpyKgjf4_A0SiLWRHuOdbrT0unNY,3900
|
|
65
|
+
sagellm_core/engine_core/scheduler/__pycache__/metrics.cpython-311.pyc,sha256=4g_HimozpwLEraPEkY4F64CGxSoIOT08P1FI3f-kALk,6227
|
|
66
|
+
sagellm_core/engine_core/scheduler/__pycache__/scheduler.cpython-311.pyc,sha256=TCXzNw-VcLgFw2QZ9onEhxUPfGT3QV-kArjcBKr2vVo,27160
|
|
67
|
+
sagellm_core/engine_core/scheduler/__pycache__/scheduler_kv_bridge.cpython-311.pyc,sha256=ajexkkJfgwghsAcbdRcZLd_gH_HOvo2f2_Z4SNeuHg0,12238
|
|
68
|
+
sagellm_core/engine_core/scheduler/policy/__init__.py,sha256=d5w_189s0cd8fAmCRSzz1rTpYPZab3AFFwpW3Id1LTo,249
|
|
69
|
+
sagellm_core/engine_core/scheduler/policy/__init__.pyc,sha256=J83Agt3POsKXp7-xSyFNRoscOxUYwiukxEHQr-EKUyI,468
|
|
70
|
+
sagellm_core/engine_core/scheduler/policy/fcfs.pyc,sha256=sVyTOrmwOmi5q7XL3exOMk0qEPMvv5pjrigQ7zgX2Ys,6670
|
|
71
|
+
sagellm_core/engine_core/scheduler/policy/priority.pyc,sha256=fuT9NrJv3Bqufnzqz1QC-TR5pinVsRK0fDB8g8yp1VI,6813
|
|
72
|
+
sagellm_core/engine_core/scheduler/policy/__pycache__/__init__.cpython-311.pyc,sha256=bhiMfXveF2TZEfkBYozPDOA0IMgTRYD2OU8NHxJvfpo,512
|
|
73
|
+
sagellm_core/engine_core/scheduler/policy/__pycache__/fcfs.cpython-311.pyc,sha256=Nth8zT4rSCRFSJOg4fs2xGwWN_AJElogaG0L9NDIPso,6714
|
|
74
|
+
sagellm_core/engine_core/scheduler/policy/__pycache__/priority.cpython-311.pyc,sha256=ZlYzaSnSnJgCunFmQpJt7pBMOljvXdpDJlTpI3wmcbI,6857
|
|
75
|
+
sagellm_core/engines/__init__.py,sha256=eRxLCXebcl0DqhMh4J3yPcpmoSMtZzjWjCXNku0hcek,865
|
|
76
|
+
sagellm_core/engines/__init__.pyc,sha256=IvYGoZ-rasQT93EADKUxskfHjhW7hLTaMsaxf9hvmwQ,934
|
|
77
|
+
sagellm_core/engines/embedding.pyc,sha256=vj07-CNm1zrlmDo7RpcX3h43AWTP-r7qF1UIVWpNEdw,12189
|
|
78
|
+
sagellm_core/engines/__pycache__/__init__.cpython-311.pyc,sha256=EXx-tB8C1aUA1DVez3F2GRvtBzj8Qizhuf2wM5541Is,978
|
|
79
|
+
sagellm_core/engines/__pycache__/ascend.cpython-311.pyc,sha256=rBTOaG6tOcFm0ZjBP701UTLQudW7OdroTfycR-BfyhI,17307
|
|
80
|
+
sagellm_core/engines/__pycache__/cpu.cpython-311.pyc,sha256=g9GrBDXtdmJMf9LKK4NWYdLW1N-yb6HThRMp5tfH9Jg,29330
|
|
81
|
+
sagellm_core/engines/__pycache__/embedding.cpython-311.pyc,sha256=iYhVvD8JBZcSp4xrNYEo-f4YfaAkZxLrQ-fhtHL6xno,12233
|
|
82
|
+
sagellm_core/engines/__pycache__/hf_cuda.cpython-311.pyc,sha256=sIXd-cq2T__5B2uYUz3u_Fdb46EXSHSBq6LWcVGIbO0,61147
|
|
83
|
+
sagellm_core/engines/__pycache__/pytorch.cpython-311.pyc,sha256=Grw94kmuWI3YJiElmxDvzyM-zyV-H-o3xRtIqtODUnA,18452
|
|
84
|
+
sagellm_core/engines/__pycache__/pytorch_engine.cpython-311.pyc,sha256=TrwvIobQZWMPGW4GAN8H5hkydR1E3_az0fZojU5_EjM,15644
|
|
85
|
+
sagellm_core/executor/__init__.py,sha256=Acm1uxVigM823XnTaJ2UC_mSgTIlvtHb6uX076tMSN0,507
|
|
86
|
+
sagellm_core/executor/__init__.pyc,sha256=khWBYZiUBe87zjIB4H72DvD7kU1jXD1REmfnpEi-bZI,705
|
|
87
|
+
sagellm_core/executor/executor_base.pyc,sha256=J10pQgxDt_dYRJUIS7ht46fETgPR1S3NpgTrTdJA-aQ,4759
|
|
88
|
+
sagellm_core/executor/uniproc_executor.pyc,sha256=sQ4mFn2K6cNo6yDs308A1Bvi5qzK5omb6WvljF793j8,4940
|
|
89
|
+
sagellm_core/executor/__pycache__/__init__.cpython-311.pyc,sha256=LoHU2Z7wWw4Lvss8iiLVgTZWe35-b7SXXblwzyY5mB0,749
|
|
90
|
+
sagellm_core/executor/__pycache__/executor_base.cpython-311.pyc,sha256=-9h0dT5Bwra6VWjhsr3vKYCIn5ZM-HohzmNk7JeJQNU,4803
|
|
91
|
+
sagellm_core/executor/__pycache__/uniproc_executor.cpython-311.pyc,sha256=kJ6tDBq5yh1cmBAUPTX1lbByuhUQjUmOfL4l7FvG9WQ,4984
|
|
92
|
+
sagellm_core/inputs/__init__.py,sha256=t_DP0n7Cx-L9BiniDcKHBcg6IK6EVCs8J7GRbAwPbLk,301
|
|
93
|
+
sagellm_core/inputs/__init__.pyc,sha256=ocGa1p3NXflh1TXdOljNxry1PCd9msOO2FCg3Uzy2TU,513
|
|
94
|
+
sagellm_core/inputs/processor.pyc,sha256=y95MlzBEeZO1U_oNDNtCDPuhRGP0INbKEONnL-xVUPQ,3641
|
|
95
|
+
sagellm_core/inputs/tokenizer_utils.pyc,sha256=acCTNBubOb5NnC3oq7GhUNzI1ijM5FMTVqWkjzpxmY8,2871
|
|
96
|
+
sagellm_core/inputs/__pycache__/__init__.cpython-311.pyc,sha256=Sw3jm2TybH0c1wcxIZcztl1v-FpmvxffvKuH6dxPH5A,557
|
|
97
|
+
sagellm_core/inputs/__pycache__/processor.cpython-311.pyc,sha256=VCCNAVklX7UM4rwpHQOM_YRa2UIN7NbQarz0b42ZvZU,3685
|
|
98
|
+
sagellm_core/inputs/__pycache__/tokenizer_utils.cpython-311.pyc,sha256=yyyO--2Z9Dj-0iI95bdgfBP3TvIQ6RRNJ5wY1NB9ibU,2915
|
|
99
|
+
sagellm_core/layers/__init__.py,sha256=3Qis9XQHijuy-3k7ByX-ehUoO016EkcBXtEgCYJ5Wvo,894
|
|
100
|
+
sagellm_core/layers/__init__.pyc,sha256=PY9yzqCUnLbU3Jz4zvJvKopVTnuzuCTpr6f9FUdDLIY,1151
|
|
101
|
+
sagellm_core/layers/activation.pyc,sha256=ARmpihbwjqa6YioXajFXpeDPAfZUtGalXQuUQtuhgNQ,3998
|
|
102
|
+
sagellm_core/layers/base.pyc,sha256=IcmttxQtodOjEACkkp1CU6vNeWdAXS3bW95dLjtwWUk,3114
|
|
103
|
+
sagellm_core/layers/embedding.pyc,sha256=9hleCHHWfxMfwMfcHyFwBON3OUROAoctKd_82L8RaPQ,6610
|
|
104
|
+
sagellm_core/layers/linear.pyc,sha256=qLUYMsiosQasdK8aIsRNtqgIL27f3f0npW4lc83wv-s,10855
|
|
105
|
+
sagellm_core/layers/normalization.pyc,sha256=JVvKoFuTBmxNJ8cYZXohZpvwBuvunsc004Aw_CJ1DOA,5757
|
|
106
|
+
sagellm_core/layers/__pycache__/__init__.cpython-311.pyc,sha256=2ZEXCsw_KolZ6hrEXHwSUz0kNHzlNa1ELXLq16KQnrY,1195
|
|
107
|
+
sagellm_core/layers/__pycache__/activation.cpython-311.pyc,sha256=u3ic6THNcazgquywM5TgpZi9aRWUYJPxbdpYNrmyDcA,4042
|
|
108
|
+
sagellm_core/layers/__pycache__/base.cpython-311.pyc,sha256=nG8GybGx1xohSyJD6U9PK8Bk3bOvGMG8iba7YTrLEqI,3158
|
|
109
|
+
sagellm_core/layers/__pycache__/embedding.cpython-311.pyc,sha256=Ekfi0ERpqbKgmuRnACQ1WJUEj66QldemjSaiX172M-Q,6654
|
|
110
|
+
sagellm_core/layers/__pycache__/linear.cpython-311.pyc,sha256=UnMeRZhlG4gpFa_CIU0l1SE4eH5BFE0Hme1_DO9EY2Q,10899
|
|
111
|
+
sagellm_core/layers/__pycache__/normalization.cpython-311.pyc,sha256=hUhYUYUTHIVhm6BpZ3_33kZqcf743Ej8BTDUynjg5mE,5801
|
|
112
|
+
sagellm_core/model/__init__.py,sha256=P2yGYFm7AfE9jKtCusNOiAOPFw9fGZTqfyuz1cOYxqo,3452
|
|
113
|
+
sagellm_core/model/__init__.pyc,sha256=ZZ7JTzSp5_WTW3wiyBAWGRKVXsScNf6r5LI8Is6dFX4,3370
|
|
114
|
+
sagellm_core/model/base.pyc,sha256=r-DpzMx9nUYgFSl2GS0zk7R9offTEUXAf6y656xWYk0,8218
|
|
115
|
+
sagellm_core/model/factory.pyc,sha256=IYCm18ytcZPhO0lP4unH9feZUJGTMWCyPh6e9kVD8BE,9399
|
|
116
|
+
sagellm_core/model/gpt2.pyc,sha256=ePTJVNy14Pl0L44WwG5KWZj_u2MMFrz-tq8Wg_SqZMQ,9993
|
|
117
|
+
sagellm_core/model/llama.pyc,sha256=HHQ8hRa4HLQ_poOl382TEP9IgAE1OUhpHTma1tor4yM,24446
|
|
118
|
+
sagellm_core/model/mixtral.pyc,sha256=dOD5Y_zqn2y2pJlaQ4dw0-ZNg6QTb4XiuSSQoUrRVls,15955
|
|
119
|
+
sagellm_core/model/model_loader.pyc,sha256=WN2g_XenQTLKSngxkNSTxBIttBwK93yXTnyJe6hd-r8,5822
|
|
120
|
+
sagellm_core/model/quantization.pyc,sha256=kPCBC3zCYnxqyrVYiuSuaewsgmvZcuhtJWZNwE0lsKk,5478
|
|
121
|
+
sagellm_core/model/qwen2.pyc,sha256=9AxgiLbzp_tu8beLTLRQwn1YK7UOVKhCDbAH4ES1-Ak,17885
|
|
122
|
+
sagellm_core/model/registry.pyc,sha256=DVOsvbPosGiMQAk45UvWpqbCaRzxrP2f8W2F4SJ0uAM,5334
|
|
123
|
+
sagellm_core/model/weight_utils.pyc,sha256=mwBOldZZjyhpld__gZ651cHJYHgVhiYKQmXEFoB_3gM,1830
|
|
124
|
+
sagellm_core/model/__pycache__/__init__.cpython-311.pyc,sha256=UfGaLmaK5sFurKzGQs7Rv0nfBmz4yQ_G8vETIQl_Ibo,3414
|
|
125
|
+
sagellm_core/model/__pycache__/base.cpython-311.pyc,sha256=2xTfORrmZ61p7Nca_7QMGc4ZxOiswzpMlQ0thgArkBI,8262
|
|
126
|
+
sagellm_core/model/__pycache__/factory.cpython-311.pyc,sha256=wI8swBf0Tc5s8uq48jK23J0o3s9-u2et--IvbAnEN_A,9443
|
|
127
|
+
sagellm_core/model/__pycache__/gpt2.cpython-311.pyc,sha256=IL_inxu83zASGeo33Bp0L5xgCbooj7OnEcj7CgMI2Gs,10037
|
|
128
|
+
sagellm_core/model/__pycache__/llama.cpython-311.pyc,sha256=MQxAWSnOc3zifbPsS3D_L0BYM99-wkuxo6fGHG7dqc0,24490
|
|
129
|
+
sagellm_core/model/__pycache__/mixtral.cpython-311.pyc,sha256=K7H-DEg6Nk4ra_tnHQJs-qwoj7mv4Ow1luQIGkIX4UE,15999
|
|
130
|
+
sagellm_core/model/__pycache__/model_loader.cpython-311.pyc,sha256=QPEOn7LbYCHvj-G-3cSsrKnPtTcx-p_dC9tTILP91cA,5866
|
|
131
|
+
sagellm_core/model/__pycache__/quantization.cpython-311.pyc,sha256=96E_bn7CRIDDswyrAGn8EgipcSBC51Oc02-IL7hqCo4,5522
|
|
132
|
+
sagellm_core/model/__pycache__/qwen2.cpython-311.pyc,sha256=rlXcbdEemEj3OvQJv9iqLEv_npy_K-jirUgP_8erzN4,17929
|
|
133
|
+
sagellm_core/model/__pycache__/registry.cpython-311.pyc,sha256=tM5qGpTDp2RBrEO-b5eEeTqkQHDIcfFMPOGo-hpDoRg,5378
|
|
134
|
+
sagellm_core/model/__pycache__/weight_utils.cpython-311.pyc,sha256=a0Wv5tKBy9n2YNGPrkmSBSV8BGa7rOzNJnjbxEvWoIU,1874
|
|
135
|
+
sagellm_core/model/weight_loader/__init__.py,sha256=hKYqGfvGcZ_o9VS6GTBP_IHuN39qikPzRGo5Yu-uTec,1474
|
|
136
|
+
sagellm_core/model/weight_loader/__init__.pyc,sha256=xTGuqPCTmVrk63JYimNGCUUYb18SRCidmIp3IwAlTrw,1521
|
|
137
|
+
sagellm_core/model/weight_loader/base.pyc,sha256=ccL1XcOpKdYFDx9iPdEA0KlYD0rtiXmcY7SOYfRltYs,12850
|
|
138
|
+
sagellm_core/model/weight_loader/pytorch.pyc,sha256=_Jl5oVFOTx2snRWJLNcLyaNk7x40Yg5Kk3ZDbvxWohA,6945
|
|
139
|
+
sagellm_core/model/weight_loader/quantized.pyc,sha256=ahsXyYEVz8n4C_3NJcC8RLxbTKVGu9Q12SlLl4_BwtM,14090
|
|
140
|
+
sagellm_core/model/weight_loader/safetensors.pyc,sha256=_13Tblgcmaz3gSJdlXLG9krcwIDFTkz3lb5QDCYsdq4,8911
|
|
141
|
+
sagellm_core/model/weight_loader/__pycache__/__init__.cpython-311.pyc,sha256=vzcetCFSikIqw9q5J-59FSfMvVjmMG9t-w3KU9CGl6E,1565
|
|
142
|
+
sagellm_core/model/weight_loader/__pycache__/base.cpython-311.pyc,sha256=1atSyz848y72l7qfbvSgVTU1HPCv5I1Vlc5pdFtMHTA,12894
|
|
143
|
+
sagellm_core/model/weight_loader/__pycache__/pytorch.cpython-311.pyc,sha256=QDOq4W0KQlIS4_DB76SHZakAVBrPIoQfbP6tBghdccQ,6989
|
|
144
|
+
sagellm_core/model/weight_loader/__pycache__/quantized.cpython-311.pyc,sha256=_iDAjyuSyc1r7McM35_SdpOoeOE7I-l1o-aSw_KTJmY,14134
|
|
145
|
+
sagellm_core/model/weight_loader/__pycache__/safetensors.cpython-311.pyc,sha256=zAET47I4KzgIhYgsfRE1RguvgaLSqz-OnDoAx3RPgL0,8955
|
|
146
|
+
sagellm_core/observability/__init__.py,sha256=lT3qt-69vwH3KlxqN0H_hjknmaXl8Yx2Q3PrWifNvd8,378
|
|
147
|
+
sagellm_core/observability/__init__.pyc,sha256=AgMxpuktnXApjcskYhtZu9txYykL0zA5pxA88GFdyZ4,608
|
|
148
|
+
sagellm_core/observability/logger.pyc,sha256=L4plrgadkvv45aDqMkKoj49NESFixBb_Ul1dVqu1PSQ,1910
|
|
149
|
+
sagellm_core/observability/metrics.pyc,sha256=BPH0Cs4BozpOGEzqzQJ8WpG_uSrWMj_p2ZpfoYPiTqA,6314
|
|
150
|
+
sagellm_core/observability/__pycache__/__init__.cpython-311.pyc,sha256=uAvN7NoVbwrmGEv9Y-9jFEfvLyuVFxS5dw9KW3S3NnQ,652
|
|
151
|
+
sagellm_core/observability/__pycache__/logger.cpython-311.pyc,sha256=PGUrMdntSbemDjZ4bBvbE6T5T0ayRc9u_6EwlVPai8c,1954
|
|
152
|
+
sagellm_core/observability/__pycache__/metrics.cpython-311.pyc,sha256=1fDSo9sL5Lu7Ft9NnpBcaWL4e04xdN8ypfBNNofwmBY,6358
|
|
153
|
+
sagellm_core/sampling/__init__.py,sha256=H8b1UnwiYfMP2rODrjDJXvoI8fRTyfCoDImHRstIDGg,330
|
|
154
|
+
sagellm_core/sampling/__init__.pyc,sha256=SNCG-L_cGlWWNFtcRIgd5PkjPCRbcxMaCA4y7ROMfYQ,556
|
|
155
|
+
sagellm_core/sampling/params.pyc,sha256=y_RtIZycw1hL__9beE1kPsfHUYf9r_bnh3K8w33Pr5s,3391
|
|
156
|
+
sagellm_core/sampling/sampler.pyc,sha256=Q9IgFuLffD_auKmaxqkSpOvHox_1jO0vMxn9rJwhDos,6721
|
|
157
|
+
sagellm_core/sampling/__pycache__/__init__.cpython-311.pyc,sha256=X_CSHSW5HfR5cF6XT_QjePpVL0yNXvApBerCQ_FD2Jc,600
|
|
158
|
+
sagellm_core/sampling/__pycache__/params.cpython-311.pyc,sha256=OWmwd4OPH7fvtPXu52OG6EwxreoIdXG0TnSVhSkoG0k,3435
|
|
159
|
+
sagellm_core/sampling/__pycache__/sampler.cpython-311.pyc,sha256=P8WXBrbB7mPizwNDxKJmlrO2gzLUCSFhZsZsHt0v1aA,6765
|
|
160
|
+
sagellm_core/worker/__init__.py,sha256=isHAvgRYHX_HBRQsJtB72ziV4xeSDyjR1xFH3h_HEHQ,258
|
|
161
|
+
sagellm_core/worker/__init__.pyc,sha256=BDzN0RkdOZUdff5r5sgymVbDzH47QDBqZW8VHzWSNMw,445
|
|
162
|
+
sagellm_core/worker/worker.pyc,sha256=gOZqeyw33WGypXtk5yq5wkRVyZ_wZjem6_GrmhJEe2k,4772
|
|
163
|
+
sagellm_core/worker/__pycache__/__init__.cpython-311.pyc,sha256=82GLZqYvY4lOSFPyl4ZJd12Az0xB1YIbtvIxo2q1bOI,489
|
|
164
|
+
sagellm_core/worker/__pycache__/worker.cpython-311.pyc,sha256=j-Bly_YPvAlXoLcAZsFYMM9vO4EQFOcgxLylaYp44l4,4816
|
|
165
|
+
sagellm_core/worker/model_runner/__init__.py,sha256=w4cq2JoxfHYNUQI3jXO-XhFCoYxNg6YHkioK-S3Ayro,246
|
|
166
|
+
sagellm_core/worker/model_runner/__init__.pyc,sha256=56vUUVM9SnXbQLa2o34DSrmwgCIsygG5dRILepb9CFA,447
|
|
167
|
+
sagellm_core/worker/model_runner/model_runner.pyc,sha256=YfoP-CAE7wz5XQojKlJyb4vXmSpjzhW-z8OKBxZBndE,17056
|
|
168
|
+
sagellm_core/worker/model_runner/__pycache__/__init__.cpython-311.pyc,sha256=SBuQvwarzMcetpu5Cda0yrjgPXxobuCs5TlbC-K1jP0,491
|
|
169
|
+
sagellm_core/worker/model_runner/__pycache__/model_runner.cpython-311.pyc,sha256=Y7oUKzfUdvFCWQwyfQf1TAUWLoLtwE6dy_GJqsG1X9c,17100
|
|
170
|
+
isagellm_core-0.4.0.19.dist-info/METADATA,sha256=u3G4oNtrSRM8WElqF1wR_REm_hq2J2wBjcqdjNBikr8,22827
|
|
171
|
+
isagellm_core-0.4.0.19.dist-info/WHEEL,sha256=JNWh1Fm1UdwIQV075glCn4MVuCRs0sotJIq-J6rbxCU,109
|
|
172
|
+
isagellm_core-0.4.0.19.dist-info/entry_points.txt,sha256=w0kgbHe7jVNOuy785wFMEBwqoZUnfU24HCImsQII3y0,64
|
|
173
|
+
isagellm_core-0.4.0.19.dist-info/top_level.txt,sha256=wcgdWrvkaoYYh_dWSFI5Toi8PZsHutVqfhTB2tb0K6g,13
|
|
174
|
+
isagellm_core-0.4.0.19.dist-info/RECORD,,
|
sagellm_core/__init__.py
CHANGED
|
@@ -26,7 +26,7 @@ Architecture (vLLM v1 style):
|
|
|
26
26
|
|
|
27
27
|
from __future__ import annotations
|
|
28
28
|
|
|
29
|
-
__version__ = "0.4.0.
|
|
29
|
+
__version__ = "0.4.0.19"
|
|
30
30
|
|
|
31
31
|
# ============================================================================
|
|
32
32
|
# New Architecture (vLLM v1 style) - Hardware Agnostic
|
|
@@ -47,7 +47,8 @@ from sagellm_core.worker.model_runner import ModelRunner
|
|
|
47
47
|
# ============================================================================
|
|
48
48
|
# Legacy Architecture (still supported, being refactored)
|
|
49
49
|
# ============================================================================
|
|
50
|
-
|
|
50
|
+
# NOTE: BaseEngine and EngineFactory have been removed (issue #24).
|
|
51
|
+
# Use LLMEngine instead - the unified hardware-agnostic engine.
|
|
51
52
|
from sagellm_core.config import (
|
|
52
53
|
BackendConfig,
|
|
53
54
|
DemoConfig,
|
|
@@ -58,14 +59,6 @@ from sagellm_core.config import (
|
|
|
58
59
|
load_config,
|
|
59
60
|
)
|
|
60
61
|
from sagellm_core.demo import main as demo_main
|
|
61
|
-
from sagellm_core.engine_factory import EngineFactory
|
|
62
|
-
|
|
63
|
-
# Only EmbeddingEngine remains from legacy engines
|
|
64
|
-
from sagellm_core.engines import (
|
|
65
|
-
EmbeddingEngine,
|
|
66
|
-
EmbeddingEngineConfig,
|
|
67
|
-
)
|
|
68
|
-
from sagellm_core.factory import create_backend, create_engine
|
|
69
62
|
from sagellm_core.health import HealthStatus
|
|
70
63
|
from sagellm_core.plugins import PluginResolutionError, list_entry_points, resolve_kind
|
|
71
64
|
from sagellm_core.runner import DemoRunner, RunnerContext
|
|
@@ -159,19 +152,8 @@ __all__ = [
|
|
|
159
152
|
"WorkloadConfig",
|
|
160
153
|
"WorkloadSegment",
|
|
161
154
|
"load_config",
|
|
162
|
-
#
|
|
163
|
-
"BaseEngine",
|
|
164
|
-
"EngineInstanceConfig", # For runtime engine instantiation
|
|
155
|
+
# Health status
|
|
165
156
|
"HealthStatus",
|
|
166
|
-
# Engine implementations
|
|
167
|
-
# DEPRECATED: Old engines removed, use LLMEngine instead
|
|
168
|
-
# Only EmbeddingEngine remains for embedding-only use cases
|
|
169
|
-
"EmbeddingEngine",
|
|
170
|
-
"EmbeddingEngineConfig",
|
|
171
|
-
# Factory functions
|
|
172
|
-
"create_backend",
|
|
173
|
-
"create_engine",
|
|
174
|
-
"EngineFactory",
|
|
175
157
|
# Plugin system
|
|
176
158
|
"PluginResolutionError",
|
|
177
159
|
"list_entry_points",
|
sagellm_core/__init__.pyc
CHANGED
|
Binary file
|
sagellm_core/__main__.pyc
CHANGED
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
sagellm_core/config.pyc
CHANGED
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
sagellm_core/decoding/base.pyc
CHANGED
|
Binary file
|
|
Binary file
|
|
Binary file
|
sagellm_core/decoding/greedy.pyc
CHANGED
|
Binary file
|
|
Binary file
|
sagellm_core/demo.pyc
CHANGED
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
sagellm_core/engine.pyc
CHANGED
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
@@ -1,19 +1,47 @@
|
|
|
1
1
|
"""Scheduler - Request scheduling for Continuous Batching.
|
|
2
2
|
|
|
3
3
|
The Scheduler is responsible for:
|
|
4
|
-
1. Selecting which requests to run in the next step
|
|
5
|
-
2. Managing
|
|
6
|
-
3.
|
|
4
|
+
1. Selecting which requests to run in the next step (via pluggable policies)
|
|
5
|
+
2. Managing KV cache allocation (via SchedulerKVBridge)
|
|
6
|
+
3. Separating prefill vs decode batches
|
|
7
|
+
4. Preemption decisions (future)
|
|
8
|
+
|
|
9
|
+
Key Components:
|
|
10
|
+
- ContinuousBatchingScheduler: Main scheduler class
|
|
11
|
+
- SchedulerKVBridge: Thin wrapper around sagellm-kv-cache
|
|
12
|
+
- SchedulerPolicy: Pluggable admission control (FCFS, Priority, etc.)
|
|
13
|
+
- Batch: Prefill or decode batch with block_tables
|
|
7
14
|
"""
|
|
8
15
|
|
|
16
|
+
from sagellm_core.engine_core.scheduler.base import (
|
|
17
|
+
SchedulerPolicy,
|
|
18
|
+
get_policy,
|
|
19
|
+
list_policies,
|
|
20
|
+
register_policy,
|
|
21
|
+
)
|
|
22
|
+
from sagellm_core.engine_core.scheduler.batch import Batch
|
|
23
|
+
from sagellm_core.engine_core.scheduler.metrics import RequestMetadata, SchedulerMetrics
|
|
9
24
|
from sagellm_core.engine_core.scheduler.scheduler import (
|
|
10
25
|
ContinuousBatchingScheduler,
|
|
11
26
|
SchedulerConfig,
|
|
12
27
|
SchedulerOutput,
|
|
13
28
|
)
|
|
29
|
+
from sagellm_core.engine_core.scheduler.scheduler_kv_bridge import SchedulerKVBridge
|
|
14
30
|
|
|
15
31
|
__all__ = [
|
|
32
|
+
# Main classes
|
|
16
33
|
"ContinuousBatchingScheduler",
|
|
17
34
|
"SchedulerConfig",
|
|
18
35
|
"SchedulerOutput",
|
|
36
|
+
"Batch",
|
|
37
|
+
# KV bridge
|
|
38
|
+
"SchedulerKVBridge",
|
|
39
|
+
# Policy system
|
|
40
|
+
"SchedulerPolicy",
|
|
41
|
+
"register_policy",
|
|
42
|
+
"get_policy",
|
|
43
|
+
"list_policies",
|
|
44
|
+
# Metrics
|
|
45
|
+
"SchedulerMetrics",
|
|
46
|
+
"RequestMetadata",
|
|
19
47
|
]
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
sagellm_core/engine_factory.pyc
CHANGED
|
Binary file
|
sagellm_core/engine_server.pyc
CHANGED
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
sagellm_core/factory.pyc
CHANGED
|
Binary file
|
sagellm_core/health.pyc
CHANGED
|
Binary file
|
sagellm_core/inputs/__init__.pyc
CHANGED
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
@@ -0,0 +1,30 @@
|
|
|
1
|
+
"""Model layers that use backend kernels.
|
|
2
|
+
|
|
3
|
+
This module provides PyTorch-style nn.Module layers that delegate
|
|
4
|
+
compute operations to BackendProvider kernels.
|
|
5
|
+
|
|
6
|
+
Key design:
|
|
7
|
+
- Layers are standard torch.nn.Module subclasses
|
|
8
|
+
- Forward passes use backend.get_kernel() instead of native ops
|
|
9
|
+
- Supports tensor parallelism via CommBackend
|
|
10
|
+
- Hardware-agnostic (CPU/CUDA/NPU/etc.)
|
|
11
|
+
"""
|
|
12
|
+
|
|
13
|
+
from sagellm_core.layers.base import BaseLayer
|
|
14
|
+
from sagellm_core.layers.embedding import Embedding, LMHead
|
|
15
|
+
from sagellm_core.layers.linear import ColumnParallelLinear, LinearLayer, RowParallelLinear
|
|
16
|
+
from sagellm_core.layers.normalization import LayerNorm, RMSNorm
|
|
17
|
+
from sagellm_core.layers.activation import SiLU, SiLUAndMul
|
|
18
|
+
|
|
19
|
+
__all__ = [
|
|
20
|
+
"BaseLayer",
|
|
21
|
+
"LinearLayer",
|
|
22
|
+
"ColumnParallelLinear",
|
|
23
|
+
"RowParallelLinear",
|
|
24
|
+
"Embedding",
|
|
25
|
+
"LMHead",
|
|
26
|
+
"RMSNorm",
|
|
27
|
+
"LayerNorm",
|
|
28
|
+
"SiLU",
|
|
29
|
+
"SiLUAndMul",
|
|
30
|
+
]
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
|
Binary file
|
sagellm_core/llm_engine.pyc
CHANGED
|
Binary file
|