sglang 0.5.4__py3-none-any.whl → 0.5.4.post1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (88) hide show
  1. sglang/bench_serving.py +56 -12
  2. sglang/launch_server.py +2 -0
  3. sglang/srt/batch_invariant_ops/batch_invariant_ops.py +101 -4
  4. sglang/srt/compilation/backend.py +1 -1
  5. sglang/srt/configs/model_config.py +5 -5
  6. sglang/srt/distributed/parallel_state.py +0 -7
  7. sglang/srt/entrypoints/engine.py +18 -15
  8. sglang/srt/entrypoints/grpc_server.py +0 -1
  9. sglang/srt/entrypoints/http_server.py +75 -94
  10. sglang/srt/environ.py +16 -2
  11. sglang/srt/eplb/expert_distribution.py +30 -0
  12. sglang/srt/function_call/function_call_parser.py +2 -0
  13. sglang/srt/function_call/minimax_m2.py +367 -0
  14. sglang/srt/layers/activation.py +6 -0
  15. sglang/srt/layers/attention/flashattention_backend.py +12 -2
  16. sglang/srt/layers/attention/flashinfer_backend.py +10 -1
  17. sglang/srt/layers/attention/flashinfer_mla_backend.py +18 -10
  18. sglang/srt/layers/attention/trtllm_mla_backend.py +1 -13
  19. sglang/srt/layers/attention/utils.py +78 -0
  20. sglang/srt/layers/communicator.py +1 -0
  21. sglang/srt/layers/deep_gemm_wrapper/compile_utils.py +1 -1
  22. sglang/srt/layers/layernorm.py +19 -4
  23. sglang/srt/layers/logits_processor.py +5 -0
  24. sglang/srt/layers/moe/cutlass_w4a8_moe.py +138 -0
  25. sglang/srt/layers/moe/ep_moe/kernels.py +194 -0
  26. sglang/srt/layers/moe/ep_moe/layer.py +79 -272
  27. sglang/srt/layers/moe/fused_moe_triton/layer.py +3 -3
  28. sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py +7 -4
  29. sglang/srt/layers/moe/moe_runner/deep_gemm.py +287 -22
  30. sglang/srt/layers/moe/moe_runner/runner.py +3 -0
  31. sglang/srt/layers/moe/moe_runner/triton_kernels.py +194 -0
  32. sglang/srt/layers/moe/token_dispatcher/__init__.py +4 -4
  33. sglang/srt/layers/moe/token_dispatcher/base.py +11 -5
  34. sglang/srt/layers/moe/token_dispatcher/deepep.py +18 -14
  35. sglang/srt/layers/moe/token_dispatcher/standard.py +1 -1
  36. sglang/srt/layers/moe/topk.py +4 -4
  37. sglang/srt/layers/moe/utils.py +3 -4
  38. sglang/srt/layers/quantization/__init__.py +3 -5
  39. sglang/srt/layers/quantization/awq.py +0 -3
  40. sglang/srt/layers/quantization/base_config.py +7 -0
  41. sglang/srt/layers/quantization/fp8.py +68 -63
  42. sglang/srt/layers/quantization/gguf.py +566 -0
  43. sglang/srt/layers/quantization/mxfp4.py +30 -38
  44. sglang/srt/layers/quantization/unquant.py +23 -45
  45. sglang/srt/layers/quantization/w4afp8.py +38 -2
  46. sglang/srt/layers/radix_attention.py +5 -2
  47. sglang/srt/layers/rotary_embedding.py +13 -1
  48. sglang/srt/layers/sampler.py +12 -1
  49. sglang/srt/managers/io_struct.py +3 -0
  50. sglang/srt/managers/multi_tokenizer_mixin.py +17 -1
  51. sglang/srt/managers/scheduler.py +21 -15
  52. sglang/srt/managers/scheduler_metrics_mixin.py +22 -14
  53. sglang/srt/managers/scheduler_profiler_mixin.py +3 -4
  54. sglang/srt/managers/tokenizer_manager.py +11 -19
  55. sglang/srt/mem_cache/hicache_storage.py +7 -1
  56. sglang/srt/mem_cache/memory_pool.py +82 -0
  57. sglang/srt/mem_cache/storage/hf3fs/mini_3fs_metadata_server.py +3 -2
  58. sglang/srt/model_executor/forward_batch_info.py +44 -3
  59. sglang/srt/model_executor/model_runner.py +1 -149
  60. sglang/srt/model_executor/piecewise_cuda_graph_runner.py +22 -12
  61. sglang/srt/models/deepseek_v2.py +147 -44
  62. sglang/srt/models/glm4_moe.py +322 -354
  63. sglang/srt/models/glm4_moe_nextn.py +4 -14
  64. sglang/srt/models/glm4v_moe.py +29 -196
  65. sglang/srt/models/minimax_m2.py +922 -0
  66. sglang/srt/models/nvila.py +355 -0
  67. sglang/srt/models/nvila_lite.py +184 -0
  68. sglang/srt/models/qwen2.py +22 -1
  69. sglang/srt/models/qwen3.py +34 -4
  70. sglang/srt/models/qwen3_moe.py +2 -4
  71. sglang/srt/multimodal/processors/base_processor.py +1 -0
  72. sglang/srt/multimodal/processors/glm4v.py +1 -1
  73. sglang/srt/multimodal/processors/{vila.py → nvila.py} +32 -24
  74. sglang/srt/multimodal/processors/points_v15_chat.py +2 -2
  75. sglang/srt/parser/reasoning_parser.py +28 -1
  76. sglang/srt/server_args.py +365 -186
  77. sglang/srt/single_batch_overlap.py +2 -7
  78. sglang/srt/utils/common.py +87 -42
  79. sglang/srt/utils/hf_transformers_utils.py +7 -3
  80. sglang/test/test_deterministic.py +235 -12
  81. sglang/test/test_deterministic_utils.py +2 -1
  82. sglang/version.py +1 -1
  83. {sglang-0.5.4.dist-info → sglang-0.5.4.post1.dist-info}/METADATA +7 -6
  84. {sglang-0.5.4.dist-info → sglang-0.5.4.post1.dist-info}/RECORD +87 -82
  85. sglang/srt/models/vila.py +0 -306
  86. {sglang-0.5.4.dist-info → sglang-0.5.4.post1.dist-info}/WHEEL +0 -0
  87. {sglang-0.5.4.dist-info → sglang-0.5.4.post1.dist-info}/licenses/LICENSE +0 -0
  88. {sglang-0.5.4.dist-info → sglang-0.5.4.post1.dist-info}/top_level.txt +0 -0
@@ -2,14 +2,14 @@ sglang/__init__.py,sha256=CK60u1J439CJZaPihWqlDjFZ8doIC-5YgIYz-E1PIh4,1823
2
2
  sglang/bench_offline_throughput.py,sha256=Bge0KG4Uiv9CHsxDnqKdXJmG_TcxM4blz3CmvLmDRvM,14815
3
3
  sglang/bench_one_batch.py,sha256=cjECJgTmPcnP-b8Fcy7ldFU6FaEqBpz7Z45RTwBwNR8,23763
4
4
  sglang/bench_one_batch_server.py,sha256=8zAjLFu0tgfIhhtEaPGdDhi15YCcHcaK19vz6Rmn_Jw,26565
5
- sglang/bench_serving.py,sha256=KrPHSzFmzyhRerLBBOm-72sOr1toBQkNIOvRPdVBBc0,94023
5
+ sglang/bench_serving.py,sha256=tcgQ3SjTEG1CYvawDbhJdQeX3JR10yiINPxcSN47Jio,95619
6
6
  sglang/check_env.py,sha256=6wRlWL7UwY1JjYRG307bLLJRoirPk2RVLYrDWV8Et0c,8413
7
7
  sglang/compile_deep_gemm.py,sha256=v7WJZLSrJw3Vc_28lTReRDJ1WdiPKLRHizFi2l2chv8,6614
8
8
  sglang/global_config.py,sha256=bVpUL_gMSA0FwJl8y8tP5CIa7d083o6Dcak-yRytzGw,767
9
- sglang/launch_server.py,sha256=VqPi2ecJmQuvw1aYppiKEp45NC_FthgBjzhHM2pXItY,620
9
+ sglang/launch_server.py,sha256=SDfZfS1i0RtakLx1zX9uclHpefKHOiXd7MQI0ktYjx4,686
10
10
  sglang/profiler.py,sha256=uprc8Lo-WeqrQY9u2Wj503swEp4P_2laLJ6cWGALgME,4854
11
11
  sglang/utils.py,sha256=YreOyt4-fWdDcg01abaMJ0y0ly4gYps26vRlmWhwGC8,17267
12
- sglang/version.py,sha256=DITpct-LrdIsTgwx2NgH5Ghx5y8Xgz1YMimy1ZV5RTY,22
12
+ sglang/version.py,sha256=TvZB2PPVmaQCmVVHStxmVi90Tm1q4CKl6ezbtlp8gnY,28
13
13
  sglang/eval/llama3_eval.py,sha256=mLNRZJIqV4CfqrY8UGnJEcHw2Xsyr1eyYZgFSUFYr1g,9997
14
14
  sglang/eval/loogle_eval.py,sha256=-CC2s2kh5qUoDrHRkQVkC_jNvBgNojXbf456ny5s78s,4557
15
15
  sglang/lang/api.py,sha256=kyfJuErqMyle6hnx3Q_oqNSFDe0q4gFob1yd5ZLTatw,7438
@@ -28,18 +28,18 @@ sglang/lang/backend/vertexai.py,sha256=gz0uNYyBb88jbPYz6ZIJ774fefrcbuVdoK33bphUZ
28
28
  sglang/srt/_custom_ops.py,sha256=P4MLtuF8DzK66R_Sw88AYsiCOn7YNGZ93H7isJq0dUA,5356
29
29
  sglang/srt/constants.py,sha256=0i-tEwG2BSYNDy96MxnGHV5HnBELkYcnsVGsE-R18o0,93
30
30
  sglang/srt/custom_op.py,sha256=m5F7x3LHlnOuesmcNmJtIWsfHGFLBJ807vKc05Gu1D0,3312
31
- sglang/srt/environ.py,sha256=2D5x1OaR_lRd-oSLilf1lZo01Pqz2_t5Bru-LHIxYys,10447
31
+ sglang/srt/environ.py,sha256=wlvu5PP68cZLbH4DquMeZLkb3aVgJkc3aMzquHeyNbg,10892
32
32
  sglang/srt/operations.py,sha256=za_h1_kcR1Te6-i_r0i_zAeumbmIRhLK2pS31sukkrw,6089
33
33
  sglang/srt/operations_strategy.py,sha256=-w6GI2VgSGvORy3pUWRAJo6244ykSW1ZBV1Dx0fZlHA,7138
34
- sglang/srt/server_args.py,sha256=Qen-c7jcgQpTrub1ogsyxX_8Joj7WfP_rA6ZMIfsH-Q,160382
34
+ sglang/srt/server_args.py,sha256=igDvB6U6cnibpTgolFV927EwB90ALkqflmsHFslk714,168328
35
35
  sglang/srt/server_args_config_parser.py,sha256=NW_tnD_ixnIpEhIuhn1W67pnAOJSGWKKN-jHcssKD-Q,5213
36
- sglang/srt/single_batch_overlap.py,sha256=mUW2yBRxLWKlDlpTqIKkICWzMkcbKsmPjUtcvGiVYq4,5388
36
+ sglang/srt/single_batch_overlap.py,sha256=73RM4rQDjw1RQxW4GCWthRLQyoP2oPRA2oN7804dI_E,5236
37
37
  sglang/srt/two_batch_overlap.py,sha256=xDDMyE1hKQPq-yu_GkVnNXskyc1CVoPYPaB6AvoPXKA,34667
38
38
  sglang/srt/warmup.py,sha256=fQYzNp-I9mZccs2BerI6mOZd1CDQjdiuFCeUkcwiOb4,1834
39
39
  sglang/srt/batch_invariant_ops/__init__.py,sha256=Z9TvOE4BL7cAaBIePEsVglH7RcWBSBIsSHs-XbveQNE,728
40
- sglang/srt/batch_invariant_ops/batch_invariant_ops.py,sha256=Kb4uxHPDwlQYg1CfEOhuRDcHTI3Yr8Kbq3GkF57iUZs,16249
40
+ sglang/srt/batch_invariant_ops/batch_invariant_ops.py,sha256=aHC9BuEm_qY_9nQ87dzMCs1c8cTi_t9JGrq4kn6bEwk,19401
41
41
  sglang/srt/checkpoint_engine/checkpoint_engine_worker.py,sha256=YlyiZ46LOi5aib0N5IyrPMuGbnVi_Xnnf9r2XdR1OtY,5509
42
- sglang/srt/compilation/backend.py,sha256=SClr9jjC8wb8vymB2cE-6DN36bEbZeBlYcFx0qe-pfM,14395
42
+ sglang/srt/compilation/backend.py,sha256=avi40bJLD_XZd9a2r9Kcl3jOT-n7uiGVZTif76EFRWk,14424
43
43
  sglang/srt/compilation/compilation_config.py,sha256=9GDBY3SAV5hIJ6hmYurJ3vfYh9-gtZP3nEzp0TrUdeM,617
44
44
  sglang/srt/compilation/compilation_counter.py,sha256=qrCqMCaui2eOBpxi3ZBiuvmJ6dkWah_6dYjhvu6_MqE,1623
45
45
  sglang/srt/compilation/compile.py,sha256=All4G5VjYBY9MOalW5YDo17eEtho-o_BG5V86lNJ-5c,6965
@@ -68,7 +68,7 @@ sglang/srt/configs/kimi_vl_moonvit.py,sha256=hx2Rt4JSFbvy2HUTeLjBpge87m8M6ITAhqs
68
68
  sglang/srt/configs/load_config.py,sha256=_x9n6Rkbi3VqYmXJ7PNdce32mvUNP1ewqrkUsJ7qprw,4765
69
69
  sglang/srt/configs/longcat_flash.py,sha256=Qp25xJVLq2K72Z80cXhcJxtqhagAdiPySDoevuT0Sno,3589
70
70
  sglang/srt/configs/mamba_utils.py,sha256=AD96wj8FCxRsEovdtGn88xzcKAw5KErbO5xFSk0xwxc,3684
71
- sglang/srt/configs/model_config.py,sha256=7KAlFFRQr9Vsj2PzFBsGnmzXQGWo3eHtftSnaQjDruE,39695
71
+ sglang/srt/configs/model_config.py,sha256=16APos-1uvf8oQsfU1yQz5HBSXI2WWQQU4pBCkeY3PE,39657
72
72
  sglang/srt/configs/modelopt_config.py,sha256=pr4Q_J4G1Ff-wy24BYRzWaN0UI34rreGef7Nt6d0X3M,1070
73
73
  sglang/srt/configs/nemotron_h.py,sha256=X39hWm2KQoAcZ4HXKDCfbua9aOTlcxcK89c52cmAq-k,13072
74
74
  sglang/srt/configs/olmo3.py,sha256=DOyp1cNi_n8ckz9Ohs3zUZqkk6n26UBsNQ3zngHNNNY,3600
@@ -126,7 +126,7 @@ sglang/srt/disaggregation/nixl/conn.py,sha256=w_kDDEB4fIvDe-Z7ufxmw_cpDR57xXJVQr
126
126
  sglang/srt/distributed/__init__.py,sha256=jFOcyt-wFAPMBUAf9zkZalNQlt-4rqmT6pCKBz1E4qo,149
127
127
  sglang/srt/distributed/communication_op.py,sha256=IBnFUdMftK_VSTMMMitGveonorFUUVNL4guqO31cMSc,1130
128
128
  sglang/srt/distributed/naive_distributed.py,sha256=GX7CHhUb9rIQuaIPX4TYm01S7XQdBXvdqaJoPdxFyAI,3317
129
- sglang/srt/distributed/parallel_state.py,sha256=SHisHdAql3dVBFUR1zIZo3apQMejRPh0hQYn5AaA9N8,70931
129
+ sglang/srt/distributed/parallel_state.py,sha256=2lenq6afSb6xGdvOw2dvpD8ssjm7XTbSF0BjJ_V-mbg,70571
130
130
  sglang/srt/distributed/utils.py,sha256=aaCxATncLGnVgB0WlGpBdee0behKW8Dy_dakqcuKSaQ,8497
131
131
  sglang/srt/distributed/device_communicators/all_reduce_utils.py,sha256=dk-uFaKZgVG-1dZDwMT6GvpFi2xP0DJRJ9BiRjHq0zw,336
132
132
  sglang/srt/distributed/device_communicators/cuda_wrapper.py,sha256=3jvPG-Ow5UBLiXhfx8T8snR7crSZbPpARAggsDPWq7k,7038
@@ -145,10 +145,10 @@ sglang/srt/distributed/device_communicators/xpu_communicator.py,sha256=ajW6132Bv
145
145
  sglang/srt/elastic_ep/elastic_ep.py,sha256=KaSUAi0JHB82desvcv-TW5_PYCrzQStslOCcl9_g-LM,2311
146
146
  sglang/srt/entrypoints/EngineBase.py,sha256=yKN76witT2jz1zhmLHmPNLGMpK2UiOTaKQ2KPD8l99U,2594
147
147
  sglang/srt/entrypoints/context.py,sha256=YQdVLmELQD1tNT6Q1BLl04sATwTJAAomCATZyD19S8g,8035
148
- sglang/srt/entrypoints/engine.py,sha256=yiIVBjbMLgL1s5A19bShgeqRdAQlv3OGfz5swHNTunc,35010
149
- sglang/srt/entrypoints/grpc_server.py,sha256=CHiZDErgPHnVp8PtfH246U6Eq_BEoKANJKAttNYXjBQ,38869
148
+ sglang/srt/entrypoints/engine.py,sha256=-Cmjdfq9QxXKCXXVSnOfg2LIvpteQlIvr0sMBUn1IZQ,35028
149
+ sglang/srt/entrypoints/grpc_server.py,sha256=3yio35-FDDYwCyt0QwTRDu4Z1ASS20UmqK7Hz6fBbRo,38813
150
150
  sglang/srt/entrypoints/harmony_utils.py,sha256=FhpPFnwgy1-qLnu_HZAk5V_RPmQkT81dFVp8A6xINEU,13594
151
- sglang/srt/entrypoints/http_server.py,sha256=Y1Rl71phsasv8Tot1wlKl1GpJK2b_xqT_EqPEfjKOTM,56378
151
+ sglang/srt/entrypoints/http_server.py,sha256=tBGTW1MA_6Dtqb0_z_mWHjmpY9ZLIaGehLHKJITvdJg,55556
152
152
  sglang/srt/entrypoints/http_server_engine.py,sha256=rWgdCYLZZP89MA-Y-hfACQqdDu0LC7lLYghi2wk-nU8,4809
153
153
  sglang/srt/entrypoints/tool.py,sha256=aAXEjBqkr5j6_IgRL8fZCKgoDPY2TikM20-LQXU9TaI,2709
154
154
  sglang/srt/entrypoints/openai/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -167,7 +167,7 @@ sglang/srt/entrypoints/openai/usage_processor.py,sha256=9LTB5rqdRuMKyZrIXiUBuF_W
167
167
  sglang/srt/entrypoints/openai/utils.py,sha256=DT9quW0F1DX1P9NAuMxpERgXcNYKKtm7rd7J1m7EaDQ,2112
168
168
  sglang/srt/eplb/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
169
169
  sglang/srt/eplb/eplb_manager.py,sha256=e8HMGzZb2QFRGdS7JZIFSy8cOIlxOlGRY-ef7Wei0Sw,4364
170
- sglang/srt/eplb/expert_distribution.py,sha256=lU1Pw8qVooiyv3LPIW1Jec09wLs22_eKdxs0kuS6vgc,32901
170
+ sglang/srt/eplb/expert_distribution.py,sha256=X28mY6j91VKFbBtMHPwYdFLB8vYtzSjxNF82W3XVGKo,33892
171
171
  sglang/srt/eplb/expert_location.py,sha256=WoOmsZ4u9le44km3nbjJjF6BVBxN3cKRz9nQM0uWH_s,18386
172
172
  sglang/srt/eplb/expert_location_dispatch.py,sha256=mZUH-jvz7yvxC-5bwMFQalfKbbJiZujMiRK_M9oGOT8,4163
173
173
  sglang/srt/eplb/expert_location_updater.py,sha256=7LOmLtY_YWYySI2GgFuTJ__Qde0LEKq70E77Q608OFU,21157
@@ -182,12 +182,13 @@ sglang/srt/function_call/core_types.py,sha256=wLUsW8mUA-i-ISz5QUDL7Ejq72W-K1HIhF
182
182
  sglang/srt/function_call/deepseekv31_detector.py,sha256=hpRjjv219mH0v1PQpMvj_gezrP7PwvLiNbBKOTCSC3U,9731
183
183
  sglang/srt/function_call/deepseekv3_detector.py,sha256=DhO3tUX1nvFlfRkHJ1Vm_7OMXFFTvWBA9u9SZKFAwuQ,9710
184
184
  sglang/srt/function_call/ebnf_composer.py,sha256=OpjfvYowLlMLnxz5fwS7zv5-d43_ZwO9ucGAMsILvm4,15321
185
- sglang/srt/function_call/function_call_parser.py,sha256=CXP_4OEo0M9aE3vXMW-m3VJTq9uVhM2w3NOcnnmXjuA,8762
185
+ sglang/srt/function_call/function_call_parser.py,sha256=JDZzRmXBypTfhGm_hZDmhw6o2XkyWCd4iYyxqvmcsxk,8869
186
186
  sglang/srt/function_call/glm4_moe_detector.py,sha256=B4GjjgoDVc4ETyqCowfWQamIhhUDwl6pA9xsAE3sOfo,6943
187
187
  sglang/srt/function_call/gpt_oss_detector.py,sha256=ti5Dwci_3J9XzqQetMILY7R-VTCCRbGbHas3DdC5x28,9263
188
188
  sglang/srt/function_call/json_array_parser.py,sha256=m37S_3bQtyAI86T3ju80dkKJxuazA1VV0J5ioK1uQbw,2205
189
189
  sglang/srt/function_call/kimik2_detector.py,sha256=VWN4Nf9l9O0uSUR0UppuoAyVObvGw-rVvklFJ1qzbRA,10641
190
190
  sglang/srt/function_call/llama32_detector.py,sha256=trZja7IXc2IWUko5PRj7p4pRU6XCVjtxr-7qJNr0EWo,3647
191
+ sglang/srt/function_call/minimax_m2.py,sha256=1Q5uo-cUUtKykYDeAWx0CxqiDtz2_oC7sprsAJL6Ki4,14689
191
192
  sglang/srt/function_call/mistral_detector.py,sha256=Ts2HrJdu5r2lCCMVKPZfnCds9pt1K5H1EaOQrF_HD60,4686
192
193
  sglang/srt/function_call/pythonic_detector.py,sha256=yAatItKtVDf9uhlB78wPWKP3fbefLJDNGGzFV5ey-YA,8756
193
194
  sglang/srt/function_call/qwen25_detector.py,sha256=nv83_sipZMU6Vie3J4HeNiZVCSRU5ei7601j50779HA,5181
@@ -202,24 +203,24 @@ sglang/srt/grpc/scheduler_launcher.py,sha256=GMuNCfF4MYYjJL3O8NqQrg1N9P7T2QyRmpx
202
203
  sglang/srt/grpc/sglang_scheduler_pb2.py,sha256=ALq0gD19OUC4CdjbOU2YYHGmgTlkJvWX3exX_SOXSv4,16016
203
204
  sglang/srt/grpc/sglang_scheduler_pb2.pyi,sha256=ibYeIZPchbx4fcLDeAa-LSnq6MZi-mh4DgzIGg-SUWY,26274
204
205
  sglang/srt/grpc/sglang_scheduler_pb2_grpc.py,sha256=8FQtALiqSyWkqL6P_rKerievE9q19V3675AEEomNSe8,12633
205
- sglang/srt/layers/activation.py,sha256=Qg-goR7CSwQeBhS4IO56wCA7jMR_bPNZJHnLDZNnm5s,13407
206
+ sglang/srt/layers/activation.py,sha256=9NArY7s3okKipcJaVLHuX9Irw71z4c338AbsqeUocXQ,13671
206
207
  sglang/srt/layers/amx_utils.py,sha256=1mENgHK2B8mgaD1oMtgbZ15Jmy_Uu1QueBmo09Ff2iA,2865
207
- sglang/srt/layers/communicator.py,sha256=dmoydeyHoiVQCr1PvMcTwM1Kirv71PZOa-JSeVD6n50,24465
208
+ sglang/srt/layers/communicator.py,sha256=ZS1A_wkCaljrOT1nrjQlUhImNFeyZsiONUjOfIa5SjA,24511
208
209
  sglang/srt/layers/dp_attention.py,sha256=dBfEtofjY9MlCDF5B-y_zrX-owfZ46mSBYioCzlIoHM,16817
209
210
  sglang/srt/layers/elementwise.py,sha256=tGbN7bbK2s-j3DoJeJfkfyPNmKdVAutAd0J3TbxUPAQ,18849
210
211
  sglang/srt/layers/flashinfer_comm_fusion.py,sha256=hnVVS_VsWukTYhREubWs2KcJ1GjVMEI9ECqxqOMXZv8,6729
211
- sglang/srt/layers/layernorm.py,sha256=Kf18oGBMTyqjaeeTJMeCYhyrQb-8NsSjhG0QDswM8rM,12334
212
+ sglang/srt/layers/layernorm.py,sha256=CI1sJ_I3nZMy-cpvcbxIAGk52iFoR6eme9S27cDdPFc,12906
212
213
  sglang/srt/layers/linear.py,sha256=1g5vEFHqSd1TPb0VxQiZ5oga45QorYxvj2CZl_NM9wc,56084
213
- sglang/srt/layers/logits_processor.py,sha256=VNMPpyxVNNXtOxd9nui0Yrm8MUkjrGBEL1cmUYXLyM0,34499
214
+ sglang/srt/layers/logits_processor.py,sha256=0xOFWdBdrQYGz7uihAscwjdeiEMgkY9hHrWzia1R_cQ,34792
214
215
  sglang/srt/layers/model_parallel.py,sha256=eLXZhvJ4wG6dh0FontNCIdVZvHYdWgaeY-5cu7TD9tE,6078
215
216
  sglang/srt/layers/modelopt_utils.py,sha256=Abhiwmu1VOoSePJWytgFxRw_6qTtN2rqT61DPDboCIw,335
216
217
  sglang/srt/layers/multimodal.py,sha256=vNswe0J0maeBiN8ehlmxfs-YYlrmMllYl6Nc_Y57Neg,5114
217
218
  sglang/srt/layers/parameter.py,sha256=6ce1lx2urWJKz87g2qg_oce_S5BV0IcguSiOGGHbcC8,18378
218
219
  sglang/srt/layers/pooler.py,sha256=uZ6WX1FLMEafZwusyZdm6KuVlIwSjbKrdwk2qzgqNGk,3812
219
- sglang/srt/layers/radix_attention.py,sha256=HvTa-gSz86XdN9mcK7H3lrQXjGfAMnBzI1lM8WKaIUc,5203
220
+ sglang/srt/layers/radix_attention.py,sha256=SqL-15JQWxjoSZyaOxfhGqUE0Vu_55O_ihN5CiPRxfM,5310
220
221
  sglang/srt/layers/rocm_linear_utils.py,sha256=7PPh-5H2IYjiLp_g_szzVBsmiMacZ1RtjVtjdrdFJKI,1374
221
- sglang/srt/layers/rotary_embedding.py,sha256=ZekORUqqnej3PP8-ETIhvlkweLMhrP1nZTH4Qz3fB-E,101467
222
- sglang/srt/layers/sampler.py,sha256=bnfa0jtHBWcXeDALGGYR6t1DOejaG2LBqgG6kmXP7Fc,20632
222
+ sglang/srt/layers/rotary_embedding.py,sha256=nAc_bIZN2UFN7O2hgoImNfv4msodVeOFf4ft-gbsS68,101948
223
+ sglang/srt/layers/sampler.py,sha256=CunUv_aB_Dw_SqOimQRdw0W21pG75TMH-lvGRr2fNR0,21177
223
224
  sglang/srt/layers/sparse_pooler.py,sha256=9gB8duR48R-FGtA4Q7D1fIDSvbKlD70N38S3Lvg773s,3424
224
225
  sglang/srt/layers/torchao_utils.py,sha256=Ws24FdRBSkTpyeyA6bQrdDm-W5wfDxKvSIPUSahyMfA,4063
225
226
  sglang/srt/layers/utils.py,sha256=F_hhE514OZ4cyMklga3mipdUzlrKo3SolIcuqgqqQqQ,1913
@@ -231,9 +232,9 @@ sglang/srt/layers/attention/base_attn_backend.py,sha256=oYk0ch5ptL2EtlhjyitKvu6H
231
232
  sglang/srt/layers/attention/cutlass_mla_backend.py,sha256=cb2dMTnDMmMVBG_lqFRciVDiF3PeEAcXYaKDFWszeTw,9849
232
233
  sglang/srt/layers/attention/double_sparsity_backend.py,sha256=wkF1GxFuLsGUWYoPWoqdz0xpePqA_nbo7xd2ha67sng,9135
233
234
  sglang/srt/layers/attention/dual_chunk_flashattention_backend.py,sha256=20vmnq68-Cq62UWIzQU_uwJzq4B8KdJeZUPVoWPiyDs,68620
234
- sglang/srt/layers/attention/flashattention_backend.py,sha256=0bbODTKS-DADucy-GmR_1LQzwezvXuXGuP21Y6WH5EU,105314
235
- sglang/srt/layers/attention/flashinfer_backend.py,sha256=R06qwUhhfeBL2qAD1CRS9KzmdoiGxO10QjAoAouNDjA,63332
236
- sglang/srt/layers/attention/flashinfer_mla_backend.py,sha256=LrhlHUVn0ZlvCIhK8iAjqEEqUUvRydJn7TZ7Hs4o3B4,39462
235
+ sglang/srt/layers/attention/flashattention_backend.py,sha256=jBN4xznXLKxgr_bJ3v3L6TvwgX4QxuH-tAW7Yl3H2mc,105725
236
+ sglang/srt/layers/attention/flashinfer_backend.py,sha256=6yfbhGS1lGhQYqgoLFCVm05fQcniu--D4uQuhCWYCUY,63842
237
+ sglang/srt/layers/attention/flashinfer_mla_backend.py,sha256=lr6SeoyzhgxX25e8Tt6lxCmeJLigNRa5kAmkE2GsARM,39786
237
238
  sglang/srt/layers/attention/flashmla_backend.py,sha256=HijFHZZ-pGE75NytFXsS0MIv8d-zWJGRRdfjdF1ViJ8,20860
238
239
  sglang/srt/layers/attention/hybrid_attn_backend.py,sha256=_Gol1e_m6vMKhpUw2-OQ37ymC5sIuSTntDylVKSZtpA,5121
239
240
  sglang/srt/layers/attention/hybrid_linear_attn_backend.py,sha256=tqwPna30r1zriVhKlit-iVfpfy6hJGxumGKsnlJ20C8,26119
@@ -245,8 +246,8 @@ sglang/srt/layers/attention/torch_flex_backend.py,sha256=MnnZLxi41R-d4P0cyklNyef
245
246
  sglang/srt/layers/attention/torch_native_backend.py,sha256=NdWD2ArmS1lQN9mZIbS2rcHueBWColNxvhcLaQGAKGQ,9728
246
247
  sglang/srt/layers/attention/triton_backend.py,sha256=30z1z_aJ9jUKGG3rc-2DI6h-3HO3w3hVpcFM18BVSQY,50504
247
248
  sglang/srt/layers/attention/trtllm_mha_backend.py,sha256=IQUu3jkCuAY5foqvR6L1IYjjVD4qfmTwG6rfo05ZVkI,27516
248
- sglang/srt/layers/attention/trtllm_mla_backend.py,sha256=7ceisj7_0X9mK1dDheEoVuIXHsMDjptoaw9HycBVxYQ,41679
249
- sglang/srt/layers/attention/utils.py,sha256=uRyxLjpRMVesPDFtGHtzJDHQvWhS4AsGW5RGCsIYPBk,3230
249
+ sglang/srt/layers/attention/trtllm_mla_backend.py,sha256=YrC662lqz5nCdGvq_6bdaxWsMYx6AVne8vTjAuQu2n4,41079
250
+ sglang/srt/layers/attention/utils.py,sha256=L1FlCmgWsH-k-ccXcuSiB9Tj4z7b-a7KMWPZKvCXowQ,5478
250
251
  sglang/srt/layers/attention/vision.py,sha256=-MX_K0_mX58xkpaS6O93vWIJVqha4iNgYNN5M5Yptnw,21763
251
252
  sglang/srt/layers/attention/vision_utils.py,sha256=6hPPAt8p3SOm7tgHNUesnMLxvQiKbaOM5EK6K-ig5dI,2771
252
253
  sglang/srt/layers/attention/wave_backend.py,sha256=dMsR7GsfDYgVizY8QJ94ASrxiiJ5_MNOuTUDDQzvpPQ,22915
@@ -297,29 +298,29 @@ sglang/srt/layers/attention/wave_ops/decode_attention.py,sha256=oJNBG57cySgxtmJe
297
298
  sglang/srt/layers/attention/wave_ops/extend_attention.py,sha256=LyZQQIvFYfcIcObgy_tETK5JxRLgAkOYlF-KhGcGEoA,3877
298
299
  sglang/srt/layers/attention/wave_ops/prefill_attention.py,sha256=viTUit0rxjVV5UahuwmVAhmL66YRFJD4g1YhH_oRBu8,2344
299
300
  sglang/srt/layers/deep_gemm_wrapper/__init__.py,sha256=esJMd0Yuj68t6QYOpmIFuiWP2J2dxTMC4bRBNH0Xk6I,26
300
- sglang/srt/layers/deep_gemm_wrapper/compile_utils.py,sha256=tvoJ2PmYJWm6j_JfRpmBhg7mUZyH27f5JJeDZ4xcZhg,8067
301
+ sglang/srt/layers/deep_gemm_wrapper/compile_utils.py,sha256=EoRu5a-eiXcBZV9bVJ0x8ATLpKLt_AUeTNixdeJ1bSw,8070
301
302
  sglang/srt/layers/deep_gemm_wrapper/configurer.py,sha256=vkMBNZx3RqukEtxMUAbTfKJii3MDXLBs83ZlsgtxNiU,559
302
303
  sglang/srt/layers/deep_gemm_wrapper/entrypoint.py,sha256=5VTBfCU6wTBS2uMJc-luyqawh1478w3Jh1qk39qhjlI,3199
303
304
  sglang/srt/layers/moe/__init__.py,sha256=P8OC-pUE5yeEr80QUDqSPwF9a9BAYPuaK7GNlQovsJw,863
304
305
  sglang/srt/layers/moe/cutlass_moe.py,sha256=335MeGbcVPsAI9oaEQCVSMxzzQ9YV1qPiNxINXtvO48,14206
305
306
  sglang/srt/layers/moe/cutlass_moe_params.py,sha256=9NRCmgP_Ug3gGqCcpi-x-QRbLjCNpw8792gKXwZsbEU,6522
306
- sglang/srt/layers/moe/cutlass_w4a8_moe.py,sha256=yTSlr_B9y1jiAmp6pX88LHb7hQ351Ensa8SR2fgW3v8,13898
307
+ sglang/srt/layers/moe/cutlass_w4a8_moe.py,sha256=2vVS2bhUuKRsDnPR2cNUKli9Pbi32lzQ--0jRpyYB_I,19210
307
308
  sglang/srt/layers/moe/flashinfer_cutedsl_moe.py,sha256=ULLAdfRad_sG2ZYXE4qMCOutQX0eckQt0fwwhfcsckA,6186
308
309
  sglang/srt/layers/moe/fused_moe_native.py,sha256=XzJPM9Z6YQ4ejrMrBFt3l1i7guBcdQTXo9-gT5H8AIA,3479
309
310
  sglang/srt/layers/moe/rocm_moe_utils.py,sha256=SglTXIzpiWKFKVEf9gS8SEocJYcSOmeKUKjHznfC_nI,4527
310
311
  sglang/srt/layers/moe/router.py,sha256=ouSNu8XU2w-BICyAYPpFq2zPb11LyTDalZElh0AXGus,13675
311
- sglang/srt/layers/moe/topk.py,sha256=reUXYWZdHVfNJnrRxd8kXjGVLhdNu3AxRqOt5N7NyGg,32306
312
- sglang/srt/layers/moe/utils.py,sha256=lP4WESNZBjCaY-dOnuJ6jkrrAXl2e3pR3MTMjyWQFic,6782
312
+ sglang/srt/layers/moe/topk.py,sha256=bjmeGhdwlSOeQpzb2XjBVNcpCX-L0chN5aanzXmTw3Q,32310
313
+ sglang/srt/layers/moe/utils.py,sha256=UZsd1KCXNZ4XFWNnxZiNywsuYEtA7xOQLd52c6RZC9U,6701
313
314
  sglang/srt/layers/moe/ep_moe/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
314
- sglang/srt/layers/moe/ep_moe/kernels.py,sha256=DjgEBHIS8-S1SO46xGbnREc2vQ8dO9dDKNRYKZuwMzM,32125
315
- sglang/srt/layers/moe/ep_moe/layer.py,sha256=D8U42eegm1cwuS9zpwIOj_DV_LmiapMOh2hMWJOBWj8,26193
315
+ sglang/srt/layers/moe/ep_moe/kernels.py,sha256=jsSLb_D7u60_8NIHxTEoEerRAbQFJXPWJHMpRVsEyOU,37898
316
+ sglang/srt/layers/moe/ep_moe/layer.py,sha256=jra2o5MZ2od5T4J3CiJH7XZor2zW94fvcP7j4IvvqCU,19836
316
317
  sglang/srt/layers/moe/fused_moe_triton/__init__.py,sha256=tis0ZJmih7gKHCurbLtY_o-bY3K4MOzQLYLC3ftIOf0,977
317
318
  sglang/srt/layers/moe/fused_moe_triton/fused_moe.py,sha256=mKH6zTTuh_Z8Ceg6d1VWjGBI3iPBn1YfGO6udxIRAtU,23306
318
319
  sglang/srt/layers/moe/fused_moe_triton/fused_moe_triton_config.py,sha256=0jTqnuw8v6uwr4g2IJ6bc3PRq77HF96mEYaSOBmpTAQ,7983
319
320
  sglang/srt/layers/moe/fused_moe_triton/fused_moe_triton_kernels.py,sha256=QOdl5uhZ8--aryXnKObdspKonGcF6Tc_U9o_lC_opo8,27760
320
- sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=E2qURbonpdnEOqEV2MmgLgUdecCSyfxyua3rmWb5kiI,39806
321
+ sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=QvljwzkINsJEt9q5HkS-0KC0QDq_vuTIMJh2QAkH_18,39827
321
322
  sglang/srt/layers/moe/fused_moe_triton/moe_align_block_size.py,sha256=U93mxPPU2RP7d3QRSvoG3OCtUQIK8YhQfHf1ZGeREmY,3284
322
- sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py,sha256=8_LiuVJqeuMIsy0nBJExYH9RAftfyutCKh_2NWU10rg,10141
323
+ sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py,sha256=g1duB_VckkfiqyB5ePWRv8Nndwr5OoqnN9pEiVUrVXo,10408
323
324
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_1_0/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json",sha256=iNGsE2ZeVnQEnN4A8UJ9Jv0d3hbRF2MJ9oBgjup5Szk,2737
324
325
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_1_0/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB.json",sha256=JJN0hryyLr5Zv3dSS7C8cPFhAwTT6XxUVnBGMZvV6JA,2752
325
326
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_1_0/E=1,N=1792,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json",sha256=ouRyZ5PEMPP2njPftCNhs-1g1y6wueWLmhI7G1SjV1k,4131
@@ -529,23 +530,25 @@ sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py,sha256=8_LiuVJqeuMI
529
530
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=512,N=64,device_name=NVIDIA_H200.json",sha256=phmhkQNz8DcLHPqN5tjmJqOgbX0BhQx9cP82fp_jyIQ,3236
530
531
  sglang/srt/layers/moe/moe_runner/__init__.py,sha256=Dc4PH6HfzQDjJWL7iuZ-0qh8oRu7OtnH6IEl675pYiU,172
531
532
  sglang/srt/layers/moe/moe_runner/base.py,sha256=GMdFI74BGO5HDjtel5QWI7W4CFix0BHkw_HrjVswhcw,8905
532
- sglang/srt/layers/moe/moe_runner/deep_gemm.py,sha256=xhxZsQpD9U8OReNaA_qwXWA98hVUS6rvcbWukQcv8tc,9342
533
- sglang/srt/layers/moe/moe_runner/runner.py,sha256=MCrPZQuuTxD4NGdnRaIkLc-xy8yOnXZW3ThJ2L-ymu4,2845
533
+ sglang/srt/layers/moe/moe_runner/deep_gemm.py,sha256=Ntif63j3HYofgc8f1FED5sRQrzGsnBKiwuTdalGGWp8,18123
534
+ sglang/srt/layers/moe/moe_runner/runner.py,sha256=eJhOjzbKwcNSGztwTKAJxpcSYm9pqv_C60MJGmPkr_g,3041
534
535
  sglang/srt/layers/moe/moe_runner/triton.py,sha256=pYzFyJDocnBfNiF6kp1cnSZmKKTsLOYXpAUXFZYKOsI,14464
535
- sglang/srt/layers/moe/token_dispatcher/__init__.py,sha256=0lIB1lkEcVYiW2iEL_hzAPk-AG85dFYAdyK9MBftHsw,1273
536
- sglang/srt/layers/moe/token_dispatcher/base.py,sha256=ZisVo2ty9vx5Oj1V1_w570_v8e8zbIpcEeXl4UUeZVQ,4015
537
- sglang/srt/layers/moe/token_dispatcher/deepep.py,sha256=lVBM2ZE4XgHX4eqVuFuoF5rPPrY54CKoiapa3txFvcc,26430
536
+ sglang/srt/layers/moe/moe_runner/triton_kernels.py,sha256=qsV9-k9iblqxE8J4JWyJS3Mfd7he7aZUYbIa8QTY1vo,6350
537
+ sglang/srt/layers/moe/token_dispatcher/__init__.py,sha256=rFv-j_zeUrKEOniMaODRi3EUaRAIufj5jIMGt45JdwE,1305
538
+ sglang/srt/layers/moe/token_dispatcher/base.py,sha256=joEgkYGDKlyYyb8hCOTYI_jAnZ1M_IRaT8WshXiolZQ,4253
539
+ sglang/srt/layers/moe/token_dispatcher/deepep.py,sha256=S1ucIB4erQgOqfAC21cB3e-WAFCxaSFH7DgxNUlXbgQ,26705
538
540
  sglang/srt/layers/moe/token_dispatcher/mooncake.py,sha256=ZQpjlv-WvEvTgFE6R_zuzFZXOfbRwVvXFYpOnWuCBXk,11855
539
- sglang/srt/layers/moe/token_dispatcher/standard.py,sha256=2il92nCW6HuuUrkT9MHumTQf0FZ-JhVBoWNzwaZ_Zwo,3461
540
- sglang/srt/layers/quantization/__init__.py,sha256=f05hWlwXrtzH0Ugk4kY6xofrnMK4A63FbSyPj5GMi6w,6343
541
- sglang/srt/layers/quantization/awq.py,sha256=jeGGkHIkmRsGHNWo27uNPB7B6M1uYSVmmjeCbhdIjew,33411
541
+ sglang/srt/layers/moe/token_dispatcher/standard.py,sha256=fbYsC4iBmRL49ha-wPSL24hP9qEZMUMeHTxIj9By9Ko,3462
542
+ sglang/srt/layers/quantization/__init__.py,sha256=4kFbEgYmLsV0H5pwU-M-yJSYzSzaBI7dFOF6N4CRB90,6301
543
+ sglang/srt/layers/quantization/awq.py,sha256=zm3wcy7k90cNlFvPT7uY2JsravExXaZuC4a3nsRdKss,33343
542
544
  sglang/srt/layers/quantization/awq_triton.py,sha256=1QwpxPoqcfe3sDU8uRs3LXBRcDZvq-M9xQ7NE9RV0Mc,12658
543
- sglang/srt/layers/quantization/base_config.py,sha256=v9apbnLDBUqQfm67kAYeky1Fe_RVyi1Upeua1w1ncK8,7895
545
+ sglang/srt/layers/quantization/base_config.py,sha256=NP7QyI1lCq5JxerPIDTy8TYQqOwSRGreNeD-Sye2Zus,8214
544
546
  sglang/srt/layers/quantization/blockwise_int8.py,sha256=pqSLo4gwazZ4ajdVzyouwh_Z5oVDbWq9wo8RnrMdY8o,13998
545
- sglang/srt/layers/quantization/fp8.py,sha256=pyJxdl5jrXjzup27BI2hmIqKic_S9qI0siMR5qL_XeY,53442
547
+ sglang/srt/layers/quantization/fp8.py,sha256=75F0a9xRIGCmZTY_KGsEEYu0VXQFJTJyWMLo2BTOjhQ,53658
546
548
  sglang/srt/layers/quantization/fp8_kernel.py,sha256=noTju6oEzKQ4mOcgWF8s0sFL5g-PuxLrCivvSbKQJWI,56181
547
549
  sglang/srt/layers/quantization/fp8_utils.py,sha256=enZUimrleDg7RJhoh7uxVLRYd1dSMKeCUhaXuwWAYyE,29831
548
550
  sglang/srt/layers/quantization/fpgemm_fp8.py,sha256=OpDJAOBpy3PtAvDwG3ZIA4ItMFvrodxAHTkHQnT_cso,6967
551
+ sglang/srt/layers/quantization/gguf.py,sha256=XCjW3-Xe63mwNUDT02U09JiBUMdxxX_slmeaoWMEIP4,19824
549
552
  sglang/srt/layers/quantization/gptq.py,sha256=oAlxR3qX06Pwc9-kkrzu7W4j0K-zWfi2JQL3yO0HHCI,39377
550
553
  sglang/srt/layers/quantization/int8_kernel.py,sha256=nl3bmwcgvs8SCe3_jz0hC5f6HfdohhEMyeWM_t8Zx5Q,13124
551
554
  sglang/srt/layers/quantization/int8_utils.py,sha256=YK9CS-lb_n91kNCTKK5o5apYF31V2giDg5G5VKrpcUA,2356
@@ -554,15 +557,15 @@ sglang/srt/layers/quantization/marlin_utils.py,sha256=Zvasw0DpgMQKTNJm1ZNGLt3P1A
554
557
  sglang/srt/layers/quantization/marlin_utils_fp8.py,sha256=iSjq-ikPOTU5plrWNTW4MletKLySIrNl5NhQmY6FyAo,12508
555
558
  sglang/srt/layers/quantization/modelopt_quant.py,sha256=yKs6xczPfjKV1UKB5S50nol4rRURMX4m7_7pYIYJZU4,60689
556
559
  sglang/srt/layers/quantization/moe_wna16.py,sha256=uoRhxJ8W_U_VFpbn03YEp0aCjbzqquWwonjuN7KBucw,19117
557
- sglang/srt/layers/quantization/mxfp4.py,sha256=OpthUaglm7Yf9jojZenHqRSVLWLy3mFuGk6PvgPNsnQ,31829
560
+ sglang/srt/layers/quantization/mxfp4.py,sha256=9DurnjCX2BBWveFfE-ISTAhE4VOW0BB0ZNPMsrgxYEM,31337
558
561
  sglang/srt/layers/quantization/mxfp4_tensor.py,sha256=bGeCXlIOhmFZFGWp_lITkIRDEgGUaLpawDvMy1cTOmA,5389
559
562
  sglang/srt/layers/quantization/petit.py,sha256=foRPfOfhq02h6yMt-8yHKofQB6l16Pz-bRCqUD3iiHU,8944
560
563
  sglang/srt/layers/quantization/petit_utils.py,sha256=-gy4zMhqNoIA1R0n7-5C0efV54jHonCUgPDUUFjGsyM,3245
561
564
  sglang/srt/layers/quantization/qoq.py,sha256=jM96uJfKz3vo1B6SSIrQXNT3vnD3UJrepK2eY-tSQU4,8139
562
565
  sglang/srt/layers/quantization/rocm_mxfp4_utils.py,sha256=Z4pYWl6ExOXq2qfTHorW16hVbJ-Rk4G8Wrxn_x8boHE,327
563
- sglang/srt/layers/quantization/unquant.py,sha256=T-KbIdvsYSqNdYfdnH7zSy9foSHMagPcFLfxkfF8e_g,15980
566
+ sglang/srt/layers/quantization/unquant.py,sha256=FtgCj24edm9AhrPpEqMAIf8w1Sz83EQ5dgBYXnRuGCk,15043
564
567
  sglang/srt/layers/quantization/utils.py,sha256=yqgmoLvrrp5aRj-LTJZ6dI1hmP1UFgbpyjVWJJdomZQ,18472
565
- sglang/srt/layers/quantization/w4afp8.py,sha256=yYvI7Tv4N3urK4m6QyO6cWa-SBz7bN6bZREnDqwX4wg,12969
568
+ sglang/srt/layers/quantization/w4afp8.py,sha256=dm8Um2oraXdrNXiyrdDshg-z3_aSTs_V7Eh-z3o9PuU,14155
566
569
  sglang/srt/layers/quantization/w8a8_fp8.py,sha256=ugLV4G4MDog-UuLqSnEasBqE3Hh6AqE5ZYI371ean90,10415
567
570
  sglang/srt/layers/quantization/w8a8_int8.py,sha256=WkhbRVnEamh78uyj9WyS9OfeSpZTsWh51kDCH4HICa4,37534
568
571
  sglang/srt/layers/quantization/compressed_tensors/__init__.py,sha256=zMpLnf9GiRhV-jg1H2UiZ6OUMSKMcmLtrr2A4XjhuUs,217
@@ -758,26 +761,26 @@ sglang/srt/managers/configure_logging.py,sha256=8sNXZ2z9pBWOwn-X3wyz013Ob8Nbm1zD
758
761
  sglang/srt/managers/data_parallel_controller.py,sha256=TAJErsNQUomHFnekrPceMZbN95PfFadticjSup3JiLY,19236
759
762
  sglang/srt/managers/detokenizer_manager.py,sha256=K6TLeBtDb8geRVKvTlFqZJN-26saYJxxLlRspvEOFe8,13080
760
763
  sglang/srt/managers/disagg_service.py,sha256=7VyRva5oniAPs8G-DYg2fv-mdjSxk9cLZPzl_TmB_2Q,1588
761
- sglang/srt/managers/io_struct.py,sha256=BEx_N4PwZnLoTBdvMp_zHz29btJvUevTM7S5gqVeB5k,50778
764
+ sglang/srt/managers/io_struct.py,sha256=2RMpLqiZbI27kR1p9yJKZT1u1sA0NZWukfU4U0WM6gU,50932
762
765
  sglang/srt/managers/mm_utils.py,sha256=xJ7Pbk1ZxIyodLyeNv_t0JeSKCqrP7u5hpMcC-0Rpzc,31283
763
- sglang/srt/managers/multi_tokenizer_mixin.py,sha256=nz_G1sLW-bN8Aa7Vy4ZUM7voaCPf7oMTe_M76H7vhyE,21050
766
+ sglang/srt/managers/multi_tokenizer_mixin.py,sha256=dELw8-Ka4-gY6ek5CSVW0DLK8Kq6jJDO6qMTNm5bOxk,21545
764
767
  sglang/srt/managers/multimodal_processor.py,sha256=0mLkwu6CGRQtt3G2T1tS3PSsh6dpyivV-vAfIHfcMbQ,1764
765
768
  sglang/srt/managers/overlap_utils.py,sha256=dDz1zUBlJ9Ohw4TPHgOxnuh6LPCsN037c14XIw3E-J8,5050
766
769
  sglang/srt/managers/schedule_batch.py,sha256=0oWPNVtdgoX2bFHOc1RN_1IYyoIE1yKwCImll65dAbQ,72622
767
770
  sglang/srt/managers/schedule_policy.py,sha256=BFWoHG3m-lkeVvOkLGoMeEbRplq4vF4thsjv-P8MG84,28818
768
- sglang/srt/managers/scheduler.py,sha256=BQ3_X5uG2a9La955Mw8OGTrhhlgKkhe3nDUE006YVnU,114768
771
+ sglang/srt/managers/scheduler.py,sha256=aJnk_T9_ZNHCMhRs0cJqfkTH7EbW_B7OhXK2WV20UFE,115088
769
772
  sglang/srt/managers/scheduler_input_blocker.py,sha256=SYZ91JNTHtqiBHUpkk_MboAiBFyl5U7ardLcYDAQ0OU,3689
770
- sglang/srt/managers/scheduler_metrics_mixin.py,sha256=duFJs6DlSFzV_1c7R2ESNGFEkGekxgDziJns4ttK-0Y,14962
773
+ sglang/srt/managers/scheduler_metrics_mixin.py,sha256=OJKCTqNX5gxragq_774EeTSrNEPYp3N7udhE51pukFg,15337
771
774
  sglang/srt/managers/scheduler_output_processor_mixin.py,sha256=n6zvLqu-TpTaZuWfYxz7ivCBPP3Z7okTOOshTq0d4CQ,42449
772
775
  sglang/srt/managers/scheduler_pp_mixin.py,sha256=oUl5oxbFPd2gxqn4JXk-Bn-uLrmJZ6_Km5SMpSe9Gtk,16433
773
- sglang/srt/managers/scheduler_profiler_mixin.py,sha256=LKgAaQ9kNdjK7J6xSwQQzo2q_pViWnlGIvTpe5_yLLQ,13505
776
+ sglang/srt/managers/scheduler_profiler_mixin.py,sha256=4yhFzHO8ir4TbnYluDFYvCl8RgH0L-AihdIYuMLtBcw,13453
774
777
  sglang/srt/managers/scheduler_recv_skipper.py,sha256=8rVQCBjn9f26Th4XbeUS3fEsvo1GI029Me28wMjcKRY,1103
775
778
  sglang/srt/managers/scheduler_runtime_checker_mixin.py,sha256=54z5p36M2BgTQYrEz30aAtQVXWCBI9VHBjgzOf19QPo,8521
776
779
  sglang/srt/managers/scheduler_update_weights_mixin.py,sha256=AuOKrV943inXe5s4cPb4_BQiNAFwkiQGlpaBS-aal-M,6957
777
780
  sglang/srt/managers/session_controller.py,sha256=FGADRGSkRmS76o_BQ2fivpgw0Q5Q-K0Ws3aezH41YSc,6041
778
781
  sglang/srt/managers/template_manager.py,sha256=M4EshVv1OhKxUAGQPP4OntRkSkUVvG93457xsYfWnQk,11968
779
782
  sglang/srt/managers/tokenizer_communicator_mixin.py,sha256=CHry04ONVx3YMGNN5KtNJFaafxnw4LfXHceMR1q2Nwc,26088
780
- sglang/srt/managers/tokenizer_manager.py,sha256=RcK-EvZJj1iNDlhD0WPK7FxxM1cAfKlidnZeJUkpSJ8,90837
783
+ sglang/srt/managers/tokenizer_manager.py,sha256=UM54r6Ox-dfTOesahpm6QmyXtvUTDCJyTRK4n903MFo,90468
781
784
  sglang/srt/managers/tp_worker.py,sha256=qENe8zAagoTs50RJmCJi2il9JsQtuQqBHII6XBBPLJg,16212
782
785
  sglang/srt/managers/utils.py,sha256=HRPecRiWLHTX6QbkyYRY-tjlpJEb9N1k0fSJsqBxJl8,7324
783
786
  sglang/srt/mem_cache/allocator.py,sha256=TEAkK32vyYz7wow5bpZLlrzb3KHVXtw9h1KtGWg6kIo,18246
@@ -787,10 +790,10 @@ sglang/srt/mem_cache/chunk_cache.py,sha256=u4EIGuWNonVoCItF2wrKnXzh2OtoDM04Xhoff
787
790
  sglang/srt/mem_cache/common.py,sha256=PEFKzoawIIPRVboyInPKWG56qht-inp34vcj6q_fsfg,16283
788
791
  sglang/srt/mem_cache/evict_policy.py,sha256=FVI4QsFJoRR1CaxE9jpX4OzBPt4w9ftfM2Ndu4BSfhA,1012
789
792
  sglang/srt/mem_cache/flush_cache.py,sha256=GYcxmNXh4hsMpFfNOuCTpKilW7guZwTtAg_usVeM3J0,979
790
- sglang/srt/mem_cache/hicache_storage.py,sha256=t1Dl7OLamm4sPa93sKNIIjSHtX1Rom3D8G9n9GXTipw,8073
793
+ sglang/srt/mem_cache/hicache_storage.py,sha256=lvRaZesRhHQopBoNBbWlXxs4IbRwcWnpEP51MjowtWs,8366
791
794
  sglang/srt/mem_cache/hiradix_cache.py,sha256=BK52hyQjPoXKzn_PDn_LRk_3a0AjWBie1Xk4yAO1B3s,35984
792
795
  sglang/srt/mem_cache/mamba_radix_cache.py,sha256=mpKTxCzA1_u4eoHk0SvXPPNVVG_JivEAb44miY3aNuw,38678
793
- sglang/srt/mem_cache/memory_pool.py,sha256=6zpF492cuG4sEXTC41liHi5wSN_dQnDt3sLulRDOPQA,64880
796
+ sglang/srt/mem_cache/memory_pool.py,sha256=v0zHcqaOp1cUX2jNaNJOR5lnk0sdj7S4aViPjewpXJs,67163
794
797
  sglang/srt/mem_cache/memory_pool_host.py,sha256=IBUKHCmU_Fu8d22_V5ssYp4Ff97w3EaMSpyFZvPD0Go,27634
795
798
  sglang/srt/mem_cache/multimodal_cache.py,sha256=23d34nWEDtgiOM6fqAhmkQ8-OHnrNR1-n8Ert0K0n3U,2147
796
799
  sglang/srt/mem_cache/radix_cache.py,sha256=7NQHMUKjdKaAGMFdx1z0pCPBPvwux9KcqymFRxFUAY4,28181
@@ -806,7 +809,7 @@ sglang/srt/mem_cache/storage/eic/test_unit.py,sha256=PfNPpL624t23tyVgtmS5F1pGiuW
806
809
  sglang/srt/mem_cache/storage/hf3fs/hf3fs_client.py,sha256=3xG0dV5JmnbIJ8kB1_lk8jAeqshOcU7tXES27ldyb8I,5228
807
810
  sglang/srt/mem_cache/storage/hf3fs/hf3fs_usrbio_client.py,sha256=6oH4v_WF_pKH4FMSr252v6QPhBCnRHztHqzuS8j6_QI,5323
808
811
  sglang/srt/mem_cache/storage/hf3fs/hf3fs_utils.cpp,sha256=dDYPtxmL6OFhEyv_GuTgzkTDpBjcD0EK8kphnn7eaGc,1133
809
- sglang/srt/mem_cache/storage/hf3fs/mini_3fs_metadata_server.py,sha256=lJ9Jp2kOgQQaUihxlO9l-W8fYfOMa1h1y0WAtzzFGLM,17850
812
+ sglang/srt/mem_cache/storage/hf3fs/mini_3fs_metadata_server.py,sha256=IKIm5uQ9XyWx19YflkYZvBSjbVpYbMpeg3Mg7wYMwNM,17880
810
813
  sglang/srt/mem_cache/storage/hf3fs/storage_hf3fs.py,sha256=MI-x2979lvJL8d4aJluTCx6DofIe0tkLTNbrAJbV0FI,21514
811
814
  sglang/srt/mem_cache/storage/hf3fs/test_hf3fs_utils.py,sha256=g2h0Woa2CK39pRTigHCVR_hq095dTaC70lCIAIs9THM,1089
812
815
  sglang/srt/mem_cache/storage/lmcache/lmc_radix_cache.py,sha256=pd5NC37FORcF-yHmOjbARZGGPcpc-Xd3iu3KGjgYnc4,10009
@@ -822,10 +825,10 @@ sglang/srt/metrics/startup_func_log_and_timer.py,sha256=PRVg3Z2d5GBMFifZXR-VhzGc
822
825
  sglang/srt/metrics/utils.py,sha256=MGb3quRI39n4tgJS1e0UHI5TBX3D0MwsgiZFMW2EsSQ,1903
823
826
  sglang/srt/model_executor/cpu_graph_runner.py,sha256=ypp5yIW2OhRX-Xmido5mWuzEFpd-ohlq2c2wEuSW71I,23415
824
827
  sglang/srt/model_executor/cuda_graph_runner.py,sha256=hz7y3q5J7e8lnDhDPxiJIGvtGG7Ws0Og8ztbaZ_mqXw,35580
825
- sglang/srt/model_executor/forward_batch_info.py,sha256=9SsVdDZfGIF-HFm3ulEACjhj95tHQhCzVfe3vzUqZV4,42612
826
- sglang/srt/model_executor/model_runner.py,sha256=ocjmkK3yKz_z_EAd6sgOZ8xd8qzmpw9f8G1004Ew-L4,100592
828
+ sglang/srt/model_executor/forward_batch_info.py,sha256=wLkiWTAMgq-4xQFvimvRnQK9eDQKS0UurtooqueBbx4,44306
829
+ sglang/srt/model_executor/model_runner.py,sha256=82SAlFp14XbUocqGxcEkH4ToGL10Rh0Oz1YQtJ9R0rc,93938
827
830
  sglang/srt/model_executor/npu_graph_runner.py,sha256=B1YQla4jW9PiciBBisKg-qoC-vmnldRr8ut_aSmUB-E,3664
828
- sglang/srt/model_executor/piecewise_cuda_graph_runner.py,sha256=-Kb1XILyAxRTbHgT2SzV_BLW-L161eg7vgPiOF1Wrpw,21992
831
+ sglang/srt/model_executor/piecewise_cuda_graph_runner.py,sha256=yYOuLLI8hscmpnlxEKrrIpGnirMIncoy0dHBWi7XcB8,22684
829
832
  sglang/srt/model_loader/__init__.py,sha256=Y4gehllriF0JNjly4rGhQPSkUrA9u9Lr-WbfZfBIs6k,1034
830
833
  sglang/srt/model_loader/loader.py,sha256=73Pd71im3E56u9SCZmrMgeq5ZJxadeb-ENIIQW4LW9I,80809
831
834
  sglang/srt/model_loader/remote_instance_weight_loader_utils.py,sha256=_HnQD1Ab-Wv9oATOmwJe6aQaQD_Gs_yG9EsDCGJQWfs,2881
@@ -845,7 +848,7 @@ sglang/srt/models/deepseek.py,sha256=M7nyHcAbTIs8vc1g6u00oy22-pp704Xp4T3clBzu4xM
845
848
  sglang/srt/models/deepseek_janus_pro.py,sha256=td8xGs6ARfJ8AQCYwUhMOZoWigrAs7m3trF5-kXCqik,70418
846
849
  sglang/srt/models/deepseek_nextn.py,sha256=B-Xk9mh7op-Gx42yJKV353yzWzL68iwwR08r6jbNZ6A,6710
847
850
  sglang/srt/models/deepseek_ocr.py,sha256=WAPLXeg3S1UB3x3iP-tiandHk5AEnCUMeMs0ak302Gg,52416
848
- sglang/srt/models/deepseek_v2.py,sha256=EzPUoRGCcBoJIbZ9s_XztIVikp7FSNsTv42qUBzHoNQ,139536
851
+ sglang/srt/models/deepseek_v2.py,sha256=XZ2oYlX5GQ3dsRKlfr4g6RQMnXMf02S9ihszbn8ph9M,143886
849
852
  sglang/srt/models/deepseek_vl2.py,sha256=7X3gI4DE7guUtNJvMLf06jO8MUHKa2Aan8evZg5hsXc,13061
850
853
  sglang/srt/models/dots_ocr.py,sha256=sWkFsENjX5b_CecLCqXjepsr6iyyCbNTmjZbRfoB4ek,6683
851
854
  sglang/srt/models/dots_vlm.py,sha256=3uLSXO7W8UPKU7a3ixkC_gwSVDGYecCHK0kZAoD6vNs,7192
@@ -863,10 +866,10 @@ sglang/srt/models/gemma3n_audio.py,sha256=isgKfjA5UieYawxU6medL2ssXlzYPqAbagDBnL
863
866
  sglang/srt/models/gemma3n_causal.py,sha256=kBDlpSWAg6ZDmUPe08Q7sj5CbdVD_0h07zwJw8sKu7I,36335
864
867
  sglang/srt/models/gemma3n_mm.py,sha256=Il5LHjZdbHEXueUVdBp5lpSJHt56W7fpfPHD0Y7RED4,20301
865
868
  sglang/srt/models/glm4.py,sha256=dijzVTTgg8zyJ3gga95MKY0WwqwnuAaf-VIV93OFAmc,11433
866
- sglang/srt/models/glm4_moe.py,sha256=plEh-b5C2az6MMNF5hotXIusJAEdXOZy7KTRd4EIRLg,41209
867
- sglang/srt/models/glm4_moe_nextn.py,sha256=fWuDWY8nwnHBXpdEYkhyMcBkUByIrBZvEMdLEtsTVi8,5947
869
+ sglang/srt/models/glm4_moe.py,sha256=x8Y5gD4GMr6wvx3tzllMQ9dz7cWcq18rII986f_Bke8,38217
870
+ sglang/srt/models/glm4_moe_nextn.py,sha256=H-z8CKc1v_9oR6PzKE7aX6L1PHG8hHNrgyVgFO1ZZWE,5601
868
871
  sglang/srt/models/glm4v.py,sha256=LwiFQxYm2ksmaePeO57i5d4YGQjiQX52e-Dsjyh_P7I,23834
869
- sglang/srt/models/glm4v_moe.py,sha256=MxuF0pFf2frKPCp4A_2YmrXx_uvZzOFdA4hVJFbLY6E,17375
872
+ sglang/srt/models/glm4v_moe.py,sha256=px1wUjDCU7Ro8GnxpjkGh8yQS0Tr_IjYmV2C8iPqhfM,9594
870
873
  sglang/srt/models/gpt2.py,sha256=kclhxEs8oJk1KCyhmAqo7rZqecVGGHYkc-a1WZi3aIk,9841
871
874
  sglang/srt/models/gpt_bigcode.py,sha256=1D6bi8Zu760gCRZkvdLHFcg8kCkY35ARwQYaMDtYhl4,10307
872
875
  sglang/srt/models/gpt_oss.py,sha256=K9g2c9xTE2eM74isijM-KSvGPHt6Cjgjl8L8EzBTLmM,43711
@@ -898,6 +901,7 @@ sglang/srt/models/minicpm.py,sha256=CzBJyZtfMpp8jvlEl29DHI7HLVq-CxuqP1UHwxIbaUI,
898
901
  sglang/srt/models/minicpm3.py,sha256=Cflu4Tb2hxpjapRBZ5n4kX8a1nnFwffK-M8uHPRUra4,19276
899
902
  sglang/srt/models/minicpmo.py,sha256=1bNtbJM5wbMjV4ax8gesVsYVbMz4ozaIHAvvi8_d0iE,76175
900
903
  sglang/srt/models/minicpmv.py,sha256=_CnCR2y3RaYxhONAKFpBIuPQBrqn9Od4o7QnJw8CLR4,35884
904
+ sglang/srt/models/minimax_m2.py,sha256=cmdTbRl1VIBDb27t4glkhVwSy-2c3SikIcWociu5aD4,33995
901
905
  sglang/srt/models/mistral.py,sha256=ni7PppA_5X4ivTnIps3yoEaMEL-G6Gaf9b5hGC1vU5Q,3475
902
906
  sglang/srt/models/mixtral.py,sha256=bZdsTw4A3B-MIHSR8U26mBv3sLYkawVM4V1VXEyBrmE,16992
903
907
  sglang/srt/models/mixtral_quant.py,sha256=UUIq7lpUonD9IoGePyl59oJYEcVwT9wUXvtVp5tjQ9Y,15406
@@ -905,6 +909,8 @@ sglang/srt/models/mllama.py,sha256=mMhDrLd1jJ-4lwMMHKRC5Uzcs3kWdzRJJzdjhQN4LOw,3
905
909
  sglang/srt/models/mllama4.py,sha256=z6YKfmHu0lJ-oyALZNlL9-EcHzFvNgkxWU_mURyS7z4,36694
906
910
  sglang/srt/models/nemotron_h.py,sha256=clbTirOxve6yefRaf2eE0dT0IqhPDfknOtnsAEsnZOM,17904
907
911
  sglang/srt/models/nemotron_nas.py,sha256=CoSAKqlbej4Xe30uY4w76iASBqeuJf8-imisDK00zEU,15964
912
+ sglang/srt/models/nvila.py,sha256=2IVELp0pFTnN8Yz1GVns03aoLsgb8_7X_x5gQd02Vqg,12077
913
+ sglang/srt/models/nvila_lite.py,sha256=Cl7wey1bXUyyaDjntCytS4Z-cRVljK4WJU_Z-exjD1s,6206
908
914
  sglang/srt/models/olmo.py,sha256=7-q_fA6XXdG7kPUjpUzYkzMUWJobuSjhqjYw9xSUs_c,12671
909
915
  sglang/srt/models/olmo2.py,sha256=zprucQEogxPV38E_IU0edcTYP-d-dqLVeTmt2kRLznA,15448
910
916
  sglang/srt/models/olmoe.py,sha256=zryYUQEhEdhd6xcR_HyLV7gHCcKt-HWHeEeIUqmhmcc,16100
@@ -919,7 +925,7 @@ sglang/srt/models/phimoe.py,sha256=cZQIGjEvArPDiJzC3uKYje-o48QZC699P8TTLwfVIas,1
919
925
  sglang/srt/models/pixtral.py,sha256=H378jvdhwjgdAuUszhCe5tmcEPYvw2YPhg_d8QrjLZE,16776
920
926
  sglang/srt/models/points_v15_chat.py,sha256=HV_GRgLTcetKh0B2agJry02N_atcWI5NPjjQELarUGk,6415
921
927
  sglang/srt/models/qwen.py,sha256=_X1mUt_MczEE2jFK7rfGyRRtpd4U93jdD1SVpCTNsns,11856
922
- sglang/srt/models/qwen2.py,sha256=kHNZCtT0jnQXC2aJN7Bp1DzaEzKWuhUAGL3hAmt8OU8,23598
928
+ sglang/srt/models/qwen2.py,sha256=ryMQxd10i41JWYTzxXPZMBu68XK_7wpHRQg7_fmlmy4,24361
923
929
  sglang/srt/models/qwen2_5_vl.py,sha256=X7Hh-75gsoGqaK2iJg7eBUFR_8qwJRLhhkii3yxc-KA,25084
924
930
  sglang/srt/models/qwen2_audio.py,sha256=Hr4j9W-q23XjQUX4kk1NxUGA-EQkj8AKDqKVK741TjI,7097
925
931
  sglang/srt/models/qwen2_classification.py,sha256=dGrMm4ebd30_lBhHOhaV57ig2iOTx3nqB4GEzsrRIM8,2747
@@ -927,9 +933,9 @@ sglang/srt/models/qwen2_eagle.py,sha256=6spFg6JYQGeUXLv2Q5eMkVzZvnqGyvW6SdVBtFMx
927
933
  sglang/srt/models/qwen2_moe.py,sha256=-pkURmqiLazr7oq11-3hQCFKrdj1crx30Z7iK7DBs90,30920
928
934
  sglang/srt/models/qwen2_rm.py,sha256=-mQXDEv11p-I1HXgYLTtY6ROem6UYorO958WsDrzsgs,2837
929
935
  sglang/srt/models/qwen2_vl.py,sha256=xV8s6kgyjZ37SqLi9nF9J6n3gq9piUmlXOe2PVPQqjI,21488
930
- sglang/srt/models/qwen3.py,sha256=2OSKkk-AdIpg6ZnNcQ9tqZLlF-VH-QxncY1J_g8k-bc,19637
936
+ sglang/srt/models/qwen3.py,sha256=XWFC8O9WCP6oRkwUGMG5s87lGVyGa3pRQx8YwdTQzPI,20617
931
937
  sglang/srt/models/qwen3_classification.py,sha256=bdjAylXJCjXKjAho74nmtIMpEG0Af98N-aZQ-pKKMY0,3262
932
- sglang/srt/models/qwen3_moe.py,sha256=W27Yaut4mNOutT91D31MxaLfAPXJF9jItTmANkFArCM,33363
938
+ sglang/srt/models/qwen3_moe.py,sha256=jm5ntkmhdkTujJEwmIRLnaHgAEC5f4pmwMASU_Ru9-c,33211
933
939
  sglang/srt/models/qwen3_next.py,sha256=hbIiLXcPBNa41lRnqZqdXa7Q8FDYX9JlaviXIZN_BEk,37279
934
940
  sglang/srt/models/qwen3_next_mtp.py,sha256=nua9MgSa0_2Dz2Zju0chk6VXGDndBqr-1xMQ-_OirTU,4387
935
941
  sglang/srt/models/qwen3_omni_moe.py,sha256=X5dB2zB1LAAD6_baK84y6MGvEm5ArgcFDmarUyoaS9c,25444
@@ -946,19 +952,18 @@ sglang/srt/models/step3_vl.py,sha256=QeU7RQ5YnU6FcAi4c-ICVABpM1PJ5E65w5XE3UJmIbE
946
952
  sglang/srt/models/torch_native_llama.py,sha256=3xf6CzCiizJ8i94GIChpOLq9q64Xa519RtuEspPTZQk,18501
947
953
  sglang/srt/models/transformers.py,sha256=laA2h39MPeiAWKv4DEg0ydre-1pyXWFSRga-nwy1HUk,10244
948
954
  sglang/srt/models/utils.py,sha256=yB1rHC9Xk6hTQ59Fy2ExdrtntuSn6vkm-idf3CFrYP4,2032
949
- sglang/srt/models/vila.py,sha256=3NiRHWOqXnCRjXmswAldsNtiE5zRILbScEsbhUzLZF4,9846
950
955
  sglang/srt/models/xverse.py,sha256=DsNVI9JpzN4jj0Ry6aTrj7r-xq5YLOoDX2kH4YLJA-I,14035
951
956
  sglang/srt/models/xverse_moe.py,sha256=nBtG_PAK8wcp1tW2l2Zby2oEOmtWAYzH5COH-_N5IAM,17072
952
957
  sglang/srt/models/yivl.py,sha256=oToK7-u5IGO7xwpJIQ7VtudlK6-zPqJX4bt6_wv0SH8,4850
953
958
  sglang/srt/multimodal/mm_utils.py,sha256=6bV1_a7Iet9W0y3qdd0E-hFM78zalIzNZCYbLzJX2y8,12640
954
- sglang/srt/multimodal/processors/base_processor.py,sha256=RAJYoUI8XGTa97rJKz72V0UzTMzfpKvU3206GjRJ0ZQ,25053
959
+ sglang/srt/multimodal/processors/base_processor.py,sha256=h914TZNxWT8-wT0bQRXUCYE4wBTylJs9ip36nFNz_KI,25096
955
960
  sglang/srt/multimodal/processors/clip.py,sha256=5nXZuQYbyf-5mlqPwjhQrlWqxvswImWZQXivChsiHfQ,1057
956
961
  sglang/srt/multimodal/processors/deepseek_ocr.py,sha256=ZuP-zHNjPV3-lb6NkmNIitwIiXtNopNIwOLPttLjBYI,1234
957
962
  sglang/srt/multimodal/processors/deepseek_vl_v2.py,sha256=nKqWQ9PmtY66cMx0YhIHGPaGIW-VyPKt_KeRqFLU60c,2479
958
963
  sglang/srt/multimodal/processors/dots_vlm.py,sha256=azazFc_lFj40NJKWf1X1MGgJ5FXgv2RlgVS-R6IhFdk,3521
959
964
  sglang/srt/multimodal/processors/gemma3.py,sha256=7aD6cR60iSC_MqjzdCDMAgtrb_cmy9YJyqLgVRClBT8,1986
960
965
  sglang/srt/multimodal/processors/gemma3n.py,sha256=mtmvBasOMxb3Y2NLZR02nMYX30RLUXhDYJ5uVOElr10,2776
961
- sglang/srt/multimodal/processors/glm4v.py,sha256=EPPILSirXexpRkWZfIhxWGgWKZGk1q6eENZS5gWyfjw,4899
966
+ sglang/srt/multimodal/processors/glm4v.py,sha256=Q9ifVo4DMsxsysta2cqUGwHGdx3pT5fS_jVB31pUfP8,4883
962
967
  sglang/srt/multimodal/processors/internvl.py,sha256=vvOlWmJ4AzbXnDxHED1NkRgHQfOnZlmEaWMA3-1_2cQ,9765
963
968
  sglang/srt/multimodal/processors/janus_pro.py,sha256=nd1v0--5733pOwWTpArnOHCfh4aHHVBUOJPOhk9rLd4,1395
964
969
  sglang/srt/multimodal/processors/kimi_vl.py,sha256=5i8KmGxnnDtQc7XqUBNyanAfGxhxj8iRFBFONHmpiFg,1565
@@ -966,19 +971,19 @@ sglang/srt/multimodal/processors/llava.py,sha256=-YtDc_7TsMWmwKkD4KJZW2Y0jPFlZtb
966
971
  sglang/srt/multimodal/processors/minicpm.py,sha256=ysJlUaxcBcWjKliz5VmXKVv0ec4QWRHXZk4ga-hXVf0,5354
967
972
  sglang/srt/multimodal/processors/mlama.py,sha256=FgPm2JQzfPFDcGYDm0mqfDfO_eJKy-NiVgF-vId6w8Y,1233
968
973
  sglang/srt/multimodal/processors/mllama4.py,sha256=pYzqbuV9Hb5RMYNLRabTMIMTwL8C5SCToZdhSg403go,1653
974
+ sglang/srt/multimodal/processors/nvila.py,sha256=MqpZmj2fO9U8DQSFGVkrUYqK7HBrhx5nIlMCdrZShfY,2524
969
975
  sglang/srt/multimodal/processors/phi4mm.py,sha256=8Co-UPT8Am2P5dfW8bjZcy-pVAPqFXW7hbK8v23NMiA,3781
970
976
  sglang/srt/multimodal/processors/pixtral.py,sha256=Lx5Z-9NkovLDTHlRBznHxGn4r2XhDz8am2XpOskOVQY,3203
971
- sglang/srt/multimodal/processors/points_v15_chat.py,sha256=n1lwAnAYk1xPhnZRpAtDDpyP8N7NlZGwX7Pdun9Kv50,1581
977
+ sglang/srt/multimodal/processors/points_v15_chat.py,sha256=bd_gpgkpcMcl6gxugqfQSJwyr50szjKOAHrsVrBnuPg,1575
972
978
  sglang/srt/multimodal/processors/qwen_audio.py,sha256=xkIFrHepF8Ok6MB-1OwVz1BmzPmEPgUe8lIb0azO2Bc,2411
973
979
  sglang/srt/multimodal/processors/qwen_vl.py,sha256=h26WSDFJiXvyCmUxNwetjgDANxXoQGxocdd_uudC2Vw,13537
974
980
  sglang/srt/multimodal/processors/sarashina2_vision.py,sha256=E0KSOw_yzc7prHkQfMHS_DzOcYL1GZJ77NopVkd_V5M,3024
975
981
  sglang/srt/multimodal/processors/step3_vl.py,sha256=2zNf1gT-fSrA88-cvkr6xJDE0sEWFKdBDUWsMiFx_uY,18330
976
- sglang/srt/multimodal/processors/vila.py,sha256=vWgV1lTdjiFiTR8w-7fC66-L_tpOOD59c-c9NljGelE,2192
977
982
  sglang/srt/parser/code_completion_parser.py,sha256=KFa95OU0TeVjJkOqIgS4xV3kaJ5dFWOmAAgISyc1oEc,3803
978
983
  sglang/srt/parser/conversation.py,sha256=r5Fp4BGNjGeuvBw7dAUt-aUl3ExsTSG00Gq8dS8_hj0,40089
979
984
  sglang/srt/parser/harmony_parser.py,sha256=YweG4azWm5jmzYGaAHEXSaORpgWctPpSGQk_jp5H-CE,23227
980
985
  sglang/srt/parser/jinja_template_utils.py,sha256=_rtLpriMmodo-tBD8B9ifu3BsZFdaQQCDPRUqF26pIg,8006
981
- sglang/srt/parser/reasoning_parser.py,sha256=Q5yC-Giug7fA0W5d1BarTKUWWFO5QUwtnonMeuDziOw,11149
986
+ sglang/srt/parser/reasoning_parser.py,sha256=sGHGN8UUYjv6qW3HtHlgGGwf_5NRzlBF1jvCEiG-5vI,12180
982
987
  sglang/srt/sampling/custom_logit_processor.py,sha256=phIOI0ttJHQ_yCZhnqD5qNs98QG0gdY9evbXkgS3544,4272
983
988
  sglang/srt/sampling/sampling_batch_info.py,sha256=xlkEs3zgrwZCNBs69JHL3og9-jJnFbDD3_RLJJ-M36U,15544
984
989
  sglang/srt/sampling/sampling_params.py,sha256=ULhZRhA9C1oK34T3cbwqaODV3iMX8HL1VOlo_gewzZw,9193
@@ -1012,8 +1017,8 @@ sglang/srt/tracing/trace.py,sha256=5SKy8XA4KLaTcBO6ZJvJSP_IYK5--2RJN0Q6O6Vg10g,1
1012
1017
  sglang/srt/utils/__init__.py,sha256=zuoHoZnKrciwFy11a6p5Ua8mYU67QUI_09L0SfEjpeo,102
1013
1018
  sglang/srt/utils/aio_rwlock.py,sha256=6LYtOdeTUY3hkfa1dmYkgsaF2ttrwIF3hUWz2AZ2fqw,2970
1014
1019
  sglang/srt/utils/bench_utils.py,sha256=0xXUeDk61RynxbOV0P_okb-5rLPpc-ZqfCGx3W35K4I,4421
1015
- sglang/srt/utils/common.py,sha256=uSu4JABt4oSwJiLFSaqLgkMkw8QDXn5ydrkslOUXb48,113357
1016
- sglang/srt/utils/hf_transformers_utils.py,sha256=x5HyF75geb7vskOU9FaHarxK_u2MprUZm1SrmgMQX0E,17696
1020
+ sglang/srt/utils/common.py,sha256=sAN5cre5l1b8IuUSQSzXVOOu2swU8k1ZEEVxWXbPBDw,114705
1021
+ sglang/srt/utils/hf_transformers_utils.py,sha256=E-K0S1ykwqxFNLmXCSmQ6taFYlbncN0EuvS1EPBcvmY,17793
1017
1022
  sglang/srt/utils/host_shared_memory.py,sha256=0tO3qMlbmEIs11XvdI7BB0AtH4Z5hm9vWEkEyau4vlM,2264
1018
1023
  sglang/srt/utils/offloader.py,sha256=mKN1Vd0ftr2mjcVIXKCZnc51pcQ6bfYvhqFvdAUyRC4,18771
1019
1024
  sglang/srt/utils/patch_torch.py,sha256=yaVs6YNm63rFYBw-v59usYR3cmb_qX6F69L5dMfQCxg,3307
@@ -1048,8 +1053,8 @@ sglang/test/test_custom_ops.py,sha256=PenQ8zM1wj5xwiVEPVzD37pO-x90aOfFMpCRZenaKs
1048
1053
  sglang/test/test_cutlass_moe.py,sha256=0kzalShZCSSbV1JLKv77mx8bXgK2wvskTuPGqK_qNnQ,10051
1049
1054
  sglang/test/test_cutlass_w4a8_moe.py,sha256=iQIZ1K43emzqI9WVKlb2fplLPcvlpm3D7qCNK-wJfa4,8924
1050
1055
  sglang/test/test_deepep_utils.py,sha256=749ysTBGNzh6rYUCJhhZBtZpeD15eWTeNHYCytcvZtc,7448
1051
- sglang/test/test_deterministic.py,sha256=ISh_2dnEgRI1Ku7lxmDKs7mwNgLrBEhKnLnvW9Uei98,15689
1052
- sglang/test/test_deterministic_utils.py,sha256=vVtwq_NjH9GzSkRUn4mep-IIvgAXtw-5l6iKjYDP8SA,2133
1056
+ sglang/test/test_deterministic.py,sha256=94QAh_y98SLjbroZ837qQ4qv2LypvbLmgX60WD9lu24,23593
1057
+ sglang/test/test_deterministic_utils.py,sha256=iGP6d7JRpk49u4l8IXI-Ix8-pfDliTt0TwD1NvIg_Y0,2212
1053
1058
  sglang/test/test_disaggregation_utils.py,sha256=k_V_vw6qCEw3iZyUeujozMBkUgGRfCWxkLyCb9ktIbk,5588
1054
1059
  sglang/test/test_dynamic_grad_mode.py,sha256=L76yUCuk_ymNpXD2CmO8r2GiGjIvD_gtTsuFDs2NolI,1638
1055
1060
  sglang/test/test_fp4_moe.py,sha256=wvHbGMH1UBr_XVWYgX57Y2bLy9h2DPQH10_Hmf2q6iw,22436
@@ -1067,8 +1072,8 @@ sglang/test/longbench_v2/__init__.py,sha256=ZcOIPSyqbDI_tzB-qltXF67-4uMMPwCkkiWD
1067
1072
  sglang/test/longbench_v2/test_longbench_v2_eval.py,sha256=NI_Om4ODw5utUNsYjrj6nueebI4U5u4N2PKBtT5O27k,7352
1068
1073
  sglang/test/longbench_v2/validate_longbench_v2.py,sha256=mJa5Lh8XiSTXKrf5qopKuAfspSVbhoacnCkz6u4lYFQ,11635
1069
1074
  sglang/test/longbench_v2/validate_longbench_v2_standalone.py,sha256=gr0zif2c680hSyIHDVJ_NHYcrMquM3fpJ26mBtbm7zs,10909
1070
- sglang-0.5.4.dist-info/licenses/LICENSE,sha256=FJXh51fvTQklojUFY89XVLsjxRcBqOxPs8XNy-2uZ0c,11346
1071
- sglang-0.5.4.dist-info/METADATA,sha256=M8BtBa6y1fGn0YOx6BJttNdVgtLNOPMbLM3t58ZNCy0,25668
1072
- sglang-0.5.4.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
1073
- sglang-0.5.4.dist-info/top_level.txt,sha256=yxhh3pYQkcnA7v3Bg889C2jZhvtJdEincysO7PEB09M,7
1074
- sglang-0.5.4.dist-info/RECORD,,
1075
+ sglang-0.5.4.post1.dist-info/licenses/LICENSE,sha256=FJXh51fvTQklojUFY89XVLsjxRcBqOxPs8XNy-2uZ0c,11346
1076
+ sglang-0.5.4.post1.dist-info/METADATA,sha256=NblJNZ18C87lGtQ0Ofds9W374PcXOVZ_4lljf_zeWCU,25916
1077
+ sglang-0.5.4.post1.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
1078
+ sglang-0.5.4.post1.dist-info/top_level.txt,sha256=yxhh3pYQkcnA7v3Bg889C2jZhvtJdEincysO7PEB09M,7
1079
+ sglang-0.5.4.post1.dist-info/RECORD,,