sglang 0.4.9.post2__py3-none-any.whl → 0.4.9.post4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (200) hide show
  1. sglang/bench_one_batch.py +2 -1
  2. sglang/eval/loogle_eval.py +7 -0
  3. sglang/srt/_custom_ops.py +29 -1
  4. sglang/srt/configs/deepseekvl2.py +11 -2
  5. sglang/srt/configs/internvl.py +3 -0
  6. sglang/srt/configs/janus_pro.py +3 -0
  7. sglang/srt/configs/model_config.py +10 -8
  8. sglang/srt/configs/update_config.py +3 -1
  9. sglang/srt/conversation.py +2 -1
  10. sglang/srt/custom_op.py +5 -2
  11. sglang/srt/disaggregation/common/conn.py +34 -6
  12. sglang/srt/disaggregation/decode.py +9 -1
  13. sglang/srt/disaggregation/mini_lb.py +3 -2
  14. sglang/srt/disaggregation/mooncake/conn.py +93 -76
  15. sglang/srt/disaggregation/mooncake/transfer_engine.py +4 -2
  16. sglang/srt/disaggregation/nixl/conn.py +17 -13
  17. sglang/srt/distributed/device_communicators/custom_all_reduce.py +3 -91
  18. sglang/srt/distributed/device_communicators/custom_all_reduce_utils.py +96 -1
  19. sglang/srt/distributed/device_communicators/quick_all_reduce.py +273 -0
  20. sglang/srt/distributed/device_communicators/shm_broadcast.py +12 -5
  21. sglang/srt/distributed/parallel_state.py +103 -15
  22. sglang/srt/entrypoints/engine.py +31 -33
  23. sglang/srt/entrypoints/http_server.py +20 -32
  24. sglang/srt/entrypoints/openai/protocol.py +3 -3
  25. sglang/srt/entrypoints/openai/serving_chat.py +48 -6
  26. sglang/srt/eplb/expert_location_dispatch.py +1 -1
  27. sglang/srt/function_call/base_format_detector.py +74 -12
  28. sglang/srt/function_call/deepseekv3_detector.py +26 -11
  29. sglang/srt/function_call/ebnf_composer.py +95 -63
  30. sglang/srt/function_call/function_call_parser.py +4 -2
  31. sglang/srt/function_call/kimik2_detector.py +41 -16
  32. sglang/srt/function_call/llama32_detector.py +6 -3
  33. sglang/srt/function_call/mistral_detector.py +11 -3
  34. sglang/srt/function_call/pythonic_detector.py +16 -14
  35. sglang/srt/function_call/qwen25_detector.py +12 -3
  36. sglang/srt/function_call/qwen3_coder_detector.py +151 -0
  37. sglang/srt/hf_transformers_utils.py +0 -1
  38. sglang/srt/layers/activation.py +24 -3
  39. sglang/srt/layers/attention/base_attn_backend.py +3 -1
  40. sglang/srt/layers/attention/flashattention_backend.py +3 -3
  41. sglang/srt/layers/attention/flashinfer_backend.py +40 -1
  42. sglang/srt/layers/communicator.py +12 -12
  43. sglang/srt/layers/dp_attention.py +72 -24
  44. sglang/srt/layers/linear.py +13 -102
  45. sglang/srt/layers/logits_processor.py +34 -24
  46. sglang/srt/layers/moe/ep_moe/kernels.py +4 -2
  47. sglang/srt/layers/moe/ep_moe/layer.py +23 -402
  48. sglang/srt/layers/moe/fused_moe_native.py +7 -47
  49. sglang/srt/layers/moe/fused_moe_triton/__init__.py +4 -4
  50. sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=160,N=320,device_name=NVIDIA_H20-3e.json +146 -0
  51. sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=384,N=128,device_name=NVIDIA_H20,dtype=fp8_w8a8,block_shape=[128, 128].json +146 -0
  52. sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=384,N=128,device_name=NVIDIA_H200,dtype=fp8_w8a8,block_shape=[128, 128].json +146 -0
  53. sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=384,N=256,device_name=NVIDIA_H20-3e,dtype=fp8_w8a8,block_shape=[128, 128].json +146 -0
  54. sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=385,N=128,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128, 128].json +146 -0
  55. sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=385,N=128,device_name=NVIDIA_H200,dtype=fp8_w8a8,block_shape=[128, 128].json +146 -0
  56. sglang/srt/layers/moe/fused_moe_triton/fused_moe.py +54 -263
  57. sglang/srt/layers/moe/fused_moe_triton/layer.py +14 -396
  58. sglang/srt/layers/moe/topk.py +190 -23
  59. sglang/srt/layers/quantization/__init__.py +20 -134
  60. sglang/srt/layers/quantization/awq.py +578 -11
  61. sglang/srt/layers/quantization/awq_triton.py +339 -0
  62. sglang/srt/layers/quantization/base_config.py +85 -10
  63. sglang/srt/layers/quantization/blockwise_int8.py +17 -55
  64. sglang/srt/layers/quantization/compressed_tensors/compressed_tensors.py +13 -11
  65. sglang/srt/layers/quantization/compressed_tensors/compressed_tensors_moe.py +23 -79
  66. sglang/srt/layers/quantization/fp8.py +273 -62
  67. sglang/srt/layers/quantization/fp8_kernel.py +210 -46
  68. sglang/srt/layers/quantization/fp8_utils.py +2 -2
  69. sglang/srt/layers/quantization/gptq.py +501 -143
  70. sglang/srt/layers/quantization/marlin_utils.py +790 -0
  71. sglang/srt/layers/quantization/modelopt_quant.py +34 -112
  72. sglang/srt/layers/quantization/moe_wna16.py +45 -49
  73. sglang/srt/layers/quantization/petit.py +252 -0
  74. sglang/srt/layers/quantization/petit_utils.py +104 -0
  75. sglang/srt/layers/quantization/qoq.py +7 -6
  76. sglang/srt/layers/quantization/scalar_type.py +352 -0
  77. sglang/srt/layers/quantization/unquant.py +422 -0
  78. sglang/srt/layers/quantization/utils.py +340 -9
  79. sglang/srt/layers/quantization/w4afp8.py +8 -4
  80. sglang/srt/layers/quantization/w8a8_fp8.py +17 -51
  81. sglang/srt/layers/quantization/w8a8_int8.py +51 -115
  82. sglang/srt/layers/radix_attention.py +5 -3
  83. sglang/srt/layers/vocab_parallel_embedding.py +1 -41
  84. sglang/srt/lora/lora.py +0 -4
  85. sglang/srt/lora/lora_manager.py +162 -164
  86. sglang/srt/lora/lora_registry.py +124 -0
  87. sglang/srt/lora/mem_pool.py +83 -35
  88. sglang/srt/lora/utils.py +12 -5
  89. sglang/srt/managers/cache_controller.py +288 -0
  90. sglang/srt/managers/io_struct.py +60 -30
  91. sglang/srt/managers/mm_utils.py +7 -8
  92. sglang/srt/managers/schedule_batch.py +163 -113
  93. sglang/srt/managers/schedule_policy.py +68 -27
  94. sglang/srt/managers/scheduler.py +256 -86
  95. sglang/srt/managers/scheduler_output_processor_mixin.py +22 -4
  96. sglang/srt/managers/tokenizer_manager.py +38 -27
  97. sglang/srt/managers/tp_worker.py +16 -4
  98. sglang/srt/managers/tp_worker_overlap_thread.py +11 -0
  99. sglang/srt/mem_cache/allocator.py +74 -23
  100. sglang/srt/mem_cache/base_prefix_cache.py +14 -2
  101. sglang/srt/mem_cache/chunk_cache.py +5 -2
  102. sglang/srt/mem_cache/hicache_storage.py +168 -0
  103. sglang/srt/mem_cache/hiradix_cache.py +194 -5
  104. sglang/srt/mem_cache/memory_pool.py +16 -1
  105. sglang/srt/mem_cache/memory_pool_host.py +44 -2
  106. sglang/srt/mem_cache/radix_cache.py +26 -0
  107. sglang/srt/mem_cache/swa_radix_cache.py +1025 -0
  108. sglang/srt/metrics/collector.py +9 -0
  109. sglang/srt/model_executor/cuda_graph_runner.py +66 -31
  110. sglang/srt/model_executor/forward_batch_info.py +210 -25
  111. sglang/srt/model_executor/model_runner.py +147 -42
  112. sglang/srt/model_loader/loader.py +7 -1
  113. sglang/srt/model_loader/utils.py +4 -4
  114. sglang/srt/models/clip.py +1 -1
  115. sglang/srt/models/deepseek.py +9 -6
  116. sglang/srt/models/deepseek_janus_pro.py +1 -1
  117. sglang/srt/models/deepseek_v2.py +192 -173
  118. sglang/srt/models/deepseek_vl2.py +5 -5
  119. sglang/srt/models/gemma.py +48 -0
  120. sglang/srt/models/gemma2.py +52 -0
  121. sglang/srt/models/gemma3_causal.py +63 -0
  122. sglang/srt/models/gemma3_mm.py +1 -1
  123. sglang/srt/models/gemma3n_mm.py +2 -4
  124. sglang/srt/models/granitemoe.py +385 -0
  125. sglang/srt/models/grok.py +9 -3
  126. sglang/srt/models/hunyuan.py +63 -16
  127. sglang/srt/models/internvl.py +1 -1
  128. sglang/srt/models/kimi_vl.py +1 -1
  129. sglang/srt/models/llama.py +41 -0
  130. sglang/srt/models/llama4.py +11 -11
  131. sglang/srt/models/llava.py +2 -2
  132. sglang/srt/models/llavavid.py +1 -1
  133. sglang/srt/models/minicpm.py +0 -2
  134. sglang/srt/models/minicpmo.py +3 -7
  135. sglang/srt/models/minicpmv.py +1 -1
  136. sglang/srt/models/mistral.py +1 -1
  137. sglang/srt/models/mixtral.py +9 -2
  138. sglang/srt/models/mllama.py +3 -5
  139. sglang/srt/models/mllama4.py +13 -6
  140. sglang/srt/models/olmoe.py +8 -5
  141. sglang/srt/models/persimmon.py +330 -0
  142. sglang/srt/models/phi.py +321 -0
  143. sglang/srt/models/phi4mm.py +44 -4
  144. sglang/srt/models/phi4mm_audio.py +1260 -0
  145. sglang/srt/models/phi4mm_utils.py +1917 -0
  146. sglang/srt/models/phimoe.py +9 -3
  147. sglang/srt/models/qwen.py +37 -0
  148. sglang/srt/models/qwen2.py +41 -0
  149. sglang/srt/models/qwen2_5_vl.py +4 -4
  150. sglang/srt/models/qwen2_audio.py +1 -1
  151. sglang/srt/models/qwen2_moe.py +53 -9
  152. sglang/srt/models/qwen2_vl.py +4 -4
  153. sglang/srt/models/qwen3.py +65 -1
  154. sglang/srt/models/qwen3_moe.py +57 -24
  155. sglang/srt/models/vila.py +1 -1
  156. sglang/srt/multimodal/processors/base_processor.py +91 -97
  157. sglang/srt/multimodal/processors/clip.py +21 -19
  158. sglang/srt/multimodal/processors/deepseek_vl_v2.py +8 -26
  159. sglang/srt/multimodal/processors/gemma3.py +13 -17
  160. sglang/srt/multimodal/processors/gemma3n.py +19 -23
  161. sglang/srt/multimodal/processors/internvl.py +9 -10
  162. sglang/srt/multimodal/processors/janus_pro.py +12 -27
  163. sglang/srt/multimodal/processors/kimi_vl.py +12 -14
  164. sglang/srt/multimodal/processors/llava.py +4 -2
  165. sglang/srt/multimodal/processors/minicpm.py +35 -44
  166. sglang/srt/multimodal/processors/mlama.py +21 -18
  167. sglang/srt/multimodal/processors/mllama4.py +4 -5
  168. sglang/srt/multimodal/processors/phi4mm.py +63 -39
  169. sglang/srt/multimodal/processors/pixtral.py +14 -35
  170. sglang/srt/multimodal/processors/qwen_audio.py +65 -0
  171. sglang/srt/multimodal/processors/qwen_vl.py +16 -21
  172. sglang/srt/multimodal/processors/vila.py +14 -14
  173. sglang/srt/reasoning_parser.py +46 -4
  174. sglang/srt/sampling/sampling_batch_info.py +6 -5
  175. sglang/srt/sampling/sampling_params.py +8 -1
  176. sglang/srt/server_args.py +454 -270
  177. sglang/srt/speculative/eagle_draft_cuda_graph_runner.py +33 -28
  178. sglang/srt/speculative/eagle_draft_extend_cuda_graph_runner.py +46 -37
  179. sglang/srt/speculative/eagle_utils.py +51 -23
  180. sglang/srt/speculative/eagle_worker.py +59 -44
  181. sglang/srt/two_batch_overlap.py +10 -5
  182. sglang/srt/utils.py +44 -69
  183. sglang/test/runners.py +14 -3
  184. sglang/test/test_activation.py +50 -1
  185. sglang/test/test_block_fp8.py +8 -3
  186. sglang/test/test_block_fp8_ep.py +1 -1
  187. sglang/test/test_custom_ops.py +12 -7
  188. sglang/test/test_cutlass_w4a8_moe.py +1 -3
  189. sglang/test/test_fp4_moe.py +1 -3
  190. sglang/test/test_marlin_moe.py +286 -0
  191. sglang/test/test_marlin_utils.py +171 -0
  192. sglang/test/test_utils.py +35 -0
  193. sglang/version.py +1 -1
  194. {sglang-0.4.9.post2.dist-info → sglang-0.4.9.post4.dist-info}/METADATA +10 -10
  195. {sglang-0.4.9.post2.dist-info → sglang-0.4.9.post4.dist-info}/RECORD +198 -175
  196. sglang/srt/layers/quantization/quant_utils.py +0 -166
  197. sglang/srt/managers/multimodal_processors/qwen_audio.py +0 -94
  198. {sglang-0.4.9.post2.dist-info → sglang-0.4.9.post4.dist-info}/WHEEL +0 -0
  199. {sglang-0.4.9.post2.dist-info → sglang-0.4.9.post4.dist-info}/licenses/LICENSE +0 -0
  200. {sglang-0.4.9.post2.dist-info → sglang-0.4.9.post4.dist-info}/top_level.txt +0 -0
@@ -1,7 +1,7 @@
1
1
  sglang/__init__.py,sha256=x1v8748WXS2BAptWAd5fR3YBEkngC7e_P_rkCNuNCGg,1702
2
2
  sglang/api.py,sha256=rcp3GeoyZhmJ0GDLPRkuZNcxd0TBJy_wfUDpcmQoqW8,7210
3
3
  sglang/bench_offline_throughput.py,sha256=TwgXZYmwPaHVsdPtNU9LO0p1tr5OOKLy9wYgrfGAlFU,14056
4
- sglang/bench_one_batch.py,sha256=RJsXQ7pvq8y4yzW7svURtWZF5RiawxEMrsjV0OcKsrk,19388
4
+ sglang/bench_one_batch.py,sha256=ETz7G8HazZ0iVkWVLrzgNEENnJ_xR_8UCzzRLm-AbpQ,19462
5
5
  sglang/bench_one_batch_server.py,sha256=LS1BRmFwP67IpYlU5wmkWjqquiA5drvtWe-fwHnFSKI,14170
6
6
  sglang/bench_serving.py,sha256=nOjDnqOKDezDvtCvEhC1_FAoWVkir38bSaEIcSGGVZg,71748
7
7
  sglang/check_env.py,sha256=qDMIG2rCNBH1yKnxQmF-Bp10oiFMUKMgfZLHZYOmdSY,8412
@@ -10,9 +10,9 @@ sglang/global_config.py,sha256=xzLdk8W53fneFblNh8iIjGF9C3-7mnzR1-LleD9Btxg,1495
10
10
  sglang/launch_server.py,sha256=mDXfwha8LHpWQJekcCosR98QhCQsbmilsBlI5jAIgg0,420
11
11
  sglang/profiler.py,sha256=tEHzHerXC-ymk4OrkoUcMbgcGHmb8VESthsNSP2Yx9w,4417
12
12
  sglang/utils.py,sha256=leKs-YyX1_Jk216yoKX-KRYx_EbLiuemsHbD31xSjMw,16445
13
- sglang/version.py,sha256=2VQK7_pzesJW0_F_Vd4w5UmkEfHPeIjSBRrIXNIBvAU,28
13
+ sglang/version.py,sha256=7hKPeJG6JhOmqx_uKkIvWkBNoTZDwS93b5EIfp7zQXQ,28
14
14
  sglang/eval/llama3_eval.py,sha256=gWSboDchIGybIce88bJlrCG0yiLZ513mw4gcutJlzGM,10017
15
- sglang/eval/loogle_eval.py,sha256=pRPVA4fxGmT3_oXvXnlNE-UlPrcQGLBJF-OSE9YWJXM,4336
15
+ sglang/eval/loogle_eval.py,sha256=-CC2s2kh5qUoDrHRkQVkC_jNvBgNojXbf456ny5s78s,4557
16
16
  sglang/lang/chat_template.py,sha256=HKlx7snSWFED8GKF5ex79sQrPWFw5TSXQM0_LsiD9Bc,20552
17
17
  sglang/lang/choices.py,sha256=-W1DVw9N9ZliVpvmWrzIXG4cswAah8eMQrHWzkS3D8o,6234
18
18
  sglang/lang/compiler.py,sha256=MAuzoOOpb98njJ7Io2SDmFkhTroDYiq0te0ZpfHkMY4,7597
@@ -26,38 +26,38 @@ sglang/lang/backend/litellm.py,sha256=ugmL7sfUxkUHVbHtwNzHgdQAEd4UCjNQboFuE3KThc
26
26
  sglang/lang/backend/openai.py,sha256=YFs7pCDK6_DoYmjTa-vgDVdaeE4PYr7E-sIC1q7vAns,16422
27
27
  sglang/lang/backend/runtime_endpoint.py,sha256=oxLCLXCa26VfKyPV-wbRjLrQvqTG8NzoaVgwczzyIYc,17481
28
28
  sglang/lang/backend/vertexai.py,sha256=gz0uNYyBb88jbPYz6ZIJ774fefrcbuVdoK33bphUZpI,4827
29
- sglang/srt/_custom_ops.py,sha256=0lJRMTKTjoxJPh1qQnnMY02Z3SyBDi7LJI34IBLQsgQ,4462
29
+ sglang/srt/_custom_ops.py,sha256=9GPNUyqnybgvUnzdQ8n5_NgluHmQNw0Gptos0iLPfrY,5342
30
30
  sglang/srt/aio_rwlock.py,sha256=6LYtOdeTUY3hkfa1dmYkgsaF2ttrwIF3hUWz2AZ2fqw,2970
31
31
  sglang/srt/code_completion_parser.py,sha256=KFa95OU0TeVjJkOqIgS4xV3kaJ5dFWOmAAgISyc1oEc,3803
32
32
  sglang/srt/constants.py,sha256=0i-tEwG2BSYNDy96MxnGHV5HnBELkYcnsVGsE-R18o0,93
33
- sglang/srt/conversation.py,sha256=NeXU0CFdx_b8gLvmNCXjbqllXTTNAfQCD7mr6JrVtHw,40360
34
- sglang/srt/custom_op.py,sha256=87r2PIgiGLREsIZQ8qsUD-zgI66_54y9GrE0buXzoCI,3076
33
+ sglang/srt/conversation.py,sha256=8Ne6Wcjhdo9gSqIDNEcRCiPIIUawGjfDUimp5IHCeps,40396
34
+ sglang/srt/custom_op.py,sha256=7OPQAZe3PqDXk-xM0Wxl7pm9cazilNJfkNiYIWztWgI,3198
35
35
  sglang/srt/debug_utils.py,sha256=slaFOY4BYDBFatkfu8FZlzai-u4LFS-5GUzdr-t50zE,2241
36
- sglang/srt/hf_transformers_utils.py,sha256=X3lntqlG9h7zNvAonhj47St0AR8Nx5NUHjn0wWYxTlw,12457
36
+ sglang/srt/hf_transformers_utils.py,sha256=UiGjp70ZpTaZDJ99Roc-2DTkxV3gR-2oJjjaNY9Ekh4,12391
37
37
  sglang/srt/jinja_template_utils.py,sha256=0c6nQjkGukmyXsqQ9r85R5QK9CafnjqXyrXF4K3aFhE,7177
38
38
  sglang/srt/model_parallel.py,sha256=eLXZhvJ4wG6dh0FontNCIdVZvHYdWgaeY-5cu7TD9tE,6078
39
39
  sglang/srt/operations.py,sha256=ddQ8KO63L73OciaR8MZ9h2h83gKVY4-WuWgeEGowPJA,5346
40
40
  sglang/srt/operations_strategy.py,sha256=Pwd2sKeRtKh9WJXgzlNr2tU9y6YMcI3MDLbatHqlMws,7145
41
41
  sglang/srt/patch_torch.py,sha256=OUPCGQSQz3MVZB1zZ_Eq8lXiw0uIKJ_HWjqQolI8FsM,3088
42
- sglang/srt/reasoning_parser.py,sha256=DkZrFhkJ9qe7w46fTnM9sqhXwTDgZxD4qPdGka-Dly8,7579
43
- sglang/srt/server_args.py,sha256=HOwXUp6ver6xVZNaRJH-A9rtC_VpM7tPyMBF08JFOl4,76138
42
+ sglang/srt/reasoning_parser.py,sha256=8S7oLj5a1jPPwgs9Yl4sZ2A_wn_qobrmPjUJU0BswCQ,9224
43
+ sglang/srt/server_args.py,sha256=Qdg567MVXoy2spYojSMY8MbcwFsALS7AnHCGXfqazAM,84056
44
44
  sglang/srt/torch_memory_saver_adapter.py,sha256=K_eTx0UU84MHSTXI3iqYLdHV4IWtJMJ2FKdGFJR8v1E,2417
45
- sglang/srt/two_batch_overlap.py,sha256=Pqqj4BzVbXCiOvWE20MGMo21AoAmEPd0R32DsPfD5c8,28562
46
- sglang/srt/utils.py,sha256=mQE61yjzwgI8iwxrcaiZk4Zeyd69S3ErBuXQuYNita4,91714
45
+ sglang/srt/two_batch_overlap.py,sha256=Lx4bIXJb3hd9vzuJbmp3Crf4I8_NrT9fUbs-4LRzQXk,28711
46
+ sglang/srt/utils.py,sha256=CSiP9vU3mxsAKQAK9DvgE4Ygd0LiHrl4zNJP5nuhqkU,89974
47
47
  sglang/srt/warmup.py,sha256=zldxhMlXpclRAJXmfBjJNUJd1eDizVdysibBvQyTVuA,1782
48
48
  sglang/srt/configs/__init__.py,sha256=8EcVRP95epZ49DxBa6LgKWt7eO3Qe7Hrr3V1c6HkMnY,553
49
49
  sglang/srt/configs/chatglm.py,sha256=j-b0YkdYUmQm2y1kNmMJtKeACxWKmBbvNNkDWbs6kbI,2907
50
50
  sglang/srt/configs/dbrx.py,sha256=tdhIkXAQl1yr0MxqFmsDG1E0e2puRTTKm6UTyANBLac,11005
51
- sglang/srt/configs/deepseekvl2.py,sha256=X8Q2gm7og_Ylx6tbFXetusfIJIXjWY_YH_p90C67BTI,23397
51
+ sglang/srt/configs/deepseekvl2.py,sha256=sYMmoy5_LlDXht7MTi4QGYOaiE8iMGUO44bnuOu4i8I,23683
52
52
  sglang/srt/configs/device_config.py,sha256=kdwFrk5myAURxdp4rSr8ANpBpSJfuBDoT-kuCyuscRs,442
53
53
  sglang/srt/configs/exaone.py,sha256=Duxd4yQoKy8GWEzZD_kCY_OzmN_67CTJL_Kgn0eXk3g,10731
54
- sglang/srt/configs/internvl.py,sha256=Z2kmT-5BzR4EdoLmbsgnK5HBXmpjzKAcaTuHaPYrQHE,27553
55
- sglang/srt/configs/janus_pro.py,sha256=95qLFQ43n-q5MVEDnh9OBXCUNXOCofwBKYvd7LKPvRI,19097
54
+ sglang/srt/configs/internvl.py,sha256=Ws-LNun1s5kaATSp8H0XNbUrwMa9Be9axZ6hfig_F7I,27697
55
+ sglang/srt/configs/janus_pro.py,sha256=yI2c_aWBIKiTcK6RZxK6hq8CIxyYRH_NN8uaSNKsrKI,19156
56
56
  sglang/srt/configs/kimi_vl.py,sha256=4W7VQI3pr888ZsFA2SqCQo4mI0seXTOrGQ-x3oTvWew,1358
57
57
  sglang/srt/configs/kimi_vl_moonvit.py,sha256=hx2Rt4JSFbvy2HUTeLjBpge87m8M6ITAhqsgdNf_Jd4,1163
58
58
  sglang/srt/configs/load_config.py,sha256=qs-AxuplouBx2tsv9KGBOLZPbwzuVA4vbktbGP_cRp8,3309
59
- sglang/srt/configs/model_config.py,sha256=N-S1xKCEH-5LqVfL9VEGKUHRFAujFgczB6tIk5Jr-_Y,28333
60
- sglang/srt/configs/update_config.py,sha256=2EpDVocEpMv35g1V-iPLSaLjBgylC5vN0yYSlW49k5w,4664
59
+ sglang/srt/configs/model_config.py,sha256=zLuzY5QlldWYuEb9zHlARTOuXYqZbXijhJHWMuy2lZA,28413
60
+ sglang/srt/configs/update_config.py,sha256=D-myV9Ombwp6wTF0RX9qUO6m5rxFiUcyse32FQADG28,4787
61
61
  sglang/srt/configs/utils.py,sha256=3nHUfisMs_Ltuhv8OZTNCJp63YJKJVF43h1QZB1zqx8,670
62
62
  sglang/srt/connector/__init__.py,sha256=czLX5JOxuMhH-T9eSJzoc1qv1B4z9chyffDRL5I6wo4,1247
63
63
  sglang/srt/connector/base_connector.py,sha256=i6i1TIzsz4NbSEkrdMPq-urb2sN2aLAx8dazga4gB9U,2833
@@ -74,11 +74,11 @@ sglang/srt/constrained/outlines_jump_forward.py,sha256=Gyubp-FVetxd6wP4FA_kD6cCX
74
74
  sglang/srt/constrained/reasoner_grammar_backend.py,sha256=YFxWuOTTo4e6cGhxnaBwuwli6f8FTUJtszib8dBq_8I,3207
75
75
  sglang/srt/constrained/xgrammar_backend.py,sha256=u9Ao-XX22UzALkATEAR_-0EoyBTxMTJV590qd9LAUHM,7906
76
76
  sglang/srt/constrained/triton_ops/bitmask_ops.py,sha256=WjTen9iuuFWLzkE1mAHQZB9_7aIy5QH8Wjf-lB-Fams,4614
77
- sglang/srt/disaggregation/decode.py,sha256=sND6tJTIgxdaqDOem9mAaaMQWZTVxho5sniMOYVkQ7I,33944
77
+ sglang/srt/disaggregation/decode.py,sha256=P-0OyFjjDfthEVhlJugdscWST_uoOVmHZlSlx9NYLmE,34242
78
78
  sglang/srt/disaggregation/decode_schedule_batch_mixin.py,sha256=8UdNaj8KKMLV5Cydhw8gnHM-zRrnKM_AAd3Qc-SRfWg,5648
79
79
  sglang/srt/disaggregation/kv_events.py,sha256=yFbtwOeblcCmOXTjg00TopxnyjkmCBQIVz46KB8jetY,13555
80
80
  sglang/srt/disaggregation/launch_lb.py,sha256=mcbAztN4gnHevw_T5R2_nWsymsDEY9vHkm7OJ1vr6cc,4211
81
- sglang/srt/disaggregation/mini_lb.py,sha256=BBeIdeZZxi7Ra5_hukHHX3TNdyfZ4tP1GBUxC-qrv_g,14401
81
+ sglang/srt/disaggregation/mini_lb.py,sha256=bpnz6d90nv7vAoiPxmxFKlM1Gjct0R4IPkF9SwwBk9I,14504
82
82
  sglang/srt/disaggregation/prefill.py,sha256=3u6WCrjogZSqd6yWdBZe1HO4lf6w2e9M7sQtGHyax-Y,23512
83
83
  sglang/srt/disaggregation/utils.py,sha256=ql5p9yjBCRcR0YMgcgRK6tH0kPGvLNTUgeXBr_BUcoI,12198
84
84
  sglang/srt/disaggregation/ascend/__init__.py,sha256=-lxnica6fZYmYNpKwmE8yESUpQ5Sxf2DiZoBHzboKc8,146
@@ -87,37 +87,38 @@ sglang/srt/disaggregation/ascend/transfer_engine.py,sha256=_4PszsQL6wICdg5cqpR2N
87
87
  sglang/srt/disaggregation/base/__init__.py,sha256=4VwUv0aWxwmVL1049XK82aLTNxmt0WY5RPy9li-wyVk,160
88
88
  sglang/srt/disaggregation/base/conn.py,sha256=CPDAoAkYaFtVPLa1QROfwipSVe7MH6omzIBHzo8TSYk,2811
89
89
  sglang/srt/disaggregation/common/__init__.py,sha256=7yl-EGLMVKRpBUaGF_7lwAsw2J_mqpRZV0238VGxD9o,126
90
- sglang/srt/disaggregation/common/conn.py,sha256=CZR1lMCE_mpSkvjc6BBmSr1SbHY1uZuxjpanazD-YXc,16071
90
+ sglang/srt/disaggregation/common/conn.py,sha256=3YJVviObY3fkSfQbVxE5lgcqMmqM5nDjWfEjS5-SW6I,17054
91
91
  sglang/srt/disaggregation/common/utils.py,sha256=SxRhAWisNK8seGhb5BXBJ5u53DF7yeKVPMWPcB5ywbE,1194
92
92
  sglang/srt/disaggregation/fake/__init__.py,sha256=jJGWdXwaQiGIoR6atKqkQfkJmVyQ09l55VUN2WjwaeY,77
93
93
  sglang/srt/disaggregation/fake/conn.py,sha256=oD1DArn1yDFZCu-X6p93uSLlAXEkt9lYxERICMznxGw,2286
94
94
  sglang/srt/disaggregation/mooncake/__init__.py,sha256=0TgqkAdQI1YynbHY6c0QISvVoOSk-0SwCIq5rjPSmgE,156
95
- sglang/srt/disaggregation/mooncake/conn.py,sha256=GUC1LUuO-PI7TmiZg-KBXpyccYCwE5K5byoV2eHxIFw,60891
96
- sglang/srt/disaggregation/mooncake/transfer_engine.py,sha256=a3pki0d7QauTn6slt7gVxjicABP6Uo4Ztt0wEXR9dZc,4687
95
+ sglang/srt/disaggregation/mooncake/conn.py,sha256=uHCmSIdo4-BfVez3uP4JmQ3vsRKXJhrcBAaRNi2dgBs,61314
96
+ sglang/srt/disaggregation/mooncake/transfer_engine.py,sha256=-ulLhz6DBDsmEjwNjjH5Pj8ngZKISgwBc_zL3ViGDN0,4761
97
97
  sglang/srt/disaggregation/nixl/__init__.py,sha256=qODVPIGWUXKXq4zsRIcMYoAoAeg6nBIN9vdQOlVMANE,136
98
- sglang/srt/disaggregation/nixl/conn.py,sha256=cXqWU2Gbi6E2LS0MznEcgFCrwONhYxBtD-zE9DU32z0,20333
98
+ sglang/srt/disaggregation/nixl/conn.py,sha256=eSof87fG21Dd4COszfnbeXIxne3TWvw0mSvCOkjsBZc,20323
99
99
  sglang/srt/distributed/__init__.py,sha256=jFOcyt-wFAPMBUAf9zkZalNQlt-4rqmT6pCKBz1E4qo,149
100
100
  sglang/srt/distributed/communication_op.py,sha256=IBnFUdMftK_VSTMMMitGveonorFUUVNL4guqO31cMSc,1130
101
- sglang/srt/distributed/parallel_state.py,sha256=tZL5PLVowAQvq5xlT573Di63hWKsiqJZbl-auj85wNA,54997
101
+ sglang/srt/distributed/parallel_state.py,sha256=crlAUplgruIVrDk6jFZ0-6M3W6FXX67buZ3T-4XDgFA,58530
102
102
  sglang/srt/distributed/utils.py,sha256=aaCxATncLGnVgB0WlGpBdee0behKW8Dy_dakqcuKSaQ,8497
103
103
  sglang/srt/distributed/device_communicators/cuda_wrapper.py,sha256=3jvPG-Ow5UBLiXhfx8T8snR7crSZbPpARAggsDPWq7k,7038
104
- sglang/srt/distributed/device_communicators/custom_all_reduce.py,sha256=qje-PQ3v8yaV-oYVLPws1mgIlXVsGKFCOvXHmSe8ZXg,19624
105
- sglang/srt/distributed/device_communicators/custom_all_reduce_utils.py,sha256=fLoptT_U0lVAqkhEg-ge53CdFSIKQpDRiqHYKwJVEZg,10974
104
+ sglang/srt/distributed/device_communicators/custom_all_reduce.py,sha256=p-GLYYnMSjcUvK30qcwYhXEJwGrOz6rR99p_23SWFj8,16570
105
+ sglang/srt/distributed/device_communicators/custom_all_reduce_utils.py,sha256=Fx9D70NO2dplyuqOxTasMwkzONN3wfC4WOny3tWSbPA,14159
106
106
  sglang/srt/distributed/device_communicators/hpu_communicator.py,sha256=gPjEH1-izoby5uDrfUlzNf21luPT0Ow7pJjhCRKnHy8,1728
107
107
  sglang/srt/distributed/device_communicators/npu_communicator.py,sha256=bRXN1Md_4SHQGzQYZa2GrHv2zbIU5vSpkueHiAZL1xQ,1345
108
108
  sglang/srt/distributed/device_communicators/pymscclpp.py,sha256=8Pgehd02v-BpHixTTB4OB9ZlxA7fyXiPF4Xp9F_heyU,10890
109
109
  sglang/srt/distributed/device_communicators/pynccl.py,sha256=obXyCaZznZHSt486XCnEOBNG3Cen7ysuuMuGRlTTl-8,10095
110
110
  sglang/srt/distributed/device_communicators/pynccl_wrapper.py,sha256=LblisImY9d6EMz-oPS9J16WHo2Q_SRL1DtlJKK63Hfg,15349
111
- sglang/srt/distributed/device_communicators/shm_broadcast.py,sha256=d8mykYmXM1lfbPm8GNtqCF0Un_pdXYjbNmsgoVFyyow,20874
111
+ sglang/srt/distributed/device_communicators/quick_all_reduce.py,sha256=4j1_E4azoxfd8wxtfFmt9rvbQncl8ny6wmTMl6gAkp0,9932
112
+ sglang/srt/distributed/device_communicators/shm_broadcast.py,sha256=IrSrnpZnii0EJTS1CYRwEwE7gyHxJBVgI2QuJS3AKW0,20906
112
113
  sglang/srt/distributed/device_communicators/xpu_communicator.py,sha256=ajW6132BvA6jkeipEIgN27TFycI0U06Ih2Z8WNjlA4s,1593
113
114
  sglang/srt/entrypoints/EngineBase.py,sha256=yKN76witT2jz1zhmLHmPNLGMpK2UiOTaKQ2KPD8l99U,2594
114
- sglang/srt/entrypoints/engine.py,sha256=zZGuZVdyCPf1WeCRb1Lde7fIlAT181IKT1CCmK8AHrk,31328
115
- sglang/srt/entrypoints/http_server.py,sha256=pUZgA7ILuRynIY3Cs2nbFoXSnZ7ohsMauF_RBtl-V_s,37538
115
+ sglang/srt/entrypoints/engine.py,sha256=f8FI-BcjiIlcXdcy4NHmnM8SLNe8eYsNwyv4IoKYRZI,31545
116
+ sglang/srt/entrypoints/http_server.py,sha256=-unKM0lCK7Scd3LLTxLl-3vhit6lMb-wWfjLywelRy0,37214
116
117
  sglang/srt/entrypoints/http_server_engine.py,sha256=_--j4U04OeJLlnnv1f0XmCd_Ry0z1FlhkrbePX8rYV0,4938
117
118
  sglang/srt/entrypoints/openai/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
118
- sglang/srt/entrypoints/openai/protocol.py,sha256=oAd5u_J6Wk9gzXVPS-Ps8VaxkhmMXyIuH1KZ73pEOvQ,19083
119
+ sglang/srt/entrypoints/openai/protocol.py,sha256=UUc5oJ7E60fYoUqMb53H85i7HHhDfmYLIFZidhNrP0s,19147
119
120
  sglang/srt/entrypoints/openai/serving_base.py,sha256=5NJ2S_6B2NFSwn4nLp6eaeJ5iC3IcQzMEY9lW_gPcdA,5246
120
- sglang/srt/entrypoints/openai/serving_chat.py,sha256=QhHvqRjbzwsTQNtRhia7UJd2BlXnxWD-7udRsX_8H8s,36233
121
+ sglang/srt/entrypoints/openai/serving_chat.py,sha256=WUstZZt80I2yrqUfBRx57-YMVMb45VqlyMnSmXuQFNw,38032
121
122
  sglang/srt/entrypoints/openai/serving_completions.py,sha256=emIutVmnJgOgGRuAqdB80-kVHUfQbE67n1VS-76o4QY,16690
122
123
  sglang/srt/entrypoints/openai/serving_embedding.py,sha256=hqPt2ELpT1yQ8sBXo801aLJ3sExoPXs_K5ZQtC2vpAs,6274
123
124
  sglang/srt/entrypoints/openai/serving_rerank.py,sha256=8n6y5kC6UhRpWrDtzH0eIp0dznW12FT60MLCR4bvD2U,3333
@@ -128,49 +129,50 @@ sglang/srt/eplb/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
128
129
  sglang/srt/eplb/eplb_manager.py,sha256=Wt7w4L5g1BSsXx1mqoGo8WjkB55f4nGB4KqC3y_ijl8,3394
129
130
  sglang/srt/eplb/expert_distribution.py,sha256=N2wcIzQo9nzPpH5jR63RH7iB00XvH4R8OGp-rR_07f4,31332
130
131
  sglang/srt/eplb/expert_location.py,sha256=unthN8w37bvxf_4Z1xNi-Gi4SGnZbTBbMpHC1be9QMI,16665
131
- sglang/srt/eplb/expert_location_dispatch.py,sha256=epq06lcViQXoSL9SIf2urjBDjMTlzql5GwMVFpcOAtI,4144
132
+ sglang/srt/eplb/expert_location_dispatch.py,sha256=ErUBjzDffcF0FgPI-Xv90RDrtKnQwNB9woouZFS2C7k,4126
132
133
  sglang/srt/eplb/expert_location_updater.py,sha256=oVIUYzji6BFEd2AgeRcM6kwEqLwwD3_PEEv3EyWIydk,21100
133
134
  sglang/srt/eplb/eplb_algorithms/__init__.py,sha256=c6fo4qM8N0p5DyyfGp9fxqc2wkxvzSJBzJFRG1I1leg,1959
134
135
  sglang/srt/eplb/eplb_algorithms/deepseek.py,sha256=mMZT7zAAArccdRS0xXxifvMb3qn9enSt426uUTKeiq4,8340
135
136
  sglang/srt/eplb/eplb_algorithms/deepseek_vec.py,sha256=Vzy5Iarua1VgVHzjBNZaVV_vt1LY1BLtJz7PmzB701k,10654
136
137
  sglang/srt/eplb/eplb_simulator/__init__.py,sha256=HIZaXqsvsOCMMJ81dSs1afSGZ5G6OiOZEtHpltyzzjY,21
137
138
  sglang/srt/eplb/eplb_simulator/reader.py,sha256=OlsWqsuXqVQY7PfvvrP-vsl2Ww2Kg4vD_K9BltM_QHo,1828
138
- sglang/srt/function_call/base_format_detector.py,sha256=eMSqbx99YPm2m_ChLafFRuLOzXBtA0oJn_Q4FtB3FnM,12950
139
+ sglang/srt/function_call/base_format_detector.py,sha256=FKBzsGFHfNl3Wvccsdvv9ftjbCZIyyjOLj2kHgKvX9g,15901
139
140
  sglang/srt/function_call/core_types.py,sha256=wLUsW8mUA-i-ISz5QUDL7Ejq72W-K1HIhFa9Wm-_oA8,786
140
- sglang/srt/function_call/deepseekv3_detector.py,sha256=XudIiIt2Mejokg6qOkX7vYS-3XIFstOBHv-m-Q5fBLQ,8970
141
- sglang/srt/function_call/ebnf_composer.py,sha256=1r5UPEkUeMCug-P-c1mAZbJPgEXU8hR-fDLdYG5Q-wo,13585
142
- sglang/srt/function_call/function_call_parser.py,sha256=YqtfxJYu9kWZIJTtM20miH2duXIvG6CWintBZ3_7SfQ,7785
143
- sglang/srt/function_call/kimik2_detector.py,sha256=wb--wnAp-ZtWeIJZM1dS33GNu-K9lGxvrFbtp-UmGVk,8978
144
- sglang/srt/function_call/llama32_detector.py,sha256=EHYGAy1NCIxFWKdSQByPxyJgFaFRCtGdgj4ntEAgi00,3619
145
- sglang/srt/function_call/mistral_detector.py,sha256=xNuVl2vDXVYbXyiXLkJZ9VM6njcwlS9EqryR1eJbMr4,4462
146
- sglang/srt/function_call/pythonic_detector.py,sha256=rtXSflE4w993a4OqphWG-WQzvwRz0v3dfgHOnte1fpI,8731
147
- sglang/srt/function_call/qwen25_detector.py,sha256=9JfZem_5nw91Og2biwq8eIpUQjy_3kFz4TQI8Lc3Vow,4882
141
+ sglang/srt/function_call/deepseekv3_detector.py,sha256=WzJbwCe8DoOi8guX9pdVMd70CViVrwoaxi8PZwIC9pg,9712
142
+ sglang/srt/function_call/ebnf_composer.py,sha256=cG0js5-bSl4FK66DyrTaREqLXXbtuLQxHBzxx6xaK3Q,14700
143
+ sglang/srt/function_call/function_call_parser.py,sha256=G6b2VmE2mHarRuXlzAWEY6-yWoEbt830LmykE3Jnz9s,7904
144
+ sglang/srt/function_call/kimik2_detector.py,sha256=7unW_GwH7I6jrh2BZbw22mWRZzQ0OMTYDz_xVX5abPU,10116
145
+ sglang/srt/function_call/llama32_detector.py,sha256=trZja7IXc2IWUko5PRj7p4pRU6XCVjtxr-7qJNr0EWo,3647
146
+ sglang/srt/function_call/mistral_detector.py,sha256=Ts2HrJdu5r2lCCMVKPZfnCds9pt1K5H1EaOQrF_HD60,4686
147
+ sglang/srt/function_call/pythonic_detector.py,sha256=yAatItKtVDf9uhlB78wPWKP3fbefLJDNGGzFV5ey-YA,8756
148
+ sglang/srt/function_call/qwen25_detector.py,sha256=nv83_sipZMU6Vie3J4HeNiZVCSRU5ei7601j50779HA,5181
149
+ sglang/srt/function_call/qwen3_coder_detector.py,sha256=Zwpx4NF3dL7tOKnzczmvfmY3tZQ-vJyehbvtco-8tkM,5478
148
150
  sglang/srt/function_call/utils.py,sha256=__ImDF2kNyoLWsYO5RYoryvy1mmgEjnjXlCvLv-uLCM,1695
149
- sglang/srt/layers/activation.py,sha256=UDrJcnQoIOJjMzZ9XAy5JlEJ-do44tGMtcitY7I8kPQ,7327
151
+ sglang/srt/layers/activation.py,sha256=uhfhh10N5iLoLEBCvFPRjCfDxu5jXe1ehHJb3ISIjig,7840
150
152
  sglang/srt/layers/amx_utils.py,sha256=1mENgHK2B8mgaD1oMtgbZ15Jmy_Uu1QueBmo09Ff2iA,2865
151
- sglang/srt/layers/communicator.py,sha256=yckTsQ_3SeADES7maU2bgIpzwbWu3Q3Qpxu8T8UpCoQ,20045
152
- sglang/srt/layers/dp_attention.py,sha256=V7m_PfvHHtRMJMviIqmoyqf5VFFJLYYcynDuI5dXtAU,10275
153
+ sglang/srt/layers/communicator.py,sha256=c5pJObNyP_7JsIWgLau_E-1ovtPCpAcge254fjo9Rqw,19988
154
+ sglang/srt/layers/dp_attention.py,sha256=tOre7il5Cppu930-tzM6d4AgjHuIJMCMlg9hJkuBcjA,11382
153
155
  sglang/srt/layers/elementwise.py,sha256=MyQUflyKEfPZ-BggW1Kd4hB53RFD6FXGc2S5LXjx_do,16026
154
156
  sglang/srt/layers/flashinfer_comm_fusion.py,sha256=fkTcAB7qYwSWi95qI3Rqq0JUyDpJdcYkd4TYkWO01HI,5891
155
157
  sglang/srt/layers/layernorm.py,sha256=ooqA-t-vY5erbKBwqnOotfDsJRTygP5E10CfzEAVF6M,8657
156
- sglang/srt/layers/linear.py,sha256=7XQvKQL7oS1o8aw3i0XRj4JcV6OOwGycdYJZO21AXvE,55355
157
- sglang/srt/layers/logits_processor.py,sha256=tOPMYopEQuoLBzwbjSmU9OWFYh2mmy3ViJSbA_wpFOU,25619
158
+ sglang/srt/layers/linear.py,sha256=NzjLqZrZNYcc3z2KtA9-n6pnSdBHHwU6NF_BbcAWp48,52471
159
+ sglang/srt/layers/logits_processor.py,sha256=9eZQE8pI-coXeK1XQFrBI0_aENZ2cGTtmD1FptWda5k,26270
158
160
  sglang/srt/layers/multimodal.py,sha256=YVR69WW-2aGDcZHT8IVJ6F_LRM7wraZr8VjrPDXqDmA,2104
159
161
  sglang/srt/layers/parameter.py,sha256=jCg0G-12GZqTa9gGOqEtVCsnnuBGnYg0VmF6pc6oCFg,17455
160
162
  sglang/srt/layers/pooler.py,sha256=uZ6WX1FLMEafZwusyZdm6KuVlIwSjbKrdwk2qzgqNGk,3812
161
- sglang/srt/layers/radix_attention.py,sha256=IlqRB4bk06FOH05_7zB8lik0xLpys7jFooLeCwdO0j8,3437
163
+ sglang/srt/layers/radix_attention.py,sha256=vtzCPfEiWYunglcLfqO9dcATb-LXzU4sFBwIWsWHbiY,3513
162
164
  sglang/srt/layers/rotary_embedding.py,sha256=EhxI0E8jcTWZ2COpnku7crbW8Hew5fe_ujMndj7hKvE,52246
163
165
  sglang/srt/layers/sampler.py,sha256=xNds1migup2s6b9_pS6ljkJUkvNtv7nmTGeIdOzoQ6w,11182
164
166
  sglang/srt/layers/torchao_utils.py,sha256=Ws24FdRBSkTpyeyA6bQrdDm-W5wfDxKvSIPUSahyMfA,4063
165
167
  sglang/srt/layers/utils.py,sha256=IWGg1Hb7c33Z3LHRPVJyUAzp3BnSid23ZWXAmJ_Jvp8,1204
166
- sglang/srt/layers/vocab_parallel_embedding.py,sha256=i1Uoo8TE877jLNjAjwoyMD36W7J3WwFD402YWq0qTT0,23560
168
+ sglang/srt/layers/vocab_parallel_embedding.py,sha256=FSAxHh1w9Qz4A2_8OQfIP5qsmq1s_g-Od-VLJ4vqQPw,22355
167
169
  sglang/srt/layers/attention/aiter_backend.py,sha256=7sEUgViw-xl3yok91yyOD9gTi8lQmME0g0ZiKVTCcyI,32851
168
170
  sglang/srt/layers/attention/ascend_backend.py,sha256=jPCsU9_gH1iZNoZHD9nCeDdVdXqBt31LI65N55BTJPg,8250
169
- sglang/srt/layers/attention/base_attn_backend.py,sha256=KXVcCguwXh-PSrY9Y2aUrlXXUhWdbVxqVEF2_xIMvm4,3466
171
+ sglang/srt/layers/attention/base_attn_backend.py,sha256=_vM05ddWy6SaoqWYPR8w5lflSE4MhcVFR271Q9EKK8E,3600
170
172
  sglang/srt/layers/attention/cutlass_mla_backend.py,sha256=SIR7sKCCegwzahSz82I3gsDyN5TkKoa4yG4-pBQWBi4,9813
171
173
  sglang/srt/layers/attention/double_sparsity_backend.py,sha256=2ZRL_gYz14idoVqQzeQ6N77nXer0f_8_TUYw40XUUz0,9161
172
- sglang/srt/layers/attention/flashattention_backend.py,sha256=ovi2rduqany6oalDWI7WAetjyHO5DybKA3epHimm86o,94076
173
- sglang/srt/layers/attention/flashinfer_backend.py,sha256=Ug4SkZnuHjBBwPOj2TfLlg0eU_GoZvKjhY4oYRU_qqU,49666
174
+ sglang/srt/layers/attention/flashattention_backend.py,sha256=rYsBAsFS1qNNe-3CVIaXxWRqA3eul1jVQXvfZ_wlpwg,94076
175
+ sglang/srt/layers/attention/flashinfer_backend.py,sha256=HQp14R29hQVXYjATKPoGaHY9LJ9e1cw2k-RhBEmFxt8,51505
174
176
  sglang/srt/layers/attention/flashinfer_mla_backend.py,sha256=NirRlNFxD0S2EncvvmrerIxNfuTnYpvemZV3MR5_FnU,34040
175
177
  sglang/srt/layers/attention/flashmla_backend.py,sha256=5iSic5ho-lkXNas9mR3uLbXbEl-do31gc8gjR7-a79k,20711
176
178
  sglang/srt/layers/attention/intel_amx_backend.py,sha256=hH9lxXs_o66_IVs58oPhRCOXGUrHbXSz82FKtHr9GO8,4092
@@ -189,16 +191,16 @@ sglang/srt/layers/attention/triton_ops/rocm_mla_decode_rope.py,sha256=664WnAJ91E
189
191
  sglang/srt/layers/moe/cutlass_moe.py,sha256=--bNTA2BGbHeULb_XXDoRUyWWbE-doHo5K5k1T0N0WA,14323
190
192
  sglang/srt/layers/moe/cutlass_moe_params.py,sha256=9NRCmgP_Ug3gGqCcpi-x-QRbLjCNpw8792gKXwZsbEU,6522
191
193
  sglang/srt/layers/moe/cutlass_w4a8_moe.py,sha256=bc8s5Oc36pCF0VozxZuqFOOU2fov-4wGPlyduye3Imk,7296
192
- sglang/srt/layers/moe/fused_moe_native.py,sha256=bW3KWxxz9rxKMUQqfmAtF-7ptTODA1pwLydE05ABDJE,5030
194
+ sglang/srt/layers/moe/fused_moe_native.py,sha256=SkOFgU23aZfHmLhnkVhdUWGx0-2wbo6uu9ohKBp2yOI,3486
193
195
  sglang/srt/layers/moe/router.py,sha256=UrPieRvemN7Ew48gtG7DA2xhNDBRSnZxzugTEBI-0_E,12006
194
- sglang/srt/layers/moe/topk.py,sha256=FxmdIdyMbRqIequtfwaLsz9Go-1lRooH8d8HBfQ0pvw,18426
196
+ sglang/srt/layers/moe/topk.py,sha256=bDHFcFQscnGDpCk7VejoChbpEVVz8Ph4FdzwcQRny0U,25047
195
197
  sglang/srt/layers/moe/ep_moe/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
196
- sglang/srt/layers/moe/ep_moe/kernels.py,sha256=_pb2_5sNqbkImh4Ylv0hWhEQCOmItvPqB-b3dsfDHc4,42604
197
- sglang/srt/layers/moe/ep_moe/layer.py,sha256=Jl1TolpjQMtpMC2QXq5X5IA3vkF9UlfxlLl8r6qqN2k,62485
198
+ sglang/srt/layers/moe/ep_moe/kernels.py,sha256=UFH-XacP3aBjAcn6_SeC641jGzjSrY0fz50IB9URix4,42706
199
+ sglang/srt/layers/moe/ep_moe/layer.py,sha256=0vJW7RoEJ8Y3wD3q8pk289Gx5KNSVNJBbdpveliyXyM,46910
198
200
  sglang/srt/layers/moe/ep_moe/token_dispatcher.py,sha256=aiBE3mjvWV3eBrFGH9J44tuJncQwOjRS_XeyBNCEtqM,24379
199
- sglang/srt/layers/moe/fused_moe_triton/__init__.py,sha256=h9yMFAL_bagUf-qBED8gSWdCOb7d8IdA-pE-L_nIg8E,842
200
- sglang/srt/layers/moe/fused_moe_triton/fused_moe.py,sha256=Ffcu3Jvp7-nllybh5EWtG0MamWI9PqO8a6ESiMKWEB0,63292
201
- sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=5NQh7_17xTtwSFClwgvpnzXrEO9iitl8aKfMm4jWJCo,37556
201
+ sglang/srt/layers/moe/fused_moe_triton/__init__.py,sha256=4NXZHbCw-G-uSnNUj4up0yh3xBDPnT-x0pdoIr0lku8,831
202
+ sglang/srt/layers/moe/fused_moe_triton/fused_moe.py,sha256=6NcY-6UHQUSVP4qzc8jis4h-W9BEV4lnGmrJMx2S6eA,57164
203
+ sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=BUbo3OFiSjqs34MK09McFYqSsKguDcG6KP1905WUMFA,23933
202
204
  sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py,sha256=hoWVdf8ry8IDGH2bfk2WW-y2S5h5haLTGanBSwkkeE0,5848
203
205
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_1_0/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json",sha256=iNGsE2ZeVnQEnN4A8UJ9Jv0d3hbRF2MJ9oBgjup5Szk,2737
204
206
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_1_0/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB.json",sha256=JJN0hryyLr5Zv3dSS7C8cPFhAwTT6XxUVnBGMZvV6JA,2752
@@ -360,30 +362,41 @@ sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py,sha256=hoWVdf8ry8ID
360
362
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_2_0/E=288,N=64,device_name=NVIDIA_A800-SXM4-80GB.json",sha256=3T8_rF2PEojhgTMyQ8DscXgJCWWdWfDPj4M434zWcA4,3243
361
363
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_2_0/E=8,N=7168,device_name=NVIDIA_H100_80GB_HBM3.json",sha256=tme0ydWzIxdABZLk4tU8G_X2dJUYGGZNkQzNGcmcvUc,3261
362
364
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=128,N=384,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=LNx1W_BsWZcpHomiScCRap46dV0-F7S_w3Htskoqlm8,3263
365
+ "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=160,N=320,device_name=NVIDIA_H20-3e.json",sha256=cWkEpNqnyn0QS8HcgWiwWI1xqh_U93_S1kyNeb69aOc,3238
363
366
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=257,N=256,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=fo1akCuGoqcGwQgfh56hApgg-wLXfo9kHHksE_6m1F4,3262
367
+ "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=384,N=128,device_name=NVIDIA_H20,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=ENDYnC1ljPNpDVHdmqR7UbgDWT1IP_55ZIQ_Oae34mI,3264
368
+ "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=384,N=128,device_name=NVIDIA_H200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=5UAs8Z1myw8F-5FY2HHWd5WMT2ii9X-aYIYkf3FsA8s,3269
369
+ "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=384,N=256,device_name=NVIDIA_H20-3e,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=941ZXJti99_GUeiylwPUWqYK8b548xuNIjv0pz9Kcqg,3262
370
+ "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=385,N=128,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=rgF-KSAUXmI7QGrhMUywPVfeTxz_j8_IP4N-6bkYdak,3260
371
+ "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=385,N=128,device_name=NVIDIA_H200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=7aaoi0MI2xC5ZJkflkTZAH4tawTPdmUpmcBOgOInKxs,3268
364
372
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=8,N=7168,device_name=NVIDIA_H100_80GB_HBM3.json",sha256=a9XJZ0XudUTebAdN5guVq-3XSvZetHIRjatO1-_0xCk,3257
365
- sglang/srt/layers/quantization/__init__.py,sha256=JHV4X982TW7_U7ZobQwNIdK-Z5saEH-R1xKWrF6jgRg,12650
366
- sglang/srt/layers/quantization/awq.py,sha256=KemDG55U3B6YZVjMV71awVAIj0islFvtxcUHmOBeGy0,6739
367
- sglang/srt/layers/quantization/base_config.py,sha256=jWk_egQrVNMYmQgbTI9vkcgzScLFjB5_sywFlAfE5J0,4776
368
- sglang/srt/layers/quantization/blockwise_int8.py,sha256=vWyPZsRLhdKtSmjvlT5fsowBK_nEebYbDAUh2yqseGw,15285
369
- sglang/srt/layers/quantization/fp8.py,sha256=X97n8M7Kqhv98JvVQsSW6oYJtI2Wwrnoix-LMtsaxu4,47468
370
- sglang/srt/layers/quantization/fp8_kernel.py,sha256=PuDdACPV8xFQwcEAY57L465-yPJHbbJBKOlo1vuEOPM,34744
371
- sglang/srt/layers/quantization/fp8_utils.py,sha256=fsX1x17RwcK88N1WpF-YELQOpkpHvJnoLriZj27H2R8,25611
372
- sglang/srt/layers/quantization/gptq.py,sha256=B0J14a-OANM2uglnatukFMlvpDnUprV3-p_l4308WUQ,26838
373
+ sglang/srt/layers/quantization/__init__.py,sha256=lMjOmhMntbY55RR5eKKLB338tdzlxGuBx-pT4f9jmIM,8130
374
+ sglang/srt/layers/quantization/awq.py,sha256=gLEOx6QoGQ0McBEURXPVidKGsdNUjqc9sJwGLQx86rE,26690
375
+ sglang/srt/layers/quantization/awq_triton.py,sha256=4XwJbRNlFmlvjbMGtWF1Wvk26Kf96162vNEmuI5Kars,11737
376
+ sglang/srt/layers/quantization/base_config.py,sha256=CiSxG5iuOa-12V9kIOh0Fu8Y7knZxfFbbNGTo6nEaRE,7173
377
+ sglang/srt/layers/quantization/blockwise_int8.py,sha256=3avetVUBjCiuYWBJQbElbVXWpx0SgsFsDc5F9F_zHgA,13879
378
+ sglang/srt/layers/quantization/fp8.py,sha256=T6Gns69ot-qE4DcxhZLoY41VG450qpbM_EbuRdRleuk,56618
379
+ sglang/srt/layers/quantization/fp8_kernel.py,sha256=1nrJvQNVZszd_SIIeOEgB2CiqyqdfVHbsBXegPiEfk4,40160
380
+ sglang/srt/layers/quantization/fp8_utils.py,sha256=6FVR6_Y8akP4ihCaGG_bLYurcC_PShPtiPgiEvGN5bE,25605
381
+ sglang/srt/layers/quantization/gptq.py,sha256=3q9xfq5sJJHcrVr9C8-l9JdcLFvwKAAfWJEfZW6CzLs,39145
373
382
  sglang/srt/layers/quantization/int8_kernel.py,sha256=GfRC9FOn9exNvK4QHbUeBj3Hhv32VcyGphapFPt5b84,12625
374
383
  sglang/srt/layers/quantization/int8_utils.py,sha256=YK9CS-lb_n91kNCTKK5o5apYF31V2giDg5G5VKrpcUA,2356
375
384
  sglang/srt/layers/quantization/kv_cache.py,sha256=_9pF5rwvB7ta6Gdc5YKVVGbNzYwqmhIx4TrX1-xnodQ,3261
376
- sglang/srt/layers/quantization/modelopt_quant.py,sha256=0abOZfOyGYOQFiyMssZPey1YekQrAQBcMp-GQlrFXZY,40746
377
- sglang/srt/layers/quantization/moe_wna16.py,sha256=Fb7qc4fHec9Qst1ne55YqNAJvO5D3JoMMkhYrYh8vzE,19646
378
- sglang/srt/layers/quantization/qoq.py,sha256=adhsCixRUTh1m8sfpRWNhh5oX3I1WJli3Elg8uexP6A,8222
379
- sglang/srt/layers/quantization/quant_utils.py,sha256=kBibCBK9DCambuPy2atB82Bmalb-Vs_wbQoVHT7h2Lw,5089
380
- sglang/srt/layers/quantization/utils.py,sha256=qHdWbLQD8teKhv2tOcuyGegpFonXygoJHwCAD7Ur5MA,5439
381
- sglang/srt/layers/quantization/w4afp8.py,sha256=Rf8wMqtGUgLF8soOM16owfFI0AR1q1Ylzr5YpcdqyxU,9538
382
- sglang/srt/layers/quantization/w8a8_fp8.py,sha256=ZB6ydquyPOORDe9OCoEBRH6dsQhCeRWv1YIgm8UDQwQ,11622
383
- sglang/srt/layers/quantization/w8a8_int8.py,sha256=jXQiodlIShMWbivWPlnLFkg9W41eC-_5bWTzd5AMecA,37189
385
+ sglang/srt/layers/quantization/marlin_utils.py,sha256=ShsoxcVTYo1Es3XKp9mlQNw-TsRF_o4mHIO5MfAP5HA,25906
386
+ sglang/srt/layers/quantization/modelopt_quant.py,sha256=ZxnHbYkpSt20xwV1zhZp3Xk93JzxBQOGHobZWIMluII,37872
387
+ sglang/srt/layers/quantization/moe_wna16.py,sha256=NGcFjiMXwfOX10dkHAY3EgZHxox2k7I402Bvwj3jW1Q,19105
388
+ sglang/srt/layers/quantization/petit.py,sha256=74Jn0eICq23v_b4rEctDaYTINtbqkdM6IXycT-_FbbI,8954
389
+ sglang/srt/layers/quantization/petit_utils.py,sha256=-gy4zMhqNoIA1R0n7-5C0efV54jHonCUgPDUUFjGsyM,3245
390
+ sglang/srt/layers/quantization/qoq.py,sha256=jM96uJfKz3vo1B6SSIrQXNT3vnD3UJrepK2eY-tSQU4,8139
391
+ sglang/srt/layers/quantization/scalar_type.py,sha256=nBk4THjeRWMGW3hKWRdrjfQ0gwpuBxmYqapDBaRpnr4,12395
392
+ sglang/srt/layers/quantization/unquant.py,sha256=hzyGGJoclb1oANy3hYxrEK76F7V7LNjU2rd3NWDpeGg,13997
393
+ sglang/srt/layers/quantization/utils.py,sha256=9ZmfS0MMqueQ6zIxMIFoQy2OFBQ5vHjOHBgVvUn7ews,16213
394
+ sglang/srt/layers/quantization/w4afp8.py,sha256=r36F5f5tAan8omW2UYZwK7xIwZUAWYHBbwJtmIIVzIY,9672
395
+ sglang/srt/layers/quantization/w8a8_fp8.py,sha256=I_W9A4Pnluaf-SaT8zq-tAJTt1acpxfE_kG5mqdc5cE,10250
396
+ sglang/srt/layers/quantization/w8a8_int8.py,sha256=VGrVELArNuyw4FEtUefaeK8ayuX7cpXj1OOqCmOCzm4,34902
384
397
  sglang/srt/layers/quantization/compressed_tensors/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
385
- sglang/srt/layers/quantization/compressed_tensors/compressed_tensors.py,sha256=EaOKuIA0zXwqmH_eVhWeNdGJT9d1d9gVvFyYkgpdjDg,25665
386
- sglang/srt/layers/quantization/compressed_tensors/compressed_tensors_moe.py,sha256=w19mhCnOre3j6L2-Tc_sRtBPgwBOAKV4QmYLpzyU_Fk,26637
398
+ sglang/srt/layers/quantization/compressed_tensors/compressed_tensors.py,sha256=DsPCI82A4rqI6mjKo-WorIKUweppFV7-16Qku-zW9_g,25897
399
+ sglang/srt/layers/quantization/compressed_tensors/compressed_tensors_moe.py,sha256=vwcgwGuPhH2kHBfg7DnsndzffrbZx8xuFsl9Qeegd9s,24286
387
400
  sglang/srt/layers/quantization/compressed_tensors/utils.py,sha256=mnUmKWFQUnY8bVoFHUuNVwqsfS-cefeR-ofyaihCXcY,7621
388
401
  sglang/srt/layers/quantization/compressed_tensors/schemes/__init__.py,sha256=HWMTnmrj-mUCRXgcOwnnXLrvrAE-ONdPTSzSImjHCMA,347
389
402
  sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_scheme.py,sha256=tdKJC8c3SX8T3z8JL-1YCsg4ftcv55Wxt0vZrYftpX8,1635
@@ -546,11 +559,12 @@ sglang/srt/layers/quantization/deep_gemm_wrapper/compile_utils.py,sha256=BrzCCxX
546
559
  sglang/srt/layers/quantization/deep_gemm_wrapper/configurer.py,sha256=zkMzBAqQTSwG9TlGPuwmHV1yN0v5Y_5Hgyo0CKQDVNU,741
547
560
  sglang/srt/layers/quantization/deep_gemm_wrapper/entrypoint.py,sha256=On_uvP1ThxgQFAzOWKoteM0vIOHqmtI127A4qbPtmbc,3264
548
561
  sglang/srt/lora/layers.py,sha256=FaTYf0w3zbKKKAT1nJdAzGRtxvySB6FpNKXvEi5RHH0,12958
549
- sglang/srt/lora/lora.py,sha256=v4mkNOypfPXLW1mv_uKj2M-kR-CnzSmu0GReKafGSrc,9667
562
+ sglang/srt/lora/lora.py,sha256=sRoU7BdlTV4cnBv1-u3QjisVR9XQrrqAsmhxdNtd8dU,9433
550
563
  sglang/srt/lora/lora_config.py,sha256=qDgMTx_69jyJUl29O5FxLzYa0BMhqYVXWXfyyVOvGm0,1684
551
- sglang/srt/lora/lora_manager.py,sha256=sdfSP0o3u4sMlzaVO1N7xhprfydFG-VSutmtOFlu-cE,20060
552
- sglang/srt/lora/mem_pool.py,sha256=M4l4RO4tRjii5T4fq89nUoKJNHusaQHwvLrkryBCb1U,10132
553
- sglang/srt/lora/utils.py,sha256=f3eySsA2tqlzMkvqwtRPWKIRjDiMk6ZFh9CJfUYdeqI,5486
564
+ sglang/srt/lora/lora_manager.py,sha256=ABuqg1IhY9LNXgJd_v3Yx_VHS52t4SapHmhLiH1thdc,20147
565
+ sglang/srt/lora/lora_registry.py,sha256=q8HRG6YeWNKQFxbtaBlXSLGOgh0EtMAKPCKAsNEXdQQ,4747
566
+ sglang/srt/lora/mem_pool.py,sha256=UYvTgEPvBoVsaX5rEnipebOAlo75pML6_NO9GfCFzl8,12148
567
+ sglang/srt/lora/utils.py,sha256=5G0KiDEn-Zg4OgIOjWnU2ZdQGNstZswoAog9xU4GVDA,5660
554
568
  sglang/srt/lora/backend/base_backend.py,sha256=EIz8I-GIrdmK4fISw3ENhbJVVITaxKfyLxHXGPU4fPs,5044
555
569
  sglang/srt/lora/backend/flashinfer_backend.py,sha256=el6IAB4kTgDTbwCggmqFuukliyoapN5X6FLksG-4wJ8,4151
556
570
  sglang/srt/lora/backend/triton_backend.py,sha256=uqwBGlguXX8EkCKjSPqac6SPTgcKA31u3u6HkKPQcos,2530
@@ -559,158 +573,165 @@ sglang/srt/lora/triton_ops/gate_up_lora_b.py,sha256=QURCYxHNR8Ls4SQtt3dvdgjvdDVh
559
573
  sglang/srt/lora/triton_ops/qkv_lora_b.py,sha256=iz5scFNo2YFTeiM8beWg9Z1oZI-6AM_T1wBMCQ6qp2Q,6485
560
574
  sglang/srt/lora/triton_ops/sgemm_lora_a.py,sha256=Ksova04wgeGsFqGOXWqJtMYaHgyUYcx8VU42BZQOkVA,5129
561
575
  sglang/srt/lora/triton_ops/sgemm_lora_b.py,sha256=VqCAFvUtq_l-0RGIkx3W_fzD55QcW2FAcqpvSHOBFp4,5115
562
- sglang/srt/managers/cache_controller.py,sha256=HPQGLwjey6GeW60Vu6MVeLYtRsJrh99_-dqHYSzlBkE,13614
576
+ sglang/srt/managers/cache_controller.py,sha256=-je55waMGlOXvEKICJ9CQCRngSwhdae2agFJCwO2E7o,24503
563
577
  sglang/srt/managers/configure_logging.py,sha256=8sNXZ2z9pBWOwn-X3wyz013Ob8Nbm1zDxRkxoZjH-l4,1633
564
578
  sglang/srt/managers/data_parallel_controller.py,sha256=PZ-wOcAFn3PQqMB6I2vjIsFmplf0nlNl5hqTDKTHTG8,12112
565
579
  sglang/srt/managers/detokenizer_manager.py,sha256=SpLxTsSPKBZfD-ZMhJ5zpPPGuUb8PmcYgFSL9CsurU4,10696
566
- sglang/srt/managers/io_struct.py,sha256=DaRJxXiIAhp0Dz4FxScZkoflf4CSc6SdO9YP1hbPY2c,36582
567
- sglang/srt/managers/mm_utils.py,sha256=Pk6yWX7YThmulSjx7EWYuIKXm8Gvh0WdvPDsBHNApog,25500
580
+ sglang/srt/managers/io_struct.py,sha256=LNLG7utMidF63eYWlWYxQ3G2GzOqaQzQc-9ld2yaycI,37859
581
+ sglang/srt/managers/mm_utils.py,sha256=sHEOfM7T46btXHDArz5lS6pRL7gleAJpEz7l_z_MnWs,25476
568
582
  sglang/srt/managers/multimodal_processor.py,sha256=mzCrN-8H0bE0iMO8UzxmYmhE2M1qsbVJXGdhAYcjjYA,2016
569
- sglang/srt/managers/schedule_batch.py,sha256=T36ZokjgjzzV4VYKdxphY20O05j7DO7lrciknsW9-N0,73519
570
- sglang/srt/managers/schedule_policy.py,sha256=0T8URzQmLvEmG-42-SFBBl9WnsOSwYO8-_CcBpuD38M,20474
571
- sglang/srt/managers/scheduler.py,sha256=uaz-x3VrM77yeauYgVHYdu72iYK9Ct-qGY67j84ss5o,113502
572
- sglang/srt/managers/scheduler_output_processor_mixin.py,sha256=XAK2aeLleZBaLtzebEKdpaz9E7uKnHV7ywHSk_WPDYo,30148
583
+ sglang/srt/managers/schedule_batch.py,sha256=GC0Pmz9eBI3da1zN0EkNvEQiOyB-qiouTcqITLx7peU,76068
584
+ sglang/srt/managers/schedule_policy.py,sha256=BFYItMXtrsO5157tpFhYwLpZ8NSlzR4_gNZC1iE10D4,22400
585
+ sglang/srt/managers/scheduler.py,sha256=OrWS4M1z68igMpFF-UROXXGec1PJOMBeUwqeOCLoBaI,120513
586
+ sglang/srt/managers/scheduler_output_processor_mixin.py,sha256=Ei-9lyfrSQAlL9_ULuJLAhA7qpvUzjsBDzBBTDdnt4Q,31394
573
587
  sglang/srt/managers/session_controller.py,sha256=dzlMNZlo20FTSl64QqK7y7pElsdCy8ICOWWBPTBVwgs,6040
574
588
  sglang/srt/managers/template_manager.py,sha256=RrwRA2oqId_PMQ98qJQGwIxMroOxiorl2sGC9ARou_0,8543
575
- sglang/srt/managers/tokenizer_manager.py,sha256=MK7k23sOWnuq4_slZt2a_yvr3xVG-66ZKIy5-eBwlMI,74364
576
- sglang/srt/managers/tp_worker.py,sha256=kyk2EVd3eP0gpgVETJ6J_BdxIDbiB76AfpN4_-Xqkrs,10896
577
- sglang/srt/managers/tp_worker_overlap_thread.py,sha256=EFbtichmZjMoBgRa0AMIGdKGur1i8bpd3JvaDi-SsK8,10663
589
+ sglang/srt/managers/tokenizer_manager.py,sha256=EIBoSgTGKuvYTy_hwTRvw69sbKex7jqPaFuE3P0lXqY,74848
590
+ sglang/srt/managers/tp_worker.py,sha256=JEY1nJ6bx7IEYR-NlB2Ybuxw0dnD6N5G4XdFYOg4LQw,11257
591
+ sglang/srt/managers/tp_worker_overlap_thread.py,sha256=kK0pn8mz-XgLGvVlJK6LvDVp4lnFk5vJH-Cs9NQ5Un4,10959
578
592
  sglang/srt/managers/utils.py,sha256=9_VGE48EK0PXVJ26aYvbRJ6n7gIZALvCcf6uZCccCgM,1369
579
- sglang/srt/managers/multimodal_processors/qwen_audio.py,sha256=vUkXsa_Ipe_EjWPWDSSUrbm8v-fDenEy3w3fpHwaf2g,3170
580
- sglang/srt/mem_cache/allocator.py,sha256=MJUPQt4ECj4ReGeUVGVUNfwrwjHBbf3youdkyp3jCGQ,21633
581
- sglang/srt/mem_cache/base_prefix_cache.py,sha256=XHSzXKgBin-m1HsL47K-GobhLnajaGxqLqGtrLsWaZ0,2540
582
- sglang/srt/mem_cache/chunk_cache.py,sha256=MWo4DwRkHKOLKyow53YrGQdvn2dI7hVJuf2Gf-SPAr0,3110
593
+ sglang/srt/mem_cache/allocator.py,sha256=id4riucsG9d-P1ikj3-DLJbzhM8-MuJfvDmB8H4g9-o,23364
594
+ sglang/srt/mem_cache/base_prefix_cache.py,sha256=hLS2ncTMAz7Kpdk5pNwn5c6g8b61_K9OCBL4Vj1xsYc,2801
595
+ sglang/srt/mem_cache/chunk_cache.py,sha256=FU_fq8e_dodgU8EkRqE4Jr0sKwCXQnKmapO88k6_JfU,3207
583
596
  sglang/srt/mem_cache/flush_cache.py,sha256=GYcxmNXh4hsMpFfNOuCTpKilW7guZwTtAg_usVeM3J0,979
584
- sglang/srt/mem_cache/hiradix_cache.py,sha256=0jZEWFP4k5LkKMiCc-G0G9GD7oPoP9zNWaAFPMeVFSw,17137
585
- sglang/srt/mem_cache/memory_pool.py,sha256=EclwV8sNObkpw6lmIYwIFqq7jdTsbHS91H0Rt_IjPUo,40304
586
- sglang/srt/mem_cache/memory_pool_host.py,sha256=G_vmKQFw6jvPnaxjltRLXueDUjlqYgIdxRqoM1kTj5Q,8863
597
+ sglang/srt/mem_cache/hicache_storage.py,sha256=pvNeooVmCZBeZFgSHWNGPZzqtHI_qJ5BpTy_A4i6gg8,5539
598
+ sglang/srt/mem_cache/hiradix_cache.py,sha256=1cx4yT4Or7HyvC1Qpi-thEfPoht9lLE9dcgWQf8SDWc,24758
599
+ sglang/srt/mem_cache/memory_pool.py,sha256=jQdWgOr6hpMLbGaEJc4immBgZG_MZbx8LyOv029ASVw,40932
600
+ sglang/srt/mem_cache/memory_pool_host.py,sha256=xcjYyC94FOH_NguWbLUG4vF_CSBcxA_msuRsBasYCPo,10387
587
601
  sglang/srt/mem_cache/multimodal_cache.py,sha256=wZl2KeEl3xeoEsYdH33UoM-FO8kqfLo_XUgereJVvoM,1348
588
- sglang/srt/mem_cache/radix_cache.py,sha256=qZSsdlTVCZ3UCqkwe3IDYE07-QE72hYExIb2kbhyMmQ,18096
589
- sglang/srt/metrics/collector.py,sha256=C9QEJDOEdOPBwy2IJwFS3R6VbGzVzGs2xakKCCPvQDk,19903
602
+ sglang/srt/mem_cache/radix_cache.py,sha256=kp4JiVxh3eS4MsFxGKIYjYAb14B777qc1bHrABPqBMc,19101
603
+ sglang/srt/mem_cache/swa_radix_cache.py,sha256=4qt_gS7GuHiekd6VvKkx54dB2GHJzNA_kj71Np6jTDA,40300
604
+ sglang/srt/metrics/collector.py,sha256=FH6Wil2lMK7d7q74CfxfdULCaHKDXeAoo8UBZqqdepM,20289
590
605
  sglang/srt/metrics/func_timer.py,sha256=VFyNRrbnKVCwnQsrlLin1lITJfjQpf9m8sGPqL5LIsQ,3438
591
- sglang/srt/model_executor/cuda_graph_runner.py,sha256=3pc1_TpGmUAI51SxVubGGZIRuBmZrj8kOuch970RN2A,30505
592
- sglang/srt/model_executor/forward_batch_info.py,sha256=w2U4at0aQGdj7niBf2__aYG_2qAR2yDFfzm3nl1s7qo,29901
593
- sglang/srt/model_executor/model_runner.py,sha256=kfFWWHMXJ6X9WEQgEj618mx8zIc9qvhXC5-K2ICDPJM,65709
606
+ sglang/srt/model_executor/cuda_graph_runner.py,sha256=6njRGysrhBDi2bAt5DyjGnyrexYvuEVsAJwQBBW8Ut0,31886
607
+ sglang/srt/model_executor/forward_batch_info.py,sha256=NvUhReevoy6UfO4991P_5MPQyfefC3BOoTwTqUwMbYk,38430
608
+ sglang/srt/model_executor/model_runner.py,sha256=wVRFMda8oHYIeSfzINLlDMEQvff1uWMeJOwrS3U8_9Q,70162
594
609
  sglang/srt/model_loader/__init__.py,sha256=zGZkOBz1zx-pkaIy47BasL3fjDlAcxAXUTjInOhXHAE,919
595
- sglang/srt/model_loader/loader.py,sha256=xHeIiwhp26fOCkaegfWk_Gp6_E8eSAWvblY8xQKwGQ0,59562
596
- sglang/srt/model_loader/utils.py,sha256=zSZBPA9ErPmkf-HfCxJjhmiFwYueB15KUg7NFspLvPY,4454
610
+ sglang/srt/model_loader/loader.py,sha256=wxSUYrqv23w9yHYy9Lm0ozWggs9pf6Co4yqe1UO8PZk,59799
611
+ sglang/srt/model_loader/utils.py,sha256=svSrPQxViBz_-0_sByu4coCYrzJ51-4FCi_bFqa6rDo,4474
597
612
  sglang/srt/model_loader/weight_utils.py,sha256=dfepjK1lhcFoxX6Vflb3imiHaj9_Tep_uZ7j3lfN9jE,38004
598
613
  sglang/srt/models/baichuan.py,sha256=HbvlErnkCSK4pRQYCSDxMcrn-1DQyfiNoeDcnRrJas8,15807
599
614
  sglang/srt/models/bert.py,sha256=ODJe8YfNRP-hHsomFWk4_QpcuiSsNfjzGf256EDS0Pc,15802
600
615
  sglang/srt/models/chatglm.py,sha256=cajLN9caBl09e0TwOFkiTTKDqwlbmHo_yS-NCjdeQW8,13957
601
- sglang/srt/models/clip.py,sha256=mkdSNhc2SgRHyeq9tCLEjUGdnA8yS2EMMbMKSpn5dMs,19863
616
+ sglang/srt/models/clip.py,sha256=kOPSXnmgH_QKu2-ENn49HLDS9yf7Gm1HCOE_YvoNhlA,19858
602
617
  sglang/srt/models/commandr.py,sha256=5Y_b3K0QY7D37nFGkyiGgY38RleRui_GJUYcHSuHUZo,15315
603
618
  sglang/srt/models/dbrx.py,sha256=4pn_fdoATg01VEqNnIAxNEsKV5XU7gwHyd289eydq1s,15598
604
- sglang/srt/models/deepseek.py,sha256=ZnN02HdgXCB23Vno5V9UMUoOxH5HC82vNTwsVulUJ-o,17206
605
- sglang/srt/models/deepseek_janus_pro.py,sha256=nOUBFIpZpnQixcH6q18NPx7k2RSNdJOtEW1L6mnsCok,70423
619
+ sglang/srt/models/deepseek.py,sha256=sqobTr9a9c5pNLNJZE-WrJIE_qBq0lC5gCGv9NpGU_Q,17364
620
+ sglang/srt/models/deepseek_janus_pro.py,sha256=td8xGs6ARfJ8AQCYwUhMOZoWigrAs7m3trF5-kXCqik,70418
606
621
  sglang/srt/models/deepseek_nextn.py,sha256=47fehxRdiOizr0rdLg5f1fzQEx6gGAOcDcWKtblloyk,5928
607
- sglang/srt/models/deepseek_v2.py,sha256=KnGeJj_WEIntcQm67GK2NgYxyDNEurs3lTIOzDSsadQ,102964
608
- sglang/srt/models/deepseek_vl2.py,sha256=5xyOXHKTk9GrnpfJhQCSExfzdtztyt4A0BuFsjr2dW4,13068
622
+ sglang/srt/models/deepseek_v2.py,sha256=IG8hrn5j0o88mywclcyKe_djKLClC1Low6IDLNcQ23A,104131
623
+ sglang/srt/models/deepseek_vl2.py,sha256=7X3gI4DE7guUtNJvMLf06jO8MUHKa2Aan8evZg5hsXc,13061
609
624
  sglang/srt/models/exaone.py,sha256=TpO-rtCpEZ8Ua7hGFnS8l2oAYhY0Pij50grc9WQ2mvc,13576
610
- sglang/srt/models/gemma.py,sha256=4cdrPISg1VKnsuI-QPTpYvet4BrX8BMKvCIN82iLskw,12641
611
- sglang/srt/models/gemma2.py,sha256=kqtwdo93GWKm2iBN29RoIRH2ggRm-K_80LM5btgfBLo,16395
625
+ sglang/srt/models/gemma.py,sha256=2atKwFN5wCsJCmBRmURX9vaCcFjxlFirL7xsnG5KPlI,14180
626
+ sglang/srt/models/gemma2.py,sha256=lpHKN-ovN9IWz3iA9FsR5H86lGatectnM8sjx0GoinM,18033
612
627
  sglang/srt/models/gemma2_reward.py,sha256=V8U3_ADUHWPdOwvEe1jhGW-oJmBgL8t1TY3-67Ksv2A,2618
613
- sglang/srt/models/gemma3_causal.py,sha256=CJ2g08Ec7IeoObQIiGH0WIEtYOl05SbJ2g_pfJwSyBs,25130
614
- sglang/srt/models/gemma3_mm.py,sha256=oJnfckeiMWyTy-pwq5sPhmrIEatO23T7xUbYefSySq8,17194
628
+ sglang/srt/models/gemma3_causal.py,sha256=0FdI0wVoJ4ZakBl8ShO29D1uEMO0T8CRjdsfiHzCGY8,27424
629
+ sglang/srt/models/gemma3_mm.py,sha256=sRvdAOiStlDhC_-sSH226d0awx4ZQJG7Wtdf7PE6ygw,17189
615
630
  sglang/srt/models/gemma3n_audio.py,sha256=isgKfjA5UieYawxU6medL2ssXlzYPqAbagDBnLcemC0,36405
616
631
  sglang/srt/models/gemma3n_causal.py,sha256=kBDlpSWAg6ZDmUPe08Q7sj5CbdVD_0h07zwJw8sKu7I,36335
617
- sglang/srt/models/gemma3n_mm.py,sha256=REq6a63hXpEuxJ59yJDtPIXZkvd-1YcAtirnauptwsw,18735
632
+ sglang/srt/models/gemma3n_mm.py,sha256=pL_fvnkz9fKaC2Afms5KG3Me3u5sp1C2-mAUhqPGrQ4,18701
618
633
  sglang/srt/models/glm4.py,sha256=2VQzUqFkQTy_2nfkxP9SF6_9kKLTZUExGRjge7r99Es,11265
619
634
  sglang/srt/models/gpt2.py,sha256=kclhxEs8oJk1KCyhmAqo7rZqecVGGHYkc-a1WZi3aIk,9841
620
635
  sglang/srt/models/gpt_bigcode.py,sha256=1D6bi8Zu760gCRZkvdLHFcg8kCkY35ARwQYaMDtYhl4,10307
621
636
  sglang/srt/models/granite.py,sha256=5WOJyNYAlt5RNHSexNfPNihhSxIMd7wPzju1cTixKig,20852
622
- sglang/srt/models/grok.py,sha256=vESZeGS4adI_JAerXIkCcTm15-CNiGeS7VHc36C6w1A,28033
623
- sglang/srt/models/hunyuan.py,sha256=YRx9Zafs8HVTNHxlMMKdbV3ELMn6rWi9GKlk94U_R7E,28990
637
+ sglang/srt/models/granitemoe.py,sha256=diq5Xp_jg0RX5629iAu7eeTYPYOxfg95-FoKUQwt2Ic,13723
638
+ sglang/srt/models/grok.py,sha256=wY3flIJdr00wYvW-_PHXrXwh-R7vlTnf1UKhjPN8Egc,28199
639
+ sglang/srt/models/hunyuan.py,sha256=GVDeMKgcqW6HMFWPUukznL5JoDW4CpOpS5Q_PXlbHw8,31071
624
640
  sglang/srt/models/idefics2.py,sha256=U3khd3hbdawJeRNXsxmaKHdssOCT5TPOZ1D-2_zHoQo,12079
625
641
  sglang/srt/models/internlm2.py,sha256=F_iNY1gUqzAjAuUatcE47gnrcoTh5_08PY2Rw9tKr9M,13150
626
642
  sglang/srt/models/internlm2_reward.py,sha256=ndfGmyqYZbVZ7C7rJ-v9oK3wa-EpoBGybS8MlyKZi2E,2522
627
- sglang/srt/models/internvl.py,sha256=ZM5I_Dp0jaG29WfZD_S0tKZUStQm1C2C8_0WGRA0T7w,23338
628
- sglang/srt/models/kimi_vl.py,sha256=d1qOBRWmxKr-hywvF9Xl4UvW8lDDHS7zeGyZgjEZWEw,12882
643
+ sglang/srt/models/internvl.py,sha256=OeQy0wCXBdqXB98cx9TNJ64K2YdT0AVIX_1xVYa-Jbg,23333
644
+ sglang/srt/models/kimi_vl.py,sha256=XulRiufQzOSWZe8-bUl2OEdznvsVU9OBsEYipaX3YkM,12877
629
645
  sglang/srt/models/kimi_vl_moonvit.py,sha256=M5L7AJOJ2Zh2pqLZAq8aRqhbTSlipr8XOoD3ix6o2sU,23908
630
- sglang/srt/models/llama.py,sha256=Ok2Ombk80KQ8G17V2h2pz3XH_LBtO3TCW2aAAdN4k9E,27578
631
- sglang/srt/models/llama4.py,sha256=nF19fG2ZdT1bUX3pncckwJ9dRMSazNZx647EW__rBRo,18746
646
+ sglang/srt/models/llama.py,sha256=Nsxv2s1sOmLnZsTHkwbTh53cUFEQ2fnKDQi5BFbFcsk,28994
647
+ sglang/srt/models/llama4.py,sha256=J8zuYOrQ8iV7CyWuLdjFmOyi7eD4GA7iqiaoKzGO-N8,18797
632
648
  sglang/srt/models/llama_classification.py,sha256=4QWTFaUZIFKYZvEzs8bx8VkOZNIwdYCLrnwrdAw4QK0,3108
633
649
  sglang/srt/models/llama_eagle.py,sha256=Ubh_jmtfiOnriwvHgQT0ZGID7JvYvdSi_QGHOIkEgPE,5028
634
650
  sglang/srt/models/llama_eagle3.py,sha256=715soylDE3kOMWskbPy_70BFxaSc5ptaHCS1v3-ViA0,8579
635
651
  sglang/srt/models/llama_embedding.py,sha256=zq-_lNu35VBFc7eemiam0zdkGIE8fzrgk5OWYfirZnA,3254
636
652
  sglang/srt/models/llama_reward.py,sha256=LF2nqMV5XOrljGjAwJg43mBv3z6Q040I2EYlgZeCp8k,4681
637
- sglang/srt/models/llava.py,sha256=yx867BoTyWd_UPcVDbPhhDpHE243KfAtDHyUi5uAsec,37551
638
- sglang/srt/models/llavavid.py,sha256=nBGPuzN9okPk8Zy2cIjMRmx7VPJWfkB3DGKeo09Y8XU,12823
653
+ sglang/srt/models/llava.py,sha256=_UBDz_S8AObV39w0XWkCPNQTxHMc27KH9PJHz98kzx4,37541
654
+ sglang/srt/models/llavavid.py,sha256=-CSk0RJ2MQeb81sh-RISeVJFaI-XWY6nR6_I594MkME,12818
639
655
  sglang/srt/models/mimo.py,sha256=Mp-iFp4YHuiuq-H8enUF5K5QbMnVcvEa6mURH6vM3yM,6140
640
656
  sglang/srt/models/mimo_mtp.py,sha256=jSmqJAXu7G3OO7jW1oa2suI4H_Yl7u5ZT7w4lHFbHhg,7292
641
- sglang/srt/models/minicpm.py,sha256=m5HFsSJj0Po09LY9R6qj6K4gceqWDMOePz3NDGgMGT4,14691
657
+ sglang/srt/models/minicpm.py,sha256=CzBJyZtfMpp8jvlEl29DHI7HLVq-CxuqP1UHwxIbaUI,14567
642
658
  sglang/srt/models/minicpm3.py,sha256=6-gfHSfXwyB5zw7AIj-c5TzjpEKR6CM0H67MrD8LVUE,19347
643
- sglang/srt/models/minicpmo.py,sha256=HbtJ-Ds5nqzZqNdicotL5OnRnyS34U4CwfjHbQHc2j0,75945
644
- sglang/srt/models/minicpmv.py,sha256=W_ZlgT3BxB4PyTLhBdDyV_JAhTJgDQmDk8mxWI6c_mw,30399
645
- sglang/srt/models/mistral.py,sha256=Ox07RJpTYl-4Pb25UIghL_66o9TTA6lPmsUyent_Flc,3480
646
- sglang/srt/models/mixtral.py,sha256=n-Pz7fyWE4m6Uh7sjzAYKNr5Wy4QUj5Yekl0qiCwQI8,17055
659
+ sglang/srt/models/minicpmo.py,sha256=urYHq2sVgvswZtDA_pYFa4HWJv17rspn-DajmfgDr_Y,75868
660
+ sglang/srt/models/minicpmv.py,sha256=g4aAOG8PVGkZqGmlneVaScAtNpSLqSVbZGRAikyrBy8,30394
661
+ sglang/srt/models/mistral.py,sha256=ni7PppA_5X4ivTnIps3yoEaMEL-G6Gaf9b5hGC1vU5Q,3475
662
+ sglang/srt/models/mixtral.py,sha256=j2whKt4GdQqtpKL5iN0Vb4TO4el1E2qEpUCI57E_47Q,17222
647
663
  sglang/srt/models/mixtral_quant.py,sha256=UUIq7lpUonD9IoGePyl59oJYEcVwT9wUXvtVp5tjQ9Y,15406
648
- sglang/srt/models/mllama.py,sha256=pkS0UWiqKJHRsFtSZzpSI9O6B5_j1OtI5pf_nyDPp3U,39707
649
- sglang/srt/models/mllama4.py,sha256=Zq9WIOmtdtRy68LwsRXJ0NgaIAqAyBBsUdTZoCsptSY,20216
664
+ sglang/srt/models/mllama.py,sha256=OdX7brhyfGiMFPulxF77QOUi-Kcscg3Qo4ipyxzs9yA,39670
665
+ sglang/srt/models/mllama4.py,sha256=yt2YNE7S6buLAaqSfxD2LcJL1ZRzUzKWU21rCbzDzQo,20465
650
666
  sglang/srt/models/olmo.py,sha256=7-q_fA6XXdG7kPUjpUzYkzMUWJobuSjhqjYw9xSUs_c,12671
651
667
  sglang/srt/models/olmo2.py,sha256=azmljhJF4ivcQfUtfsAUxq3ducE4tRKTL6iwe0IKYMg,14327
652
- sglang/srt/models/olmoe.py,sha256=TMzt-yB891bvA4X50xL0NjNnFYSx9imlA7N1EG8KNK0,15949
668
+ sglang/srt/models/olmoe.py,sha256=WdPtyKsd3u8OpVsXmDwWuVpt1gTF0679IRkc1pvfnMM,16040
669
+ sglang/srt/models/persimmon.py,sha256=86Duo3HiZqDj9O2UzWbJgUEhQOXzGBUdhUofQhcs1VE,11244
670
+ sglang/srt/models/phi.py,sha256=n6A1d47MvnR1lmSsZ3TuzXk5kT1Lntj_YQ5uNvR0s5o,10287
653
671
  sglang/srt/models/phi3_small.py,sha256=eJb8aS_3KLObrq3PNkoIyVHaQ6SZTAJe42rbpC54QKg,16012
654
- sglang/srt/models/phi4mm.py,sha256=es6sQM6JOpfL1uR6DerK427Q4Hj7aE0RkIwhux3NZlU,19135
655
- sglang/srt/models/phimoe.py,sha256=R3uA1e9XbH2e4XP_GiH8mb7_288BC94w2XQcoQrjyfM,19026
672
+ sglang/srt/models/phi4mm.py,sha256=Yh2GnrT8zyvOTMPslHbhUlNOTAzZ6LuzMNxKaJjr38c,21107
673
+ sglang/srt/models/phi4mm_audio.py,sha256=0ChekwoYudAnbY0-JyNwz_inzMlxM8FmULqR9mwkPhQ,48877
674
+ sglang/srt/models/phi4mm_utils.py,sha256=bW3un4x3SHDvSkAOHQEFO286FGdOPeKhBpJCOmNlC9E,66956
675
+ sglang/srt/models/phimoe.py,sha256=RZzcNf3sunyoc0KyMpyd93gnn1Ni13bqO-xe00MJ-h0,19192
656
676
  sglang/srt/models/pixtral.py,sha256=ZkZrV0mEfmbBdgRko2AvsMFZbAVskgp_5a5p1xCSRN0,16835
657
- sglang/srt/models/qwen.py,sha256=xYkVmMZS2uMqWhfndc8EYm0olpKFnggfuMp_6aobVi4,10758
658
- sglang/srt/models/qwen2.py,sha256=2G-aT1izwYsi60NObMXjbsJjyYy_Blo1kjkgI65bYZo,21056
659
- sglang/srt/models/qwen2_5_vl.py,sha256=RxRDLV7F6J-q-QKKhvkafa8C0jc_PWohW9N25Rq46Mg,22737
660
- sglang/srt/models/qwen2_audio.py,sha256=linjXOVGhjyKk5DUx9Uw-BJa1N-YcqCFUpsj0Zr_98A,7877
677
+ sglang/srt/models/qwen.py,sha256=j0OU3JjznWi_TbayI09yYGM-Obov6mQzJO82Hs0qBGw,11868
678
+ sglang/srt/models/qwen2.py,sha256=0gnggs2q-_FtD75J-UM4KMNBXSapVQGz73B-C2yZHDg,22437
679
+ sglang/srt/models/qwen2_5_vl.py,sha256=vOuIyK_NLuGgz9LlAdyM7cSQUU93VnBCYXUr_n4iOLs,22708
680
+ sglang/srt/models/qwen2_audio.py,sha256=lVeYmC29eVZIR9I6ZjFe4xvC0wSXR0NtGCli6fSXtms,7870
661
681
  sglang/srt/models/qwen2_classification.py,sha256=dGrMm4ebd30_lBhHOhaV57ig2iOTx3nqB4GEzsrRIM8,2747
662
682
  sglang/srt/models/qwen2_eagle.py,sha256=6spFg6JYQGeUXLv2Q5eMkVzZvnqGyvW6SdVBtFMxlTM,4806
663
- sglang/srt/models/qwen2_moe.py,sha256=fmVDsb4ju0suMCZiDAhocPxO9gQecOWOxmdf-W1elvg,24239
683
+ sglang/srt/models/qwen2_moe.py,sha256=3OV_pR36OImR9U6H3hziSxDEIsPLKEAr_oO3hKzlNSc,25806
664
684
  sglang/srt/models/qwen2_rm.py,sha256=-mQXDEv11p-I1HXgYLTtY6ROem6UYorO958WsDrzsgs,2837
665
- sglang/srt/models/qwen2_vl.py,sha256=tm-k4vCWJa2lWppYrZxi_b6gCQm0HQKs-QTI13U0_tA,21383
666
- sglang/srt/models/qwen3.py,sha256=3alBwittpU5m44DnJZ5mjRM0x1UShepu2CREWotPYqA,17777
667
- sglang/srt/models/qwen3_moe.py,sha256=qP_UlowZPOOB9sALkRtaK3-gpXlsmgEJMaJ17bycpJ0,32867
685
+ sglang/srt/models/qwen2_vl.py,sha256=ZRAL32Ymt4ZCBqB0JorXAm4ZBrECZ9EbaXKaTSikkQM,21366
686
+ sglang/srt/models/qwen3.py,sha256=COSC1TsCQNTq3E1QoVJYj1yTn-CFEVEX7keRwrrBXLs,20121
687
+ sglang/srt/models/qwen3_moe.py,sha256=nSLBfzBzYQ6wpDmXPF2OV1v2kB1wTlnAV37LMj5guMQ,33911
668
688
  sglang/srt/models/registry.py,sha256=bH9H0OiNV0Cn7FRBM30Oh6dxICTs9mJscdLtHYPJvxc,3783
669
689
  sglang/srt/models/roberta.py,sha256=3k53V2Gbezk3jU-D03thXx8csGn5DxFK01ZQ9WFiWPI,9828
670
690
  sglang/srt/models/siglip.py,sha256=DIVJRwdtpLD2QT1kVPIHw7Bn9BE40xJbkHujDNzkjgA,9892
671
691
  sglang/srt/models/stablelm.py,sha256=0x_31uIr3WcWwecdPAI3ek9KkyKBJS7VwknTk2y0gjY,12281
672
692
  sglang/srt/models/torch_native_llama.py,sha256=oTxxof5Wx2b2egIwWx56LeHjtPGQleQ2zM5jXHMiuOU,19293
673
693
  sglang/srt/models/transformers.py,sha256=_CL0npi-_HvqzxkLgFhv2EE3bfGvCLXPYAtPFywZOr0,10260
674
- sglang/srt/models/vila.py,sha256=7HJjYw85riD5JvQdTA-UmhPJaoI4kfQIHP7HbbW_B6U,9851
694
+ sglang/srt/models/vila.py,sha256=3NiRHWOqXnCRjXmswAldsNtiE5zRILbScEsbhUzLZF4,9846
675
695
  sglang/srt/models/xverse.py,sha256=DsNVI9JpzN4jj0Ry6aTrj7r-xq5YLOoDX2kH4YLJA-I,14035
676
696
  sglang/srt/models/xverse_moe.py,sha256=7KCM2-j12towDMNvXkuuYiBOmNauH6NG4Ip40x0khqA,16782
677
697
  sglang/srt/models/yivl.py,sha256=oToK7-u5IGO7xwpJIQ7VtudlK6-zPqJX4bt6_wv0SH8,4850
678
698
  sglang/srt/multimodal/mm_utils.py,sha256=6bV1_a7Iet9W0y3qdd0E-hFM78zalIzNZCYbLzJX2y8,12640
679
- sglang/srt/multimodal/processors/base_processor.py,sha256=H3IospK9baMOtirUPnYFTA_FX3N7Uq4RlY2HGVSVHf0,24269
680
- sglang/srt/multimodal/processors/clip.py,sha256=chKReTXD4ETUQ0s7BOk_AmWHEZXR5no6fprrnHwSNIM,1271
681
- sglang/srt/multimodal/processors/deepseek_vl_v2.py,sha256=OlkkeqMyaqfmxKDSIg-0Y3JKAKjzBDJfTx6p_UytleM,3275
682
- sglang/srt/multimodal/processors/gemma3.py,sha256=Icn4wLs1JKiNXnZx7VFYDO88nk79Ht01GmsxSKfcv5A,2181
683
- sglang/srt/multimodal/processors/gemma3n.py,sha256=sacfdl3sU6bgbD6fXFoLzrG5Ti5tzWewjaUh2wb4dlU,3119
684
- sglang/srt/multimodal/processors/internvl.py,sha256=wy0fj4y9y7lUZo2hAACOb57eo5nmhJvSd1s2d-CpkNI,9328
685
- sglang/srt/multimodal/processors/janus_pro.py,sha256=e5VBoL-adxdKFkkXgC9X70ESZXIhtBhUEq1i0pqrn90,1907
686
- sglang/srt/multimodal/processors/kimi_vl.py,sha256=qLYonS4YwTB1yIz5D-dfZPJprtDzILueCAyMW6a7xLY,1656
687
- sglang/srt/multimodal/processors/llava.py,sha256=tIjeDPYxvMWUMXXLcfzzuaLPvdBtPrRzM25QzP0cnaE,7962
688
- sglang/srt/multimodal/processors/minicpm.py,sha256=_bejh4YQBuYy39IKzOgkQ0XRgmYqt9FhqXn5Z3d4wV8,5398
689
- sglang/srt/multimodal/processors/mlama.py,sha256=bW0hVPtRMqYz1RR2I19QtZLUTTPzInZv_6ZhVPJBieo,1406
690
- sglang/srt/multimodal/processors/mllama4.py,sha256=nAayC-mTpvooaqBC5pltaUMTXDgIpKFA8BzOXhptDZo,5597
691
- sglang/srt/multimodal/processors/phi4mm.py,sha256=iT-fBClMecI52yQTpfjxowvpRnBo9FBjJ83ieCFVROc,2331
692
- sglang/srt/multimodal/processors/pixtral.py,sha256=B8b30tiBClsALtgcqWDAgIGxd3uwr_8VqQx8xTvrsy8,4049
693
- sglang/srt/multimodal/processors/qwen_vl.py,sha256=hniJbL7tt7DkMvjMHnxFH4PPdkXpwHRcanXgrlyGb-Q,10731
694
- sglang/srt/multimodal/processors/vila.py,sha256=SL-O3WdBVIZcSO7NGnCRr_22KntPr6Qc-4jJbgvzN4M,2179
699
+ sglang/srt/multimodal/processors/base_processor.py,sha256=ZkMeNej7Mdlhu61DEcDCs7gcM8zUntzF_J4V_Q6yZ6c,23780
700
+ sglang/srt/multimodal/processors/clip.py,sha256=bpFaqQqNtjAriO-Do8pIYgYOwUh09JLC7cA4lx6X2Bs,1023
701
+ sglang/srt/multimodal/processors/deepseek_vl_v2.py,sha256=sdObVNZKXzlWlsuUKTR-NWdoAZHEHBTGCtOGfusNM5o,2535
702
+ sglang/srt/multimodal/processors/gemma3.py,sha256=wLLe6VnNs7CSW8uT2Gj0dPwszFXf2yRpY14GYNfFDq4,1952
703
+ sglang/srt/multimodal/processors/gemma3n.py,sha256=KHH3wp6zoCnlKiAh1wWn7ffvTqeT_ZuQZrBaayBHVsQ,3022
704
+ sglang/srt/multimodal/processors/internvl.py,sha256=wNXjIEyp3t4ls5GozRhUXebKClL1YXh5U52YK3H1TIE,9280
705
+ sglang/srt/multimodal/processors/janus_pro.py,sha256=bcsSBAS8joLQFtnRQ1b6SrQnVABVBNCXTkTPkmSgssA,1437
706
+ sglang/srt/multimodal/processors/kimi_vl.py,sha256=RKNOKZhEAqjeB-CWdgWjHHxtawsNR1WPHfYaEfCVkko,1531
707
+ sglang/srt/multimodal/processors/llava.py,sha256=3XnpfYdvW4GlO7NU0sBqwTd6zgSsn5fBndWcmsPgGXs,8029
708
+ sglang/srt/multimodal/processors/minicpm.py,sha256=uTfEjK1hdiGiZ-y4oEPByUP96omDQwnCbaWEWw-Acr4,5321
709
+ sglang/srt/multimodal/processors/mlama.py,sha256=l8_LG5_gLENAu92bKzNCzkA38b6tHv1oVoSpQWFJPv8,1199
710
+ sglang/srt/multimodal/processors/mllama4.py,sha256=N9Occ3NslKSQT4i8VaL-3mnkMrFAWTQad6cUArYHdoI,5573
711
+ sglang/srt/multimodal/processors/phi4mm.py,sha256=xZ7YYyVHdQ-bovh1SWLidZddxXV6Iw1Nz1yNt_li3I4,3823
712
+ sglang/srt/multimodal/processors/pixtral.py,sha256=RuLd5PTTPQSJ1tZT2YelW0-jx6P79wkZBWvCUz98VLM,3169
713
+ sglang/srt/multimodal/processors/qwen_audio.py,sha256=ILePOlBI5v8GI962q-pZ0dV-tkHrfpKeL81dWHeuO70,2333
714
+ sglang/srt/multimodal/processors/qwen_vl.py,sha256=6maMXOwX3QICy3YNVSAF4VwxrZHCT4XH0MAAXIwIaeM,10464
715
+ sglang/srt/multimodal/processors/vila.py,sha256=Dj66JpKbSdqpLNfk-NykYjhGAGuzBeMo7lFVCkeHkAM,2142
695
716
  sglang/srt/sampling/custom_logit_processor.py,sha256=AwODYVJdRkcQ8PGtJrhzKsqAgn8XZLQbAmR9fGiQzmc,1608
696
- sglang/srt/sampling/sampling_batch_info.py,sha256=m8m-mXu3N8hLYFhAkRopePDT5Ozkd4KAmWDgM_9_4iA,14536
697
- sglang/srt/sampling/sampling_params.py,sha256=L2cU3MhAo9OvfdEtTdJidp9nTOkD6tiwlegxQ5vgIfU,6127
717
+ sglang/srt/sampling/sampling_batch_info.py,sha256=Duk4Fp99QZyOFld3i4AGwkW9FlULY86CNKv6v0_kA4w,14683
718
+ sglang/srt/sampling/sampling_params.py,sha256=HbVcCeSXgPW19MRB-v0FTG1D-zHDAY6-toxyndSl-zI,6462
698
719
  sglang/srt/sampling/penaltylib/__init__.py,sha256=mtN8grFEcaBUhl4yBHmw8NNirt_i6uKO2cDNLHOpZQE,496
699
720
  sglang/srt/sampling/penaltylib/frequency_penalty.py,sha256=Loc3qjJTksNc5s-DV7QZHjgqoo5pxk7-nZzxwyhD2tQ,2144
700
721
  sglang/srt/sampling/penaltylib/min_new_tokens.py,sha256=rdU_D7RoIcrQPhysNQEzmr4TO2OoEi___p-i3QdwkgU,3331
701
722
  sglang/srt/sampling/penaltylib/orchestrator.py,sha256=XM-Lm6u7gYPtMZrTIc0FR4QxNZxBH5s_Cj82umyCzYk,5721
702
723
  sglang/srt/sampling/penaltylib/presence_penalty.py,sha256=NRh10AJrrQlGJ6S-enGdRefrTrWpyqrSm-aNnyqQNQQ,2119
703
724
  sglang/srt/speculative/build_eagle_tree.py,sha256=O9LJNaBflgJdWT94D-rGH1gJFJ18nst2oOD8HnA2mZ4,12859
704
- sglang/srt/speculative/eagle_draft_cuda_graph_runner.py,sha256=fSNaHYJOQUgy2_AHRlZPYSQRIMgSiL_Pz5h53eothx4,14239
705
- sglang/srt/speculative/eagle_draft_extend_cuda_graph_runner.py,sha256=sdIHbcWwgsXDoo64-T5veDuYB5eHC9QBwu2Ns29SCSI,14930
706
- sglang/srt/speculative/eagle_utils.py,sha256=cBQYqryCr4is5E_16xIcUue0Q2_Mn4meY8NCyuu4RAg,45558
707
- sglang/srt/speculative/eagle_worker.py,sha256=iOwloJqhYIrgBdnZQz9NV3zuiAe5dXJJa0QeSIg92x8,38180
725
+ sglang/srt/speculative/eagle_draft_cuda_graph_runner.py,sha256=kVqMGj25jxtJlP-nTSlq_QJgoabFqKOU7-0WeUFhvw8,14509
726
+ sglang/srt/speculative/eagle_draft_extend_cuda_graph_runner.py,sha256=hLjaD66K3ZE5SWsjvSiSdSexQ55F3EuSnfb4oe7rrSY,15261
727
+ sglang/srt/speculative/eagle_utils.py,sha256=x5MKA2GkecNAXE58KKhPJRy5KxCLhRkD-C_kVSZIyzc,46433
728
+ sglang/srt/speculative/eagle_worker.py,sha256=8yPQZxpBvcr--Ooo4nov3LqzkLRL-GOLJlwu91wMAmQ,38650
708
729
  sglang/srt/speculative/spec_info.py,sha256=rhaKG0TzyF9XZYHEWp1jccwTBohSNsUDvxHFtAoOl18,709
709
730
  sglang/test/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
710
731
  sglang/test/few_shot_gsm8k.py,sha256=qnEejCyPHGEMBEiNc7T4-t9lvoo2DNN72RXw-ei_TnY,4300
711
732
  sglang/test/few_shot_gsm8k_engine.py,sha256=Yf1Dg0Tk-tY4v1oj_UTxJ7950CWn6kRMbQKDjT2Orgo,3902
712
733
  sglang/test/run_eval.py,sha256=K4Z3OdMPvLeuGJhWWTBD0F-MOUFeBYLvsPnDQ44bd18,4036
713
- sglang/test/runners.py,sha256=BmIxB7H5N0ib1Tmc88L2gLuRYpat_lkxAewtjA1fjbE,32804
734
+ sglang/test/runners.py,sha256=kRperGVKBW6pS05iOqZ1plSaWb4lX3tmHQOnPRd137c,33473
714
735
  sglang/test/send_one.py,sha256=XNZdfZs21tXDBwrDj2pq46WQd5smiKoYETY8U09c1Z8,5079
715
736
  sglang/test/simple_eval_common.py,sha256=OW4Z7O33QqDySRFuHIC4Ouidfup4eaOEuR9i7xJzkDY,12379
716
737
  sglang/test/simple_eval_gpqa.py,sha256=8Xt9Bw05c7SZTYrCZgB68OZUqUbLo69ywiyx0bTvSUk,3220
@@ -718,25 +739,27 @@ sglang/test/simple_eval_humaneval.py,sha256=s8YuKIBkNUEOBP4XKsTMRdXGv5aRhl0oJyl-
718
739
  sglang/test/simple_eval_math.py,sha256=6kGKNwNbLN-Af3Wj8WTimWhH-Xp3enDmSvvSjsgWUpk,2550
719
740
  sglang/test/simple_eval_mgsm.py,sha256=rd7TSUyxdKbrXaVoewo24V8lCo_6kO8zxPhhmvylpw8,10259
720
741
  sglang/test/simple_eval_mmlu.py,sha256=FkwamjGMjueTixymkedF-YiPloSLiy4ftILFUrKZ9XI,4357
721
- sglang/test/test_activation.py,sha256=GeTIJHxlLQfW3kM-X1FGa8Sa3dSGKHEXl5wEy-hfGis,1489
722
- sglang/test/test_block_fp8.py,sha256=1qBD-FJr5UaR9e5qDz91vDrS_DT1utnk82qeQ2bm-1E,21630
742
+ sglang/test/test_activation.py,sha256=bDBFl4Y30siXj7Ifl66fc2HytOrcZdHFiP2i9K8TIsY,3140
743
+ sglang/test/test_block_fp8.py,sha256=hd3GXuC_wxn0HGAN3KCs6Nxf98AHO8XaRvGsvWS-CHc,21822
723
744
  sglang/test/test_block_fp8_deep_gemm_blackwell.py,sha256=Hnhq4kkyINHb4ONedkp5Kf7Xx0MjOoOBYL8J7ETvOVA,8180
724
- sglang/test/test_block_fp8_ep.py,sha256=Ufq6p32sb1RSbFKaSnsVF8RrqqwwAACBUgOJTEH2Lbc,10856
725
- sglang/test/test_custom_ops.py,sha256=2bSo9P5_rJZYFq8Y8IKRimDfFyZZGJluhL7Ngny0Pf4,5571
745
+ sglang/test/test_block_fp8_ep.py,sha256=XGZEs7cJiLjatRZcdcav4aFIQxnQB8Vq-b3HmAsw-Ww,10859
746
+ sglang/test/test_custom_ops.py,sha256=PenQ8zM1wj5xwiVEPVzD37pO-x90aOfFMpCRZenaKsY,5709
726
747
  sglang/test/test_cutlass_moe.py,sha256=beXdvpwpHh0O8fpLW-RV3Bx8Wu0lRFG_SNkL3Op5ITA,9905
727
- sglang/test/test_cutlass_w4a8_moe.py,sha256=LmeSS7BrKO6-1mnksOqmo0nvJ_y3oeeiT5ytRkHk2A0,8780
748
+ sglang/test/test_cutlass_w4a8_moe.py,sha256=u4Fk2Kdu5yodhsPuiwTIJlWCpWgW5vMBmd1EDwdkDXw,8724
728
749
  sglang/test/test_deepep_utils.py,sha256=749ysTBGNzh6rYUCJhhZBtZpeD15eWTeNHYCytcvZtc,7448
729
750
  sglang/test/test_dynamic_grad_mode.py,sha256=L76yUCuk_ymNpXD2CmO8r2GiGjIvD_gtTsuFDs2NolI,1638
730
- sglang/test/test_fp4_moe.py,sha256=U4LHzpGl6pCiCZiENRPxVP6hxqkqRZ_0WXbB29vYeAo,8187
751
+ sglang/test/test_fp4_moe.py,sha256=yOYpn1dAztaRMBQYzsxU8222HZe2V_tg0Pz_gy9PNY0,8131
731
752
  sglang/test/test_layernorm.py,sha256=2GMWqqNDuGvSMSsEBF5eDCzwVSYA9E6hGhRo6s4ecKg,3764
753
+ sglang/test/test_marlin_moe.py,sha256=PITMGcGF4ci2csXJejdLSNuxpURnFmcflsipAZsGakU,7991
754
+ sglang/test/test_marlin_utils.py,sha256=gFMJwxbfEEJDeHI-HU5FDF9FFqqcM-yahK0TWyVIVgQ,5171
732
755
  sglang/test/test_programs.py,sha256=DJIbTChloPwaDiEWHQoSTuKv3BGx0-K8Y5e1mDDTACM,18910
733
- sglang/test/test_utils.py,sha256=u3L0E_5Evrv7Wjss_ZMNnro4HwMStQcUvg6cQvL_eBY,36778
756
+ sglang/test/test_utils.py,sha256=dnn2PUNoN4VX6glRlx3MmtTIqkoz3eisYa9VOYNfodU,37840
734
757
  sglang/test/attention/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
735
758
  sglang/test/attention/test_flashattn_backend.py,sha256=_rTG849FwQdVTyGKkqhczaOqngBmRWXFmkl5NnuK1GM,13914
736
759
  sglang/test/attention/test_flashattn_mla_backend.py,sha256=g4O50WblTpM7_Gq2b76k0i25_z01BOUBQ4i6PmyxpO4,10774
737
760
  sglang/test/attention/test_prefix_chunk_info.py,sha256=hpoDe2wfSa6RlUbfyri_c0iyBTb35UXGL9I2Xh6jamM,7772
738
- sglang-0.4.9.post2.dist-info/licenses/LICENSE,sha256=FJXh51fvTQklojUFY89XVLsjxRcBqOxPs8XNy-2uZ0c,11346
739
- sglang-0.4.9.post2.dist-info/METADATA,sha256=_Z1MAQxdNmJPXSJy0-sGf6MKxRciuhUY4BWxIDVqqCM,27276
740
- sglang-0.4.9.post2.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
741
- sglang-0.4.9.post2.dist-info/top_level.txt,sha256=yxhh3pYQkcnA7v3Bg889C2jZhvtJdEincysO7PEB09M,7
742
- sglang-0.4.9.post2.dist-info/RECORD,,
761
+ sglang-0.4.9.post4.dist-info/licenses/LICENSE,sha256=FJXh51fvTQklojUFY89XVLsjxRcBqOxPs8XNy-2uZ0c,11346
762
+ sglang-0.4.9.post4.dist-info/METADATA,sha256=moSWmWQPcs4bmIJ3FodeQnGZEf9NdVMbJLQlXXX4EAA,27348
763
+ sglang-0.4.9.post4.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
764
+ sglang-0.4.9.post4.dist-info/top_level.txt,sha256=yxhh3pYQkcnA7v3Bg889C2jZhvtJdEincysO7PEB09M,7
765
+ sglang-0.4.9.post4.dist-info/RECORD,,