sglang 0.4.8.post1__py3-none-any.whl → 0.4.9__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (141) hide show
  1. sglang/bench_one_batch_server.py +17 -2
  2. sglang/bench_serving.py +168 -22
  3. sglang/srt/configs/internvl.py +4 -2
  4. sglang/srt/configs/janus_pro.py +1 -1
  5. sglang/srt/configs/model_config.py +48 -0
  6. sglang/srt/configs/update_config.py +119 -0
  7. sglang/srt/conversation.py +34 -0
  8. sglang/srt/disaggregation/decode.py +21 -5
  9. sglang/srt/disaggregation/nixl/conn.py +6 -6
  10. sglang/srt/disaggregation/prefill.py +2 -2
  11. sglang/srt/disaggregation/utils.py +1 -1
  12. sglang/srt/distributed/parallel_state.py +44 -17
  13. sglang/srt/entrypoints/EngineBase.py +8 -0
  14. sglang/srt/entrypoints/engine.py +40 -6
  15. sglang/srt/entrypoints/http_server.py +111 -24
  16. sglang/srt/entrypoints/openai/protocol.py +4 -2
  17. sglang/srt/eplb/__init__.py +0 -0
  18. sglang/srt/{managers → eplb}/eplb_algorithms/__init__.py +1 -1
  19. sglang/srt/{managers → eplb}/eplb_manager.py +2 -4
  20. sglang/srt/{eplb_simulator → eplb/eplb_simulator}/reader.py +1 -1
  21. sglang/srt/{managers → eplb}/expert_distribution.py +1 -5
  22. sglang/srt/{managers → eplb}/expert_location.py +1 -1
  23. sglang/srt/{managers → eplb}/expert_location_dispatch.py +1 -1
  24. sglang/srt/{model_executor → eplb}/expert_location_updater.py +17 -1
  25. sglang/srt/hf_transformers_utils.py +2 -1
  26. sglang/srt/layers/activation.py +2 -2
  27. sglang/srt/layers/amx_utils.py +86 -0
  28. sglang/srt/layers/attention/ascend_backend.py +219 -0
  29. sglang/srt/layers/attention/flashattention_backend.py +32 -9
  30. sglang/srt/layers/attention/tbo_backend.py +37 -9
  31. sglang/srt/layers/communicator.py +18 -2
  32. sglang/srt/layers/dp_attention.py +9 -3
  33. sglang/srt/layers/elementwise.py +76 -12
  34. sglang/srt/layers/flashinfer_comm_fusion.py +202 -0
  35. sglang/srt/layers/layernorm.py +26 -0
  36. sglang/srt/layers/linear.py +84 -14
  37. sglang/srt/layers/logits_processor.py +4 -4
  38. sglang/srt/layers/moe/ep_moe/kernels.py +23 -8
  39. sglang/srt/layers/moe/ep_moe/layer.py +36 -13
  40. sglang/srt/layers/moe/ep_moe/token_dispatcher.py +23 -17
  41. sglang/srt/layers/moe/fused_moe_triton/fused_moe.py +1 -2
  42. sglang/srt/layers/moe/fused_moe_triton/layer.py +76 -16
  43. sglang/srt/layers/moe/router.py +60 -22
  44. sglang/srt/layers/moe/topk.py +10 -28
  45. sglang/srt/layers/parameter.py +67 -7
  46. sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a16_fp8.py +1 -1
  47. sglang/srt/layers/quantization/fp8.py +44 -0
  48. sglang/srt/layers/quantization/fp8_kernel.py +1 -1
  49. sglang/srt/layers/quantization/fp8_utils.py +1 -2
  50. sglang/srt/layers/quantization/gptq.py +5 -1
  51. sglang/srt/layers/quantization/moe_wna16.py +1 -1
  52. sglang/srt/layers/quantization/quant_utils.py +166 -0
  53. sglang/srt/layers/quantization/w8a8_int8.py +52 -1
  54. sglang/srt/layers/rotary_embedding.py +2 -2
  55. sglang/srt/layers/vocab_parallel_embedding.py +11 -7
  56. sglang/srt/lora/lora.py +4 -5
  57. sglang/srt/lora/lora_manager.py +73 -20
  58. sglang/srt/managers/configure_logging.py +1 -1
  59. sglang/srt/managers/io_struct.py +50 -13
  60. sglang/srt/managers/mm_utils.py +73 -59
  61. sglang/srt/managers/multimodal_processor.py +2 -6
  62. sglang/srt/managers/multimodal_processors/qwen_audio.py +94 -0
  63. sglang/srt/managers/schedule_batch.py +77 -84
  64. sglang/srt/managers/scheduler.py +113 -59
  65. sglang/srt/managers/scheduler_output_processor_mixin.py +8 -2
  66. sglang/srt/managers/session_controller.py +12 -3
  67. sglang/srt/managers/tokenizer_manager.py +314 -103
  68. sglang/srt/managers/tp_worker.py +13 -1
  69. sglang/srt/managers/tp_worker_overlap_thread.py +8 -0
  70. sglang/srt/mem_cache/allocator.py +290 -0
  71. sglang/srt/mem_cache/chunk_cache.py +34 -2
  72. sglang/srt/mem_cache/memory_pool.py +289 -3
  73. sglang/srt/mem_cache/multimodal_cache.py +3 -0
  74. sglang/srt/model_executor/cuda_graph_runner.py +2 -1
  75. sglang/srt/model_executor/forward_batch_info.py +17 -4
  76. sglang/srt/model_executor/model_runner.py +297 -56
  77. sglang/srt/model_loader/loader.py +41 -0
  78. sglang/srt/model_loader/weight_utils.py +72 -4
  79. sglang/srt/models/deepseek_nextn.py +1 -3
  80. sglang/srt/models/deepseek_v2.py +181 -45
  81. sglang/srt/models/deepseek_vl2.py +3 -5
  82. sglang/srt/models/gemma3_causal.py +1 -2
  83. sglang/srt/models/gemma3n_causal.py +4 -3
  84. sglang/srt/models/gemma3n_mm.py +4 -20
  85. sglang/srt/models/hunyuan.py +1 -1
  86. sglang/srt/models/kimi_vl.py +1 -2
  87. sglang/srt/models/llama.py +10 -4
  88. sglang/srt/models/llama4.py +32 -45
  89. sglang/srt/models/llama_eagle3.py +61 -11
  90. sglang/srt/models/llava.py +5 -5
  91. sglang/srt/models/minicpmo.py +2 -2
  92. sglang/srt/models/mistral.py +1 -1
  93. sglang/srt/models/mllama4.py +43 -11
  94. sglang/srt/models/phi4mm.py +1 -3
  95. sglang/srt/models/pixtral.py +3 -7
  96. sglang/srt/models/qwen2.py +31 -3
  97. sglang/srt/models/qwen2_5_vl.py +1 -3
  98. sglang/srt/models/qwen2_audio.py +200 -0
  99. sglang/srt/models/qwen2_moe.py +32 -6
  100. sglang/srt/models/qwen2_vl.py +1 -4
  101. sglang/srt/models/qwen3.py +94 -25
  102. sglang/srt/models/qwen3_moe.py +68 -21
  103. sglang/srt/models/vila.py +3 -8
  104. sglang/srt/{managers/multimodal_processors → multimodal/processors}/base_processor.py +140 -158
  105. sglang/srt/{managers/multimodal_processors → multimodal/processors}/clip.py +2 -13
  106. sglang/srt/{managers/multimodal_processors → multimodal/processors}/deepseek_vl_v2.py +4 -11
  107. sglang/srt/{managers/multimodal_processors → multimodal/processors}/gemma3.py +3 -10
  108. sglang/srt/{managers/multimodal_processors → multimodal/processors}/gemma3n.py +5 -20
  109. sglang/srt/{managers/multimodal_processors → multimodal/processors}/internvl.py +3 -10
  110. sglang/srt/{managers/multimodal_processors → multimodal/processors}/janus_pro.py +3 -9
  111. sglang/srt/{managers/multimodal_processors → multimodal/processors}/kimi_vl.py +6 -13
  112. sglang/srt/{managers/multimodal_processors → multimodal/processors}/llava.py +2 -10
  113. sglang/srt/{managers/multimodal_processors → multimodal/processors}/minicpm.py +5 -12
  114. sglang/srt/{managers/multimodal_processors → multimodal/processors}/mlama.py +2 -14
  115. sglang/srt/{managers/multimodal_processors → multimodal/processors}/mllama4.py +3 -6
  116. sglang/srt/{managers/multimodal_processors → multimodal/processors}/phi4mm.py +4 -14
  117. sglang/srt/{managers/multimodal_processors → multimodal/processors}/pixtral.py +3 -9
  118. sglang/srt/{managers/multimodal_processors → multimodal/processors}/qwen_vl.py +8 -14
  119. sglang/srt/{managers/multimodal_processors → multimodal/processors}/vila.py +13 -31
  120. sglang/srt/operations_strategy.py +6 -2
  121. sglang/srt/reasoning_parser.py +26 -0
  122. sglang/srt/sampling/sampling_batch_info.py +39 -1
  123. sglang/srt/server_args.py +69 -22
  124. sglang/srt/speculative/build_eagle_tree.py +57 -18
  125. sglang/srt/speculative/eagle_worker.py +6 -4
  126. sglang/srt/two_batch_overlap.py +200 -27
  127. sglang/srt/utils.py +306 -146
  128. sglang/srt/warmup.py +12 -3
  129. sglang/test/runners.py +10 -1
  130. sglang/test/test_utils.py +15 -3
  131. sglang/version.py +1 -1
  132. {sglang-0.4.8.post1.dist-info → sglang-0.4.9.dist-info}/METADATA +9 -6
  133. {sglang-0.4.8.post1.dist-info → sglang-0.4.9.dist-info}/RECORD +140 -133
  134. sglang/math_utils.py +0 -8
  135. /sglang/srt/{managers → eplb}/eplb_algorithms/deepseek.py +0 -0
  136. /sglang/srt/{managers → eplb}/eplb_algorithms/deepseek_vec.py +0 -0
  137. /sglang/srt/{eplb_simulator → eplb/eplb_simulator}/__init__.py +0 -0
  138. /sglang/srt/{mm_utils.py → multimodal/mm_utils.py} +0 -0
  139. {sglang-0.4.8.post1.dist-info → sglang-0.4.9.dist-info}/WHEEL +0 -0
  140. {sglang-0.4.8.post1.dist-info → sglang-0.4.9.dist-info}/licenses/LICENSE +0 -0
  141. {sglang-0.4.8.post1.dist-info → sglang-0.4.9.dist-info}/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: sglang
3
- Version: 0.4.8.post1
3
+ Version: 0.4.9
4
4
  Summary: SGLang is yet another fast serving framework for large language models and vision language models.
5
5
  License: Apache License
6
6
  Version 2.0, January 2004
@@ -219,6 +219,7 @@ Requires-Dist: IPython
219
219
  Requires-Dist: setproctitle
220
220
  Provides-Extra: runtime-common
221
221
  Requires-Dist: blobfile==3.0.0; extra == "runtime-common"
222
+ Requires-Dist: build; extra == "runtime-common"
222
223
  Requires-Dist: compressed-tensors; extra == "runtime-common"
223
224
  Requires-Dist: datasets; extra == "runtime-common"
224
225
  Requires-Dist: fastapi; extra == "runtime-common"
@@ -243,19 +244,20 @@ Requires-Dist: pyzmq>=25.1.2; extra == "runtime-common"
243
244
  Requires-Dist: soundfile==0.13.1; extra == "runtime-common"
244
245
  Requires-Dist: scipy; extra == "runtime-common"
245
246
  Requires-Dist: torchao==0.9.0; extra == "runtime-common"
246
- Requires-Dist: transformers==4.52.3; extra == "runtime-common"
247
+ Requires-Dist: transformers==4.53.0; extra == "runtime-common"
248
+ Requires-Dist: timm==1.0.16; extra == "runtime-common"
247
249
  Requires-Dist: uvicorn; extra == "runtime-common"
248
250
  Requires-Dist: uvloop; extra == "runtime-common"
249
251
  Requires-Dist: xgrammar==0.1.19; extra == "runtime-common"
250
252
  Provides-Extra: srt
251
253
  Requires-Dist: sglang[runtime_common]; extra == "srt"
252
- Requires-Dist: sgl-kernel==0.1.9; extra == "srt"
254
+ Requires-Dist: sgl-kernel==0.2.4; extra == "srt"
253
255
  Requires-Dist: torch==2.7.1; extra == "srt"
254
256
  Requires-Dist: torchaudio==2.7.1; extra == "srt"
255
257
  Requires-Dist: torchvision==0.22.1; extra == "srt"
256
258
  Requires-Dist: cuda-python; extra == "srt"
257
259
  Requires-Dist: einops; extra == "srt"
258
- Requires-Dist: flashinfer_python==0.2.6.post1; extra == "srt"
260
+ Requires-Dist: flashinfer_python==0.2.7.post1; extra == "srt"
259
261
  Provides-Extra: blackwell
260
262
  Requires-Dist: sglang[runtime_common]; extra == "blackwell"
261
263
  Requires-Dist: sgl-kernel; extra == "blackwell"
@@ -264,7 +266,7 @@ Requires-Dist: torchaudio==2.7.1; extra == "blackwell"
264
266
  Requires-Dist: torchvision==0.22.1; extra == "blackwell"
265
267
  Requires-Dist: cuda-python; extra == "blackwell"
266
268
  Requires-Dist: einops; extra == "blackwell"
267
- Requires-Dist: flashinfer_python==0.2.6.post1; extra == "blackwell"
269
+ Requires-Dist: flashinfer_python==0.2.7.post1; extra == "blackwell"
268
270
  Provides-Extra: srt-hip
269
271
  Requires-Dist: sglang[runtime_common]; extra == "srt-hip"
270
272
  Requires-Dist: torch; extra == "srt-hip"
@@ -295,7 +297,6 @@ Requires-Dist: jsonlines; extra == "test"
295
297
  Requires-Dist: matplotlib; extra == "test"
296
298
  Requires-Dist: pandas; extra == "test"
297
299
  Requires-Dist: peft; extra == "test"
298
- Requires-Dist: timm; extra == "test"
299
300
  Requires-Dist: sentence_transformers; extra == "test"
300
301
  Provides-Extra: all
301
302
  Requires-Dist: sglang[srt]; extra == "all"
@@ -373,6 +374,8 @@ Dynamic: license-file
373
374
  | [**Slides**](https://github.com/sgl-project/sgl-learning-materials?tab=readme-ov-file#slides) |
374
375
 
375
376
  ## News
377
+ - [2025/06] 🔥 SGLang, the high-performance serving infrastructure powering trillions of tokens daily, has been awarded the third batch of the Open Source AI Grant by a16z ([a16z blog](https://a16z.com/advancing-open-source-ai-through-benchmarks-and-bold-experimentation/)).
378
+ - [2025/06] 🔥 Deploying DeepSeek on GB200 NVL72 with PD and Large Scale EP (Part I): 2.7x Higher Decoding Throughput ([blog](https://lmsys.org/blog/2025-06-16-gb200-part-1/)).
376
379
  - [2025/05] 🔥 Deploying DeepSeek with PD Disaggregation and Large-scale Expert Parallelism on 96 H100 GPUs ([blog](https://lmsys.org/blog/2025-05-05-large-scale-ep/)).
377
380
  - [2025/03] Supercharge DeepSeek-R1 Inference on AMD Instinct MI300X ([AMD blog](https://rocm.blogs.amd.com/artificial-intelligence/DeepSeekR1-Part2/README.html))
378
381
  - [2025/03] SGLang Joins PyTorch Ecosystem: Efficient LLM Serving Engine ([PyTorch blog](https://pytorch.org/blog/sglang-joins-pytorch/))
@@ -2,16 +2,15 @@ sglang/__init__.py,sha256=x1v8748WXS2BAptWAd5fR3YBEkngC7e_P_rkCNuNCGg,1702
2
2
  sglang/api.py,sha256=rcp3GeoyZhmJ0GDLPRkuZNcxd0TBJy_wfUDpcmQoqW8,7210
3
3
  sglang/bench_offline_throughput.py,sha256=TwgXZYmwPaHVsdPtNU9LO0p1tr5OOKLy9wYgrfGAlFU,14056
4
4
  sglang/bench_one_batch.py,sha256=RJsXQ7pvq8y4yzW7svURtWZF5RiawxEMrsjV0OcKsrk,19388
5
- sglang/bench_one_batch_server.py,sha256=4Jbs8UI-Sbt3TL3SJBC3fySZPe4apz2glKWOvvaYsQQ,13486
6
- sglang/bench_serving.py,sha256=EzZn91DuScAEhUMQv-LPWm3UoGjzj8OEzHMzVwoEA34,65672
5
+ sglang/bench_one_batch_server.py,sha256=LS1BRmFwP67IpYlU5wmkWjqquiA5drvtWe-fwHnFSKI,14170
6
+ sglang/bench_serving.py,sha256=sQKEgJZIfHRu3vNh8QWqIrTQzOfUMaoVidG05ewTVUE,71744
7
7
  sglang/check_env.py,sha256=qDMIG2rCNBH1yKnxQmF-Bp10oiFMUKMgfZLHZYOmdSY,8412
8
8
  sglang/compile_deep_gemm.py,sha256=H118s76CKdpZr-cDeFfBCePe7--c_teEBNVIzchYVSo,6243
9
9
  sglang/global_config.py,sha256=xzLdk8W53fneFblNh8iIjGF9C3-7mnzR1-LleD9Btxg,1495
10
10
  sglang/launch_server.py,sha256=mDXfwha8LHpWQJekcCosR98QhCQsbmilsBlI5jAIgg0,420
11
- sglang/math_utils.py,sha256=QYtbaIA76P33ojcOrL32VR6yXWv-Od_3WCZNO4kQ-YQ,177
12
11
  sglang/profiler.py,sha256=tEHzHerXC-ymk4OrkoUcMbgcGHmb8VESthsNSP2Yx9w,4417
13
12
  sglang/utils.py,sha256=VH6zrnkjzcR3DE__WfVph6wswJ4JuzoQD47VmbZ38eI,16435
14
- sglang/version.py,sha256=E6iPG1WE6yyF-fToZYo4ZM-iwegVLaXOKuEXlAJ_kvg,28
13
+ sglang/version.py,sha256=LdxLMJM_JXsCQBeSvnxCNyGWmINE0yWfna3DQaT41Vs,22
15
14
  sglang/eval/llama3_eval.py,sha256=gWSboDchIGybIce88bJlrCG0yiLZ513mw4gcutJlzGM,10017
16
15
  sglang/eval/loogle_eval.py,sha256=pRPVA4fxGmT3_oXvXnlNE-UlPrcQGLBJF-OSE9YWJXM,4336
17
16
  sglang/lang/chat_template.py,sha256=HKlx7snSWFED8GKF5ex79sQrPWFw5TSXQM0_LsiD9Bc,20552
@@ -31,34 +30,34 @@ sglang/srt/_custom_ops.py,sha256=0lJRMTKTjoxJPh1qQnnMY02Z3SyBDi7LJI34IBLQsgQ,446
31
30
  sglang/srt/aio_rwlock.py,sha256=6LYtOdeTUY3hkfa1dmYkgsaF2ttrwIF3hUWz2AZ2fqw,2970
32
31
  sglang/srt/code_completion_parser.py,sha256=KFa95OU0TeVjJkOqIgS4xV3kaJ5dFWOmAAgISyc1oEc,3803
33
32
  sglang/srt/constants.py,sha256=0i-tEwG2BSYNDy96MxnGHV5HnBELkYcnsVGsE-R18o0,93
34
- sglang/srt/conversation.py,sha256=xkV_OWdotT_Tf1QzpxLL-oZ-THAKKtJj49Q9B_L-WT8,37144
33
+ sglang/srt/conversation.py,sha256=fFP6RxkRolz-YLl55o0juzp0Ov-78j89RCt7Cflzr2Q,38335
35
34
  sglang/srt/custom_op.py,sha256=87r2PIgiGLREsIZQ8qsUD-zgI66_54y9GrE0buXzoCI,3076
36
35
  sglang/srt/debug_utils.py,sha256=slaFOY4BYDBFatkfu8FZlzai-u4LFS-5GUzdr-t50zE,2241
37
- sglang/srt/hf_transformers_utils.py,sha256=S1ZF4aFKTocenXvj9ti6M-buiCBus4FrP1AdwFz_Wbw,11943
36
+ sglang/srt/hf_transformers_utils.py,sha256=1Ku6POAyk1Hb4Q1VcHTE_2EjujVhPerPO9V9NAcHbOI,11997
38
37
  sglang/srt/jinja_template_utils.py,sha256=Jc6Vl-lYtUyMBSWWQGIMpJQ1O-ceU9c8DbOi_bN-oVk,6719
39
- sglang/srt/mm_utils.py,sha256=7o4w1W0VAWgEquVIz7qw7-IxYbZY2g3MrXw9php90oY,12621
40
38
  sglang/srt/model_parallel.py,sha256=eLXZhvJ4wG6dh0FontNCIdVZvHYdWgaeY-5cu7TD9tE,6078
41
39
  sglang/srt/operations.py,sha256=ddQ8KO63L73OciaR8MZ9h2h83gKVY4-WuWgeEGowPJA,5346
42
- sglang/srt/operations_strategy.py,sha256=6DDLEdmkLrFDTXWZoFO0q9MZjEThvfyvoO-LbQsNpPQ,7023
40
+ sglang/srt/operations_strategy.py,sha256=Pwd2sKeRtKh9WJXgzlNr2tU9y6YMcI3MDLbatHqlMws,7145
43
41
  sglang/srt/patch_torch.py,sha256=OUPCGQSQz3MVZB1zZ_Eq8lXiw0uIKJ_HWjqQolI8FsM,3088
44
- sglang/srt/reasoning_parser.py,sha256=vf0kWBM4IXwbuzGBIOMdiXdn9gavqkHb1QIaTbkU7vc,6742
45
- sglang/srt/server_args.py,sha256=MVp3qB7PmJlw82hY8dQPoVsJZ26RpmiBqLDgzq1vjOc,73495
42
+ sglang/srt/reasoning_parser.py,sha256=DkZrFhkJ9qe7w46fTnM9sqhXwTDgZxD4qPdGka-Dly8,7579
43
+ sglang/srt/server_args.py,sha256=Fg1CqO92iiKA5jLd9vqKZ59uwnw0l23DO6KL47kBJgY,75458
46
44
  sglang/srt/torch_memory_saver_adapter.py,sha256=K_eTx0UU84MHSTXI3iqYLdHV4IWtJMJ2FKdGFJR8v1E,2417
47
- sglang/srt/two_batch_overlap.py,sha256=M5Ca3LV4_j7g3o78WQDjWzgsSCpY4E75SIKnwoa7tQg,21922
48
- sglang/srt/utils.py,sha256=Xg7K6VaTFDrEdW8b07AVREPHdx9M4vJuOI3aIct82JM,80640
49
- sglang/srt/warmup.py,sha256=FmJiYfjRr3X_eAe7ojQaPoN17LvHpjDmRWRnO-k86AQ,1469
45
+ sglang/srt/two_batch_overlap.py,sha256=kunhMhCF_ucK4EkthOUEUegd1C9j4aSbpBLYaIKYgas,28447
46
+ sglang/srt/utils.py,sha256=pI-0YtHmQrC2B2Q_uK13qvje1y_ni6TNzqs8W7T3hts,85846
47
+ sglang/srt/warmup.py,sha256=zldxhMlXpclRAJXmfBjJNUJd1eDizVdysibBvQyTVuA,1782
50
48
  sglang/srt/configs/__init__.py,sha256=8EcVRP95epZ49DxBa6LgKWt7eO3Qe7Hrr3V1c6HkMnY,553
51
49
  sglang/srt/configs/chatglm.py,sha256=j-b0YkdYUmQm2y1kNmMJtKeACxWKmBbvNNkDWbs6kbI,2907
52
50
  sglang/srt/configs/dbrx.py,sha256=tdhIkXAQl1yr0MxqFmsDG1E0e2puRTTKm6UTyANBLac,11005
53
51
  sglang/srt/configs/deepseekvl2.py,sha256=X8Q2gm7og_Ylx6tbFXetusfIJIXjWY_YH_p90C67BTI,23397
54
52
  sglang/srt/configs/device_config.py,sha256=kdwFrk5myAURxdp4rSr8ANpBpSJfuBDoT-kuCyuscRs,442
55
53
  sglang/srt/configs/exaone.py,sha256=Duxd4yQoKy8GWEzZD_kCY_OzmN_67CTJL_Kgn0eXk3g,10731
56
- sglang/srt/configs/internvl.py,sha256=NseEdxsLPJNpj5iyDueYw836jZq7-swozC3hAkFnmtI,27401
57
- sglang/srt/configs/janus_pro.py,sha256=Rrb7kQsNaUP-TiZrjNk8Lr1momFrql8ScEunnrH0_xM,19086
54
+ sglang/srt/configs/internvl.py,sha256=Z2kmT-5BzR4EdoLmbsgnK5HBXmpjzKAcaTuHaPYrQHE,27553
55
+ sglang/srt/configs/janus_pro.py,sha256=95qLFQ43n-q5MVEDnh9OBXCUNXOCofwBKYvd7LKPvRI,19097
58
56
  sglang/srt/configs/kimi_vl.py,sha256=4W7VQI3pr888ZsFA2SqCQo4mI0seXTOrGQ-x3oTvWew,1358
59
57
  sglang/srt/configs/kimi_vl_moonvit.py,sha256=hx2Rt4JSFbvy2HUTeLjBpge87m8M6ITAhqsgdNf_Jd4,1163
60
58
  sglang/srt/configs/load_config.py,sha256=qs-AxuplouBx2tsv9KGBOLZPbwzuVA4vbktbGP_cRp8,3309
61
- sglang/srt/configs/model_config.py,sha256=ESZEDSvxVfRH4CiZoy8JVpapJU5yPTYCAxZB38AJ7b0,25245
59
+ sglang/srt/configs/model_config.py,sha256=EzF91fOMu97BxPFSrVU4r-RTuUS3pqoDObKAstnPxGE,26983
60
+ sglang/srt/configs/update_config.py,sha256=2EpDVocEpMv35g1V-iPLSaLjBgylC5vN0yYSlW49k5w,4664
62
61
  sglang/srt/configs/utils.py,sha256=3nHUfisMs_Ltuhv8OZTNCJp63YJKJVF43h1QZB1zqx8,670
63
62
  sglang/srt/connector/__init__.py,sha256=czLX5JOxuMhH-T9eSJzoc1qv1B4z9chyffDRL5I6wo4,1247
64
63
  sglang/srt/connector/base_connector.py,sha256=i6i1TIzsz4NbSEkrdMPq-urb2sN2aLAx8dazga4gB9U,2833
@@ -75,13 +74,13 @@ sglang/srt/constrained/outlines_jump_forward.py,sha256=Gyubp-FVetxd6wP4FA_kD6cCX
75
74
  sglang/srt/constrained/reasoner_grammar_backend.py,sha256=YFxWuOTTo4e6cGhxnaBwuwli6f8FTUJtszib8dBq_8I,3207
76
75
  sglang/srt/constrained/xgrammar_backend.py,sha256=u9Ao-XX22UzALkATEAR_-0EoyBTxMTJV590qd9LAUHM,7906
77
76
  sglang/srt/constrained/triton_ops/bitmask_ops.py,sha256=WjTen9iuuFWLzkE1mAHQZB9_7aIy5QH8Wjf-lB-Fams,4614
78
- sglang/srt/disaggregation/decode.py,sha256=lqpmpQYMXzDCM19R4Pe4RF8q92UvBqKUITauFGDylEs,33335
77
+ sglang/srt/disaggregation/decode.py,sha256=sND6tJTIgxdaqDOem9mAaaMQWZTVxho5sniMOYVkQ7I,33944
79
78
  sglang/srt/disaggregation/decode_schedule_batch_mixin.py,sha256=8UdNaj8KKMLV5Cydhw8gnHM-zRrnKM_AAd3Qc-SRfWg,5648
80
79
  sglang/srt/disaggregation/kv_events.py,sha256=yFbtwOeblcCmOXTjg00TopxnyjkmCBQIVz46KB8jetY,13555
81
80
  sglang/srt/disaggregation/launch_lb.py,sha256=mcbAztN4gnHevw_T5R2_nWsymsDEY9vHkm7OJ1vr6cc,4211
82
81
  sglang/srt/disaggregation/mini_lb.py,sha256=BBeIdeZZxi7Ra5_hukHHX3TNdyfZ4tP1GBUxC-qrv_g,14401
83
- sglang/srt/disaggregation/prefill.py,sha256=jWOqYXBBiNuOC78a028FN6mlklzEki4MjRdTA6UE5zU,23518
84
- sglang/srt/disaggregation/utils.py,sha256=LBiRVbJ4jjYJXn0JL4VMTmGwAMAIGqJ_zaqPLjrmfkU,11339
82
+ sglang/srt/disaggregation/prefill.py,sha256=3u6WCrjogZSqd6yWdBZe1HO4lf6w2e9M7sQtGHyax-Y,23512
83
+ sglang/srt/disaggregation/utils.py,sha256=pKy2MDWqnfHmktc7bJg0hi_x92ellCtfWB-RJSg1jSw,11343
85
84
  sglang/srt/disaggregation/base/__init__.py,sha256=4VwUv0aWxwmVL1049XK82aLTNxmt0WY5RPy9li-wyVk,160
86
85
  sglang/srt/disaggregation/base/conn.py,sha256=CPDAoAkYaFtVPLa1QROfwipSVe7MH6omzIBHzo8TSYk,2811
87
86
  sglang/srt/disaggregation/common/__init__.py,sha256=7yl-EGLMVKRpBUaGF_7lwAsw2J_mqpRZV0238VGxD9o,126
@@ -93,10 +92,10 @@ sglang/srt/disaggregation/mooncake/__init__.py,sha256=0TgqkAdQI1YynbHY6c0QISvVoO
93
92
  sglang/srt/disaggregation/mooncake/conn.py,sha256=MATJkiS_5Vh8fc8Gx6S6cI3zCYDbgKXVEAa1xkUsCKA,58879
94
93
  sglang/srt/disaggregation/mooncake/transfer_engine.py,sha256=JYB9T-EPdJNfv4I_sVpmMOZCOJ14itD97ws6tTvj240,4281
95
94
  sglang/srt/disaggregation/nixl/__init__.py,sha256=qODVPIGWUXKXq4zsRIcMYoAoAeg6nBIN9vdQOlVMANE,136
96
- sglang/srt/disaggregation/nixl/conn.py,sha256=G2l-FuXUvtsEo3Z24vyQ8iTcFjqG-sise4ItAtiny30,20327
95
+ sglang/srt/disaggregation/nixl/conn.py,sha256=cXqWU2Gbi6E2LS0MznEcgFCrwONhYxBtD-zE9DU32z0,20333
97
96
  sglang/srt/distributed/__init__.py,sha256=jFOcyt-wFAPMBUAf9zkZalNQlt-4rqmT6pCKBz1E4qo,149
98
97
  sglang/srt/distributed/communication_op.py,sha256=IBnFUdMftK_VSTMMMitGveonorFUUVNL4guqO31cMSc,1130
99
- sglang/srt/distributed/parallel_state.py,sha256=0_G1TtBOFMYDix5rfuEHYBMpy9A-OuPs9yFd5nCiZ8Q,53927
98
+ sglang/srt/distributed/parallel_state.py,sha256=tZL5PLVowAQvq5xlT573Di63hWKsiqJZbl-auj85wNA,54997
100
99
  sglang/srt/distributed/utils.py,sha256=aaCxATncLGnVgB0WlGpBdee0behKW8Dy_dakqcuKSaQ,8497
101
100
  sglang/srt/distributed/device_communicators/cuda_wrapper.py,sha256=3jvPG-Ow5UBLiXhfx8T8snR7crSZbPpARAggsDPWq7k,7038
102
101
  sglang/srt/distributed/device_communicators/custom_all_reduce.py,sha256=qje-PQ3v8yaV-oYVLPws1mgIlXVsGKFCOvXHmSe8ZXg,19624
@@ -108,12 +107,12 @@ sglang/srt/distributed/device_communicators/pynccl.py,sha256=obXyCaZznZHSt486XCn
108
107
  sglang/srt/distributed/device_communicators/pynccl_wrapper.py,sha256=LblisImY9d6EMz-oPS9J16WHo2Q_SRL1DtlJKK63Hfg,15349
109
108
  sglang/srt/distributed/device_communicators/shm_broadcast.py,sha256=d8mykYmXM1lfbPm8GNtqCF0Un_pdXYjbNmsgoVFyyow,20874
110
109
  sglang/srt/distributed/device_communicators/xpu_communicator.py,sha256=ajW6132BvA6jkeipEIgN27TFycI0U06Ih2Z8WNjlA4s,1593
111
- sglang/srt/entrypoints/EngineBase.py,sha256=FCwqQMJE_8CCCMThAXUZaKafsHvh2BaQ31J-7_ormwA,2310
112
- sglang/srt/entrypoints/engine.py,sha256=uSlN1vorCBCYk8n8AnCpbnCu-4p9JjukLyXJZZzTrGU,30283
113
- sglang/srt/entrypoints/http_server.py,sha256=Fyb3z9OKXF9h_-duhWsHLjZayE3uoZ2dHpeV757bxXc,34745
110
+ sglang/srt/entrypoints/EngineBase.py,sha256=yKN76witT2jz1zhmLHmPNLGMpK2UiOTaKQ2KPD8l99U,2594
111
+ sglang/srt/entrypoints/engine.py,sha256=o6sccP-gdeO6rOY9vbSqVmUNlBrK2YsinrDf42URg5A,31328
112
+ sglang/srt/entrypoints/http_server.py,sha256=7q6TK02vkppIrW_oa_Xxhr-EV3SNaAwAt_pcnLNfC8w,37503
114
113
  sglang/srt/entrypoints/http_server_engine.py,sha256=ncN45ti9mawSOimPSedI6zugfoMhMQOYh4tmdfC9LcE,4936
115
114
  sglang/srt/entrypoints/openai/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
116
- sglang/srt/entrypoints/openai/protocol.py,sha256=QqC3XeJ0RxlFBsPuobjtf6c7iRkEOC8Td4E_GvjKwxM,18759
115
+ sglang/srt/entrypoints/openai/protocol.py,sha256=qIwhokAlAVbp7Nin1eE4TCnUyrAhKcPS47kzHkhzZg4,18799
117
116
  sglang/srt/entrypoints/openai/serving_base.py,sha256=5NJ2S_6B2NFSwn4nLp6eaeJ5iC3IcQzMEY9lW_gPcdA,5246
118
117
  sglang/srt/entrypoints/openai/serving_chat.py,sha256=tWKWjspTpNnuk-Aqfl_S6OmpZe6gz5XxmSGEwfIvCsY,35935
119
118
  sglang/srt/entrypoints/openai/serving_completions.py,sha256=emIutVmnJgOgGRuAqdB80-kVHUfQbE67n1VS-76o4QY,16690
@@ -122,8 +121,17 @@ sglang/srt/entrypoints/openai/serving_rerank.py,sha256=8n6y5kC6UhRpWrDtzH0eIp0dz
122
121
  sglang/srt/entrypoints/openai/serving_score.py,sha256=ebAts-m6Pq-LTgFKwggkywBUrAgUSppHHVEzgwYHUzo,1955
123
122
  sglang/srt/entrypoints/openai/usage_processor.py,sha256=9LTB5rqdRuMKyZrIXiUBuF_WKaSg9X45YdzERDxbtCY,2746
124
123
  sglang/srt/entrypoints/openai/utils.py,sha256=DT9quW0F1DX1P9NAuMxpERgXcNYKKtm7rd7J1m7EaDQ,2112
125
- sglang/srt/eplb_simulator/__init__.py,sha256=HIZaXqsvsOCMMJ81dSs1afSGZ5G6OiOZEtHpltyzzjY,21
126
- sglang/srt/eplb_simulator/reader.py,sha256=R9wV7PqaCjILSnfYk90hNY95iJeST08a55Uj2Qk4iE0,1832
124
+ sglang/srt/eplb/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
125
+ sglang/srt/eplb/eplb_manager.py,sha256=Wt7w4L5g1BSsXx1mqoGo8WjkB55f4nGB4KqC3y_ijl8,3394
126
+ sglang/srt/eplb/expert_distribution.py,sha256=N2wcIzQo9nzPpH5jR63RH7iB00XvH4R8OGp-rR_07f4,31332
127
+ sglang/srt/eplb/expert_location.py,sha256=unthN8w37bvxf_4Z1xNi-Gi4SGnZbTBbMpHC1be9QMI,16665
128
+ sglang/srt/eplb/expert_location_dispatch.py,sha256=epq06lcViQXoSL9SIf2urjBDjMTlzql5GwMVFpcOAtI,4144
129
+ sglang/srt/eplb/expert_location_updater.py,sha256=oVIUYzji6BFEd2AgeRcM6kwEqLwwD3_PEEv3EyWIydk,21100
130
+ sglang/srt/eplb/eplb_algorithms/__init__.py,sha256=c6fo4qM8N0p5DyyfGp9fxqc2wkxvzSJBzJFRG1I1leg,1959
131
+ sglang/srt/eplb/eplb_algorithms/deepseek.py,sha256=mMZT7zAAArccdRS0xXxifvMb3qn9enSt426uUTKeiq4,8340
132
+ sglang/srt/eplb/eplb_algorithms/deepseek_vec.py,sha256=Vzy5Iarua1VgVHzjBNZaVV_vt1LY1BLtJz7PmzB701k,10654
133
+ sglang/srt/eplb/eplb_simulator/__init__.py,sha256=HIZaXqsvsOCMMJ81dSs1afSGZ5G6OiOZEtHpltyzzjY,21
134
+ sglang/srt/eplb/eplb_simulator/reader.py,sha256=OlsWqsuXqVQY7PfvvrP-vsl2Ww2Kg4vD_K9BltM_QHo,1828
127
135
  sglang/srt/function_call/base_format_detector.py,sha256=eMSqbx99YPm2m_ChLafFRuLOzXBtA0oJn_Q4FtB3FnM,12950
128
136
  sglang/srt/function_call/core_types.py,sha256=wLUsW8mUA-i-ISz5QUDL7Ejq72W-K1HIhFa9Wm-_oA8,786
129
137
  sglang/srt/function_call/deepseekv3_detector.py,sha256=XudIiIt2Mejokg6qOkX7vYS-3XIFstOBHv-m-Q5fBLQ,8970
@@ -134,33 +142,36 @@ sglang/srt/function_call/mistral_detector.py,sha256=xNuVl2vDXVYbXyiXLkJZ9VM6njcw
134
142
  sglang/srt/function_call/pythonic_detector.py,sha256=rtXSflE4w993a4OqphWG-WQzvwRz0v3dfgHOnte1fpI,8731
135
143
  sglang/srt/function_call/qwen25_detector.py,sha256=9JfZem_5nw91Og2biwq8eIpUQjy_3kFz4TQI8Lc3Vow,4882
136
144
  sglang/srt/function_call/utils.py,sha256=__ImDF2kNyoLWsYO5RYoryvy1mmgEjnjXlCvLv-uLCM,1695
137
- sglang/srt/layers/activation.py,sha256=w8gr84LdpbBxmSjK9cfqFGXiGxALOwkBzqHChdZ6z7M,7327
138
- sglang/srt/layers/communicator.py,sha256=WbefauUNbwfAtaBySi-rqqXkoFZZpxdOJURLBHpF5qA,18597
139
- sglang/srt/layers/dp_attention.py,sha256=e-AgUTa70NsNgsw4hB1a-B_yDv7T8PyXW3jqR8sIKgY,9807
140
- sglang/srt/layers/elementwise.py,sha256=XCrR2i-9dP-H6jQo2zUuquwZrsl_wEQqj5Wxk6WUf7o,13987
141
- sglang/srt/layers/layernorm.py,sha256=x6VDTFxvcJMx2txpBW4Y7G1sWfKYsksNpf-L4_ySSDo,7660
142
- sglang/srt/layers/linear.py,sha256=ToLkotx239ze3rwizk3r05Gg7_LJk39hAdjgqWwYusE,52462
143
- sglang/srt/layers/logits_processor.py,sha256=TTR7LgSwthaH6Qfmcda2Ampibtt-JcwpLSs6-OJI_sQ,25604
145
+ sglang/srt/layers/activation.py,sha256=UDrJcnQoIOJjMzZ9XAy5JlEJ-do44tGMtcitY7I8kPQ,7327
146
+ sglang/srt/layers/amx_utils.py,sha256=1mENgHK2B8mgaD1oMtgbZ15Jmy_Uu1QueBmo09Ff2iA,2865
147
+ sglang/srt/layers/communicator.py,sha256=_aq6rDgDlRRVXO1EquSNtmMADuQJGdRZkbt0vCxTxqo,19314
148
+ sglang/srt/layers/dp_attention.py,sha256=V7m_PfvHHtRMJMviIqmoyqf5VFFJLYYcynDuI5dXtAU,10275
149
+ sglang/srt/layers/elementwise.py,sha256=MyQUflyKEfPZ-BggW1Kd4hB53RFD6FXGc2S5LXjx_do,16026
150
+ sglang/srt/layers/flashinfer_comm_fusion.py,sha256=IwI3VPHVZaWTgf_rsSH_5QROTcmoWnjlZ9annh7cYRs,5888
151
+ sglang/srt/layers/layernorm.py,sha256=4KGaB4QSO5hBcr26TtPfspD3XZwr5X55Pkn5xN9eJrQ,8647
152
+ sglang/srt/layers/linear.py,sha256=cxth3pvLGdud-ZoHrGFhrPeuhLnBX4IWohyBr2gCCv0,54890
153
+ sglang/srt/layers/logits_processor.py,sha256=tOPMYopEQuoLBzwbjSmU9OWFYh2mmy3ViJSbA_wpFOU,25619
144
154
  sglang/srt/layers/multimodal.py,sha256=YVR69WW-2aGDcZHT8IVJ6F_LRM7wraZr8VjrPDXqDmA,2104
145
- sglang/srt/layers/parameter.py,sha256=zqWyEzpWzP4NNTjq3G9khq6XofgpcmJqQLg6Vd4WyWE,15084
155
+ sglang/srt/layers/parameter.py,sha256=hu1l8Yzd38xQfkRaIOE1ouzxjG6Ro84pt6SfoUB61qU,16936
146
156
  sglang/srt/layers/pooler.py,sha256=uZ6WX1FLMEafZwusyZdm6KuVlIwSjbKrdwk2qzgqNGk,3812
147
157
  sglang/srt/layers/radix_attention.py,sha256=IlqRB4bk06FOH05_7zB8lik0xLpys7jFooLeCwdO0j8,3437
148
- sglang/srt/layers/rotary_embedding.py,sha256=iOxdJEw9jhxYih7WpNkzlGybzewNu9GgqU8dLM-TyD0,52209
158
+ sglang/srt/layers/rotary_embedding.py,sha256=EhxI0E8jcTWZ2COpnku7crbW8Hew5fe_ujMndj7hKvE,52246
149
159
  sglang/srt/layers/sampler.py,sha256=xNds1migup2s6b9_pS6ljkJUkvNtv7nmTGeIdOzoQ6w,11182
150
160
  sglang/srt/layers/torchao_utils.py,sha256=Ws24FdRBSkTpyeyA6bQrdDm-W5wfDxKvSIPUSahyMfA,4063
151
161
  sglang/srt/layers/utils.py,sha256=IWGg1Hb7c33Z3LHRPVJyUAzp3BnSid23ZWXAmJ_Jvp8,1204
152
- sglang/srt/layers/vocab_parallel_embedding.py,sha256=65N0e4PlOwoTRZC9QpC2G83Crn-OI4rY9wZTRnOVNvg,23166
162
+ sglang/srt/layers/vocab_parallel_embedding.py,sha256=1Av2YHpx-Oa18-33ps0lpkOuUgnY-Y--Yt_I7YcpYBU,23438
153
163
  sglang/srt/layers/attention/aiter_backend.py,sha256=7sEUgViw-xl3yok91yyOD9gTi8lQmME0g0ZiKVTCcyI,32851
164
+ sglang/srt/layers/attention/ascend_backend.py,sha256=jPCsU9_gH1iZNoZHD9nCeDdVdXqBt31LI65N55BTJPg,8250
154
165
  sglang/srt/layers/attention/base_attn_backend.py,sha256=KXVcCguwXh-PSrY9Y2aUrlXXUhWdbVxqVEF2_xIMvm4,3466
155
166
  sglang/srt/layers/attention/cutlass_mla_backend.py,sha256=SIR7sKCCegwzahSz82I3gsDyN5TkKoa4yG4-pBQWBi4,9813
156
167
  sglang/srt/layers/attention/double_sparsity_backend.py,sha256=2ZRL_gYz14idoVqQzeQ6N77nXer0f_8_TUYw40XUUz0,9161
157
- sglang/srt/layers/attention/flashattention_backend.py,sha256=j4rnX5IARna-pZmVnSR9kjf_yINGnkKO6itTLwkx82k,93278
168
+ sglang/srt/layers/attention/flashattention_backend.py,sha256=ovi2rduqany6oalDWI7WAetjyHO5DybKA3epHimm86o,94076
158
169
  sglang/srt/layers/attention/flashinfer_backend.py,sha256=Ug4SkZnuHjBBwPOj2TfLlg0eU_GoZvKjhY4oYRU_qqU,49666
159
170
  sglang/srt/layers/attention/flashinfer_mla_backend.py,sha256=NirRlNFxD0S2EncvvmrerIxNfuTnYpvemZV3MR5_FnU,34040
160
171
  sglang/srt/layers/attention/flashmla_backend.py,sha256=5iSic5ho-lkXNas9mR3uLbXbEl-do31gc8gjR7-a79k,20711
161
172
  sglang/srt/layers/attention/intel_amx_backend.py,sha256=hH9lxXs_o66_IVs58oPhRCOXGUrHbXSz82FKtHr9GO8,4092
162
173
  sglang/srt/layers/attention/merge_state.py,sha256=OnWmNV6LYTUj0y8SCy_IK7A9q6v9bZwR4_XiLOIvbrk,1423
163
- sglang/srt/layers/attention/tbo_backend.py,sha256=xpU8pR_xOwhfWnmAgLL892nb0ujBQWxIbHZAL_d84zI,8175
174
+ sglang/srt/layers/attention/tbo_backend.py,sha256=CBnSDUmDvT-Tbhi9NHNo1LLkgUAcIsWMJgKa-sAIKW8,9318
164
175
  sglang/srt/layers/attention/torch_native_backend.py,sha256=RsI4lYiQJAj-Xy0vKkzbyKOWHAVPOD9b0n0dEehwlos,9496
165
176
  sglang/srt/layers/attention/triton_backend.py,sha256=AryrPc4kzioxkiucPkApMA__0HoQTKOHNpwN0GEgm98,36923
166
177
  sglang/srt/layers/attention/utils.py,sha256=KiRSIHaGBhErUhPWCSD3Uiaqb0pSEF0NJFwTTQXoMks,2887
@@ -174,15 +185,15 @@ sglang/srt/layers/attention/triton_ops/rocm_mla_decode_rope.py,sha256=664WnAJ91E
174
185
  sglang/srt/layers/moe/cutlass_moe.py,sha256=--bNTA2BGbHeULb_XXDoRUyWWbE-doHo5K5k1T0N0WA,14323
175
186
  sglang/srt/layers/moe/cutlass_moe_params.py,sha256=9NRCmgP_Ug3gGqCcpi-x-QRbLjCNpw8792gKXwZsbEU,6522
176
187
  sglang/srt/layers/moe/fused_moe_native.py,sha256=bW3KWxxz9rxKMUQqfmAtF-7ptTODA1pwLydE05ABDJE,5030
177
- sglang/srt/layers/moe/router.py,sha256=5Aeqoix_AS4uymb665OJE904wVSBkQeFdZP4e7KKPvg,10530
178
- sglang/srt/layers/moe/topk.py,sha256=_hIyTURqx6Id1C3NQmHVuPxivMN0ywmDoyhFvtgHIZY,18624
188
+ sglang/srt/layers/moe/router.py,sha256=UrPieRvemN7Ew48gtG7DA2xhNDBRSnZxzugTEBI-0_E,12006
189
+ sglang/srt/layers/moe/topk.py,sha256=DhG8EIqyhn41erCKRwX2wGrYOOF-1VdBrCZwyyc1Ks0,18048
179
190
  sglang/srt/layers/moe/ep_moe/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
180
- sglang/srt/layers/moe/ep_moe/kernels.py,sha256=xdYak2dkrUJjmUigKJ-GbWfdf-tXlUKbvtJgxVekbMA,40130
181
- sglang/srt/layers/moe/ep_moe/layer.py,sha256=U-R2mffzW_snuAxvX1AfN0xgcbt-w9fNFUidd2Hi4eQ,55783
182
- sglang/srt/layers/moe/ep_moe/token_dispatcher.py,sha256=IR5RtdL9aIG04QaeySsq4Oy-S8obivBBZKbFfPCGpXc,24077
191
+ sglang/srt/layers/moe/ep_moe/kernels.py,sha256=bHn50WQ9K57wLxLWZ8ytNJrCi7bAQ6MegN2o7qxB_Mc,40690
192
+ sglang/srt/layers/moe/ep_moe/layer.py,sha256=DjUSrRAiRzvuDRvF3JyTqupL3z7smzwXO9hQpQOK0Io,56658
193
+ sglang/srt/layers/moe/ep_moe/token_dispatcher.py,sha256=aiBE3mjvWV3eBrFGH9J44tuJncQwOjRS_XeyBNCEtqM,24379
183
194
  sglang/srt/layers/moe/fused_moe_triton/__init__.py,sha256=h9yMFAL_bagUf-qBED8gSWdCOb7d8IdA-pE-L_nIg8E,842
184
- sglang/srt/layers/moe/fused_moe_triton/fused_moe.py,sha256=gM_nctg15Wc06pxiMq0IRE0QBCfNyebSsWwm5zdM_Uk,63225
185
- sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=AAEb9pvd3bxiuvIKV2FZboWNvffccYmhF9R09SQSRlo,32038
195
+ sglang/srt/layers/moe/fused_moe_triton/fused_moe.py,sha256=GQk0WVdPYI1lOsa0ItkiYcGHS_k8r5y7Mfy485MBZl8,63177
196
+ sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=wsNUtzqE2Emi0RAwVzpFHUOVOqUMXr3pCMSJHqkc7EE,34126
186
197
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_1_0/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json",sha256=iNGsE2ZeVnQEnN4A8UJ9Jv0d3hbRF2MJ9oBgjup5Szk,2737
187
198
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_1_0/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB.json",sha256=JJN0hryyLr5Zv3dSS7C8cPFhAwTT6XxUVnBGMZvV6JA,2752
188
199
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_1_0/E=1,N=1792,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json",sha256=ouRyZ5PEMPP2njPftCNhs-1g1y6wueWLmhI7G1SjV1k,4131
@@ -349,26 +360,27 @@ sglang/srt/layers/quantization/__init__.py,sha256=isMl8LINJFMzEse4r2Ta_7JXT15eKC
349
360
  sglang/srt/layers/quantization/awq.py,sha256=KemDG55U3B6YZVjMV71awVAIj0islFvtxcUHmOBeGy0,6739
350
361
  sglang/srt/layers/quantization/base_config.py,sha256=jWk_egQrVNMYmQgbTI9vkcgzScLFjB5_sywFlAfE5J0,4776
351
362
  sglang/srt/layers/quantization/blockwise_int8.py,sha256=vWyPZsRLhdKtSmjvlT5fsowBK_nEebYbDAUh2yqseGw,15285
352
- sglang/srt/layers/quantization/fp8.py,sha256=Ne3K177lBdWI8TXyJs8qSaH67KaAv2j4LrZeHyqyH_8,44678
353
- sglang/srt/layers/quantization/fp8_kernel.py,sha256=pUda_glnAprnFIj3VUgCUYMKb2-uK3UOC3yPahgRMBQ,34743
354
- sglang/srt/layers/quantization/fp8_utils.py,sha256=QYHx_OLXFxFCmSMgoKmbJ3Vgl4mVEcXykdnhHO7tU0g,25650
355
- sglang/srt/layers/quantization/gptq.py,sha256=d1frUjvXmZfQKkcMQY5t0BA4sXWHE9Jze24qxniptJE,26719
363
+ sglang/srt/layers/quantization/fp8.py,sha256=fPzEIAYqiSgVjVTu6_CceyW-kemzSRGS_Q-FZ0eGAD0,46375
364
+ sglang/srt/layers/quantization/fp8_kernel.py,sha256=vziHnk-gVbeY3z94216UDCU5kyev36ZrKldMgglSmpw,34718
365
+ sglang/srt/layers/quantization/fp8_utils.py,sha256=fsX1x17RwcK88N1WpF-YELQOpkpHvJnoLriZj27H2R8,25611
366
+ sglang/srt/layers/quantization/gptq.py,sha256=B0J14a-OANM2uglnatukFMlvpDnUprV3-p_l4308WUQ,26838
356
367
  sglang/srt/layers/quantization/int8_kernel.py,sha256=GfRC9FOn9exNvK4QHbUeBj3Hhv32VcyGphapFPt5b84,12625
357
368
  sglang/srt/layers/quantization/int8_utils.py,sha256=YK9CS-lb_n91kNCTKK5o5apYF31V2giDg5G5VKrpcUA,2356
358
369
  sglang/srt/layers/quantization/kv_cache.py,sha256=_9pF5rwvB7ta6Gdc5YKVVGbNzYwqmhIx4TrX1-xnodQ,3261
359
370
  sglang/srt/layers/quantization/modelopt_quant.py,sha256=wW90ZS1ZrGOXf7l5svudmXqAi3JE2SkCV-fwqWeYfdg,30905
360
- sglang/srt/layers/quantization/moe_wna16.py,sha256=PBgcQULe9oD2i96BeJRZtIdIUkWzS0IWU9ev3C-h7mw,19646
371
+ sglang/srt/layers/quantization/moe_wna16.py,sha256=9w3TYF1aQ0N0zNBgcuyOX-z-zfq4it2ul_MjKk_fPCA,19680
361
372
  sglang/srt/layers/quantization/qoq.py,sha256=adhsCixRUTh1m8sfpRWNhh5oX3I1WJli3Elg8uexP6A,8222
373
+ sglang/srt/layers/quantization/quant_utils.py,sha256=kBibCBK9DCambuPy2atB82Bmalb-Vs_wbQoVHT7h2Lw,5089
362
374
  sglang/srt/layers/quantization/utils.py,sha256=qHdWbLQD8teKhv2tOcuyGegpFonXygoJHwCAD7Ur5MA,5439
363
375
  sglang/srt/layers/quantization/w8a8_fp8.py,sha256=ZB6ydquyPOORDe9OCoEBRH6dsQhCeRWv1YIgm8UDQwQ,11622
364
- sglang/srt/layers/quantization/w8a8_int8.py,sha256=_BG6Zo4tis0UGZ47EVfBmfpOxRKzXvd3EM15qDWy7OM,9147
376
+ sglang/srt/layers/quantization/w8a8_int8.py,sha256=aPMm-sk5nBpHwHzkedvuAWXiqWpp_NPyVaPHxHnuhVg,10847
365
377
  sglang/srt/layers/quantization/compressed_tensors/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
366
378
  sglang/srt/layers/quantization/compressed_tensors/compressed_tensors.py,sha256=EaOKuIA0zXwqmH_eVhWeNdGJT9d1d9gVvFyYkgpdjDg,25665
367
379
  sglang/srt/layers/quantization/compressed_tensors/compressed_tensors_moe.py,sha256=w19mhCnOre3j6L2-Tc_sRtBPgwBOAKV4QmYLpzyU_Fk,26637
368
380
  sglang/srt/layers/quantization/compressed_tensors/utils.py,sha256=mnUmKWFQUnY8bVoFHUuNVwqsfS-cefeR-ofyaihCXcY,7621
369
381
  sglang/srt/layers/quantization/compressed_tensors/schemes/__init__.py,sha256=HWMTnmrj-mUCRXgcOwnnXLrvrAE-ONdPTSzSImjHCMA,347
370
382
  sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_scheme.py,sha256=tdKJC8c3SX8T3z8JL-1YCsg4ftcv55Wxt0vZrYftpX8,1635
371
- sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a16_fp8.py,sha256=-iq634sU38yWFA-h3w-B4kTALeXMo7uRZQI6CckMZTo,5494
383
+ sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a16_fp8.py,sha256=VvqVpAr66AlS5IPVuIR5Nu0ESH0oAoKo545jNart6lI,5493
372
384
  sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a8_fp8.py,sha256=SkeQYXW5i6M3ZLp867KFwQXVBcIPAcdYFILUTY0A850,5934
373
385
  "sglang/srt/layers/quantization/configs/N=1536,K=1536,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a8,block_shape=[128, 128].json",sha256=RdHQxWXwXqvio31192vsLaKjEr4f_DjpMPKlarY1IAk,3251
374
386
  "sglang/srt/layers/quantization/configs/N=1536,K=1536,device_name=NVIDIA_A800-SXM4-80GB,dtype=int8_w8a8,block_shape=[128, 128].json",sha256=0vLaJgo5B9ti-XMFKJuvSoMGjsZQ-RhHSx4cC8Xji-U,3254
@@ -527,9 +539,9 @@ sglang/srt/layers/quantization/deep_gemm_wrapper/compile_utils.py,sha256=BrzCCxX
527
539
  sglang/srt/layers/quantization/deep_gemm_wrapper/configurer.py,sha256=zkMzBAqQTSwG9TlGPuwmHV1yN0v5Y_5Hgyo0CKQDVNU,741
528
540
  sglang/srt/layers/quantization/deep_gemm_wrapper/entrypoint.py,sha256=On_uvP1ThxgQFAzOWKoteM0vIOHqmtI127A4qbPtmbc,3264
529
541
  sglang/srt/lora/layers.py,sha256=FaTYf0w3zbKKKAT1nJdAzGRtxvySB6FpNKXvEi5RHH0,12958
530
- sglang/srt/lora/lora.py,sha256=WY3cISWrQ5Ye3YcNKJUwAWRImzlpLQva2fGepg6P5EY,9744
542
+ sglang/srt/lora/lora.py,sha256=v4mkNOypfPXLW1mv_uKj2M-kR-CnzSmu0GReKafGSrc,9667
531
543
  sglang/srt/lora/lora_config.py,sha256=qDgMTx_69jyJUl29O5FxLzYa0BMhqYVXWXfyyVOvGm0,1684
532
- sglang/srt/lora/lora_manager.py,sha256=pXQuS30X1KaqzDk1bD6Cb-cClcGopJcoNvGpXMshe54,18316
544
+ sglang/srt/lora/lora_manager.py,sha256=sdfSP0o3u4sMlzaVO1N7xhprfydFG-VSutmtOFlu-cE,20060
533
545
  sglang/srt/lora/mem_pool.py,sha256=M4l4RO4tRjii5T4fq89nUoKJNHusaQHwvLrkryBCb1U,10132
534
546
  sglang/srt/lora/utils.py,sha256=f3eySsA2tqlzMkvqwtRPWKIRjDiMk6ZFh9CJfUYdeqI,5486
535
547
  sglang/srt/lora/backend/base_backend.py,sha256=EIz8I-GIrdmK4fISw3ENhbJVVITaxKfyLxHXGPU4fPs,5044
@@ -541,64 +553,41 @@ sglang/srt/lora/triton_ops/qkv_lora_b.py,sha256=qCpJAksCSXS3Znm-ABx1QfrdNqj9hrP6
541
553
  sglang/srt/lora/triton_ops/sgemm_lora_a.py,sha256=yNBgl8jS76DPlGJg8puRkSnKkewf2_2oKfVZZRq4lYY,4351
542
554
  sglang/srt/lora/triton_ops/sgemm_lora_b.py,sha256=EoF9HymgQ1V9DwyOJOvbw1hCbEjprVOne_fC4VHgj-s,4518
543
555
  sglang/srt/managers/cache_controller.py,sha256=K00t5dSZU6gbAMHZWhNyj0ndgHISvelTl7UMI5KqBuE,19352
544
- sglang/srt/managers/configure_logging.py,sha256=fOJaXAQ1n9m-8KPJndpsKvS885i69SMafoEADLIVfIM,1633
556
+ sglang/srt/managers/configure_logging.py,sha256=8sNXZ2z9pBWOwn-X3wyz013Ob8Nbm1zDxRkxoZjH-l4,1633
545
557
  sglang/srt/managers/data_parallel_controller.py,sha256=PZ-wOcAFn3PQqMB6I2vjIsFmplf0nlNl5hqTDKTHTG8,12112
546
558
  sglang/srt/managers/detokenizer_manager.py,sha256=SpLxTsSPKBZfD-ZMhJ5zpPPGuUb8PmcYgFSL9CsurU4,10696
547
- sglang/srt/managers/eplb_manager.py,sha256=YaxnvD1-wMV7BhtF9AxoNRVsJUdlQzFF7N-JDP43ojE,3411
548
- sglang/srt/managers/expert_distribution.py,sha256=TzOSO7xFJ1VaxvbC2wqHq4l8UtWLX8K0rBmu5g_V2rU,31562
549
- sglang/srt/managers/expert_location.py,sha256=ZSsH17k5bAgbE1wuvpGaHGueiyhfPrgQakBFPu9jswo,16669
550
- sglang/srt/managers/expert_location_dispatch.py,sha256=U6-XLZ77RK0oy_JUVug2q-2LJjwoYX-js0_zhBNMXuM,4148
551
- sglang/srt/managers/io_struct.py,sha256=gyP8JGyX4DSPYs4_0LIKUs4fj7tonrDhnreiSajgric,34022
552
- sglang/srt/managers/mm_utils.py,sha256=mA9W4xZBnXfs-4ZeALvhdpGAYxrJGfOxBWyoHVrt44Q,26518
553
- sglang/srt/managers/multimodal_processor.py,sha256=XlRYvNhF6XOssreRX9DZPhLSpps_VE62gSKw3EGdNPo,2088
554
- sglang/srt/managers/schedule_batch.py,sha256=_Bt9hGWtiY3Dy0_GNijQVB9TT1b1V2xFOYK_M2aRvuo,73146
559
+ sglang/srt/managers/io_struct.py,sha256=DQ2zg8InwXHgOa06n47rbwTzR5mYkj4OGQe5rZ0T77k,35137
560
+ sglang/srt/managers/mm_utils.py,sha256=px_pMotzBLhuqw-mLXXzf8N1DthhDn9ILsIVIzW9y74,26582
561
+ sglang/srt/managers/multimodal_processor.py,sha256=mzCrN-8H0bE0iMO8UzxmYmhE2M1qsbVJXGdhAYcjjYA,2016
562
+ sglang/srt/managers/schedule_batch.py,sha256=3NF590tt4TJ99svwdrlsrFiICH_8X2DpSOj1ebEUSC8,73119
555
563
  sglang/srt/managers/schedule_policy.py,sha256=0T8URzQmLvEmG-42-SFBBl9WnsOSwYO8-_CcBpuD38M,20474
556
- sglang/srt/managers/scheduler.py,sha256=nejUktfqa3Qwf6TrN4CUVTYLELNwfUGFpExw-a8WFFw,110046
557
- sglang/srt/managers/scheduler_output_processor_mixin.py,sha256=aaj0z1PD3fGIOPoTtWwqoKsii0yQCR7txVFXMPECveQ,29879
558
- sglang/srt/managers/session_controller.py,sha256=Lh1kruMcKqR7WVWYJRZbYgowtsssVlP7_paIVXLLIcE,5756
564
+ sglang/srt/managers/scheduler.py,sha256=ZC49CVTsVlDh77QCq5UPhy04NM9FV5YHXuMg4M0cwEE,112191
565
+ sglang/srt/managers/scheduler_output_processor_mixin.py,sha256=XAK2aeLleZBaLtzebEKdpaz9E7uKnHV7ywHSk_WPDYo,30148
566
+ sglang/srt/managers/session_controller.py,sha256=dzlMNZlo20FTSl64QqK7y7pElsdCy8ICOWWBPTBVwgs,6040
559
567
  sglang/srt/managers/template_manager.py,sha256=RrwRA2oqId_PMQ98qJQGwIxMroOxiorl2sGC9ARou_0,8543
560
- sglang/srt/managers/tokenizer_manager.py,sha256=zZR4c-jCm0n8LBn_5PT5eSv8Jptt50HM7OQeCvxBVqk,65586
561
- sglang/srt/managers/tp_worker.py,sha256=A010h6fHS4gjsaqymQyAFiqLnZGUZiTi9rHIr3blmk0,10436
562
- sglang/srt/managers/tp_worker_overlap_thread.py,sha256=jB9W7qSXKKnBrTep1yNKrYgLlylJvL-ab2Sa1ki6f0s,10349
568
+ sglang/srt/managers/tokenizer_manager.py,sha256=I2M8Hpj9T120rJYP5Hdu6cV72oPmsoRr829LiT7O4Dk,73655
569
+ sglang/srt/managers/tp_worker.py,sha256=kyk2EVd3eP0gpgVETJ6J_BdxIDbiB76AfpN4_-Xqkrs,10896
570
+ sglang/srt/managers/tp_worker_overlap_thread.py,sha256=EFbtichmZjMoBgRa0AMIGdKGur1i8bpd3JvaDi-SsK8,10663
563
571
  sglang/srt/managers/utils.py,sha256=9_VGE48EK0PXVJ26aYvbRJ6n7gIZALvCcf6uZCccCgM,1369
564
- sglang/srt/managers/eplb_algorithms/__init__.py,sha256=wVUv2ZhhC-_VbLaStpk3vulzhqExwfHGZJQqoohs-Fw,1963
565
- sglang/srt/managers/eplb_algorithms/deepseek.py,sha256=mMZT7zAAArccdRS0xXxifvMb3qn9enSt426uUTKeiq4,8340
566
- sglang/srt/managers/eplb_algorithms/deepseek_vec.py,sha256=Vzy5Iarua1VgVHzjBNZaVV_vt1LY1BLtJz7PmzB701k,10654
567
- sglang/srt/managers/multimodal_processors/base_processor.py,sha256=1fl0eW24ju9FiKflieYEo2mooYFayWGVtamxhAtcWJM,23348
568
- sglang/srt/managers/multimodal_processors/clip.py,sha256=lRc2mcuDbAhZVf-0EfkO81pqDiol9zLvTpDqtPIBQ2k,1525
569
- sglang/srt/managers/multimodal_processors/deepseek_vl_v2.py,sha256=CMfhhdq7u6GzT8ZENo7ByClvQEx-HKaTGVgdYM1vMNw,3460
570
- sglang/srt/managers/multimodal_processors/gemma3.py,sha256=oBHXlbwto_84ZkjkW2A7F3Z7kNuDf039uDH4HVXKE1s,2290
571
- sglang/srt/managers/multimodal_processors/gemma3n.py,sha256=UjAHeX4a2ZyPccCV_O9isxm61J-w5dglfhYO2IUQkyo,3578
572
- sglang/srt/managers/multimodal_processors/internvl.py,sha256=ASv3MQ0Ju6oZG7UceS5ziy4rL2d8Xf1_LbIFmEAuz2E,9512
573
- sglang/srt/managers/multimodal_processors/janus_pro.py,sha256=nSZYKLoCZtv7sQIM21KCt4jpnzVfcsF84m9CFPWwR7s,2058
574
- sglang/srt/managers/multimodal_processors/kimi_vl.py,sha256=8DER6QFDrmD0sZMjlAffY4z3jtBrrIYoU8ogpZIKNio,1868
575
- sglang/srt/managers/multimodal_processors/llava.py,sha256=90D2A09EHgdWwapVSeLg5J4YsioeT2AvGmJkepZA-5I,8100
576
- sglang/srt/managers/multimodal_processors/minicpm.py,sha256=y-1UHmXq2bmDtTax2b-rJf-CI478MMpoz9nY3b-OKzI,5561
577
- sglang/srt/managers/multimodal_processors/mlama.py,sha256=MLiGS606LzVtdoXvjWGANx-K_7nE9J_fMVmkXN7Gz8k,1661
578
- sglang/srt/managers/multimodal_processors/mllama4.py,sha256=IAu09ZPMAHxZKsfGiKjZU_Fruj4AmKA0poqXC0zufWQ,5813
579
- sglang/srt/managers/multimodal_processors/phi4mm.py,sha256=-yTlt2kQkrgks2IzaRKmEj-7siAvTDhZHDR_J3NVFdw,2610
580
- sglang/srt/managers/multimodal_processors/pixtral.py,sha256=uQJYbxhafNCmg0xP52FdElnkUatAyintER1XNuKz3b8,4195
581
- sglang/srt/managers/multimodal_processors/qwen_vl.py,sha256=RLv8sBuKhAjeaVqrFR7hwEEw7fX1WOMZ6r2R4gFeV04,7025
582
- sglang/srt/managers/multimodal_processors/vila.py,sha256=AeQlhdIKKoN0lre8_zYQ7YpGu7I_rux1bRLt70sPKJ0,2594
583
- sglang/srt/mem_cache/allocator.py,sha256=gujYY5DFYQIz8VDAUOjATKtxUMpdRo6xkBunPF08SG4,12526
572
+ sglang/srt/managers/multimodal_processors/qwen_audio.py,sha256=vUkXsa_Ipe_EjWPWDSSUrbm8v-fDenEy3w3fpHwaf2g,3170
573
+ sglang/srt/mem_cache/allocator.py,sha256=MJUPQt4ECj4ReGeUVGVUNfwrwjHBbf3youdkyp3jCGQ,21633
584
574
  sglang/srt/mem_cache/base_prefix_cache.py,sha256=XHSzXKgBin-m1HsL47K-GobhLnajaGxqLqGtrLsWaZ0,2540
585
- sglang/srt/mem_cache/chunk_cache.py,sha256=580NlAzr9Pm4yjvX5S_QP9ify998oOEPQuMpRye7uW8,2005
575
+ sglang/srt/mem_cache/chunk_cache.py,sha256=MWo4DwRkHKOLKyow53YrGQdvn2dI7hVJuf2Gf-SPAr0,3110
586
576
  sglang/srt/mem_cache/flush_cache.py,sha256=GYcxmNXh4hsMpFfNOuCTpKilW7guZwTtAg_usVeM3J0,979
587
577
  sglang/srt/mem_cache/hiradix_cache.py,sha256=Z_XgbLBxI8SN7kgsi1R6iX6AfgDUF5-ynVnBVRF7KUw,17061
588
- sglang/srt/mem_cache/memory_pool.py,sha256=yLYDZ7-rLQi-nkhC_KuT4YmxnEOqM6Rq-j4_HAPehh4,27583
578
+ sglang/srt/mem_cache/memory_pool.py,sha256=soOE9l5qZlWHFbqIHwSEW4l7NQXzmEjpJKk1rfehQZc,37055
589
579
  sglang/srt/mem_cache/memory_pool_host.py,sha256=9N34Y7P0aM2xkmhsEw2_W8xN897h-HEwzRPIu1REwac,13186
590
- sglang/srt/mem_cache/multimodal_cache.py,sha256=Q-lYcI-3HoLu0WJhE2F_An8g9mkZ8LwMrYnQ4383Rf0,1266
580
+ sglang/srt/mem_cache/multimodal_cache.py,sha256=wZl2KeEl3xeoEsYdH33UoM-FO8kqfLo_XUgereJVvoM,1348
591
581
  sglang/srt/mem_cache/radix_cache.py,sha256=ojr9_bUwnPocmpbGZXz8JKac4dS-PrfNYk8UqF4Gvi8,17936
592
582
  sglang/srt/metrics/collector.py,sha256=C9QEJDOEdOPBwy2IJwFS3R6VbGzVzGs2xakKCCPvQDk,19903
593
583
  sglang/srt/metrics/func_timer.py,sha256=VFyNRrbnKVCwnQsrlLin1lITJfjQpf9m8sGPqL5LIsQ,3438
594
- sglang/srt/model_executor/cuda_graph_runner.py,sha256=MyZg9hw1dGcjIE5canm5TplUhFptIXt9FIKpDgXWjTQ,30450
595
- sglang/srt/model_executor/expert_location_updater.py,sha256=HWLY5lJAWefy2tobWJKlHs3qlBSCS57EwSMdfUuPFc4,20585
596
- sglang/srt/model_executor/forward_batch_info.py,sha256=ueHsjmGm52YqVK-8f-TRYpERCCdeSBuc2yaqxD9pWkQ,29268
597
- sglang/srt/model_executor/model_runner.py,sha256=9EIHTDKRtXNrzURQYcC_rBjjWUPGnKHKYCV_GiW70zM,54490
584
+ sglang/srt/model_executor/cuda_graph_runner.py,sha256=3pc1_TpGmUAI51SxVubGGZIRuBmZrj8kOuch970RN2A,30505
585
+ sglang/srt/model_executor/forward_batch_info.py,sha256=uzWEXYdVJie1xLikH6pmOnT64BDnZvJvfK7gCHH82x4,29572
586
+ sglang/srt/model_executor/model_runner.py,sha256=kfFWWHMXJ6X9WEQgEj618mx8zIc9qvhXC5-K2ICDPJM,65709
598
587
  sglang/srt/model_loader/__init__.py,sha256=zGZkOBz1zx-pkaIy47BasL3fjDlAcxAXUTjInOhXHAE,919
599
- sglang/srt/model_loader/loader.py,sha256=-Pr8-YMaF3jIGXfhnEMM1WOloeWcPQnaUgSgWN6aAGI,57626
588
+ sglang/srt/model_loader/loader.py,sha256=oHIX6qiGfXDQWzP6NuPQfc_haFsWykbcVTKEGUwC_t0,59164
600
589
  sglang/srt/model_loader/utils.py,sha256=zSZBPA9ErPmkf-HfCxJjhmiFwYueB15KUg7NFspLvPY,4454
601
- sglang/srt/model_loader/weight_utils.py,sha256=jkd4R6wroef5A3xpVe6rst5xosVitxndnNwH6cMp_zo,35668
590
+ sglang/srt/model_loader/weight_utils.py,sha256=dfepjK1lhcFoxX6Vflb3imiHaj9_Tep_uZ7j3lfN9jE,38004
602
591
  sglang/srt/models/baichuan.py,sha256=HbvlErnkCSK4pRQYCSDxMcrn-1DQyfiNoeDcnRrJas8,15807
603
592
  sglang/srt/models/bert.py,sha256=ODJe8YfNRP-hHsomFWk4_QpcuiSsNfjzGf256EDS0Pc,15802
604
593
  sglang/srt/models/chatglm.py,sha256=cajLN9caBl09e0TwOFkiTTKDqwlbmHo_yS-NCjdeQW8,13957
@@ -607,95 +596,113 @@ sglang/srt/models/commandr.py,sha256=5Y_b3K0QY7D37nFGkyiGgY38RleRui_GJUYcHSuHUZo
607
596
  sglang/srt/models/dbrx.py,sha256=4pn_fdoATg01VEqNnIAxNEsKV5XU7gwHyd289eydq1s,15598
608
597
  sglang/srt/models/deepseek.py,sha256=ZnN02HdgXCB23Vno5V9UMUoOxH5HC82vNTwsVulUJ-o,17206
609
598
  sglang/srt/models/deepseek_janus_pro.py,sha256=OeeI7vZbE4HGpxa8CwT6-Lbfs7J7WMQ3oBNpVJQpv3w,70450
610
- sglang/srt/models/deepseek_nextn.py,sha256=FMeM-5oaUWhonnP7tP8oGvFympGoRkv8h9AfFocI-T4,5941
611
- sglang/srt/models/deepseek_v2.py,sha256=KvRQntryvAu9IEY8OHrLhqIGND3qC-EKM5dr5sYhIXA,95084
612
- sglang/srt/models/deepseek_vl2.py,sha256=j8BdxZsMjm6lPdbDipEIKhVIVywCP1Vl1Kl46BZ5_0Y,13147
599
+ sglang/srt/models/deepseek_nextn.py,sha256=47fehxRdiOizr0rdLg5f1fzQEx6gGAOcDcWKtblloyk,5928
600
+ sglang/srt/models/deepseek_v2.py,sha256=L0ewZPnxM6xCCB8tJxswwNKAjE-q_SCloJfZx8Y8LoU,100660
601
+ sglang/srt/models/deepseek_vl2.py,sha256=F-nf2qRiiZNg9js__rYFEc9fNs_HVEfAi_Mh1jvqwkQ,13095
613
602
  sglang/srt/models/exaone.py,sha256=TpO-rtCpEZ8Ua7hGFnS8l2oAYhY0Pij50grc9WQ2mvc,13576
614
603
  sglang/srt/models/gemma.py,sha256=4cdrPISg1VKnsuI-QPTpYvet4BrX8BMKvCIN82iLskw,12641
615
604
  sglang/srt/models/gemma2.py,sha256=kqtwdo93GWKm2iBN29RoIRH2ggRm-K_80LM5btgfBLo,16395
616
605
  sglang/srt/models/gemma2_reward.py,sha256=V8U3_ADUHWPdOwvEe1jhGW-oJmBgL8t1TY3-67Ksv2A,2618
617
- sglang/srt/models/gemma3_causal.py,sha256=Vm605KeF7CBXbtxzOWF-v0TLbl0G12CLF-bEgTV9T0E,25197
606
+ sglang/srt/models/gemma3_causal.py,sha256=CJ2g08Ec7IeoObQIiGH0WIEtYOl05SbJ2g_pfJwSyBs,25130
618
607
  sglang/srt/models/gemma3_mm.py,sha256=b9YmkipsfVb5IXVeIVwW_PviXiCkRULhEsqNOvPoDxU,17221
619
608
  sglang/srt/models/gemma3n_audio.py,sha256=isgKfjA5UieYawxU6medL2ssXlzYPqAbagDBnLcemC0,36405
620
- sglang/srt/models/gemma3n_causal.py,sha256=nPGjcEOoLP-dhl7l94CB0XSC0g33ljFuIT_QeXb4BBE,36271
621
- sglang/srt/models/gemma3n_mm.py,sha256=jFNhWCdPd4eChD0OlfSVtJfuufJr6qTj04c-oEXorQo,19273
609
+ sglang/srt/models/gemma3n_causal.py,sha256=kBDlpSWAg6ZDmUPe08Q7sj5CbdVD_0h07zwJw8sKu7I,36335
610
+ sglang/srt/models/gemma3n_mm.py,sha256=nCCnVbGvkYit6UXljZWRAQagGeSe0Ej9YnH0DbEaN8Q,18689
622
611
  sglang/srt/models/glm4.py,sha256=2VQzUqFkQTy_2nfkxP9SF6_9kKLTZUExGRjge7r99Es,11265
623
612
  sglang/srt/models/gpt2.py,sha256=kclhxEs8oJk1KCyhmAqo7rZqecVGGHYkc-a1WZi3aIk,9841
624
613
  sglang/srt/models/gpt_bigcode.py,sha256=1D6bi8Zu760gCRZkvdLHFcg8kCkY35ARwQYaMDtYhl4,10307
625
614
  sglang/srt/models/granite.py,sha256=5WOJyNYAlt5RNHSexNfPNihhSxIMd7wPzju1cTixKig,20852
626
615
  sglang/srt/models/grok.py,sha256=vESZeGS4adI_JAerXIkCcTm15-CNiGeS7VHc36C6w1A,28033
627
- sglang/srt/models/hunyuan.py,sha256=dD9kWKTwh1DLa7b-laccQvh2PVVgAHx6487UT8VXhao,28994
616
+ sglang/srt/models/hunyuan.py,sha256=YRx9Zafs8HVTNHxlMMKdbV3ELMn6rWi9GKlk94U_R7E,28990
628
617
  sglang/srt/models/idefics2.py,sha256=U3khd3hbdawJeRNXsxmaKHdssOCT5TPOZ1D-2_zHoQo,12079
629
618
  sglang/srt/models/internlm2.py,sha256=F_iNY1gUqzAjAuUatcE47gnrcoTh5_08PY2Rw9tKr9M,13150
630
619
  sglang/srt/models/internlm2_reward.py,sha256=ndfGmyqYZbVZ7C7rJ-v9oK3wa-EpoBGybS8MlyKZi2E,2522
631
620
  sglang/srt/models/internvl.py,sha256=fZ18eKFYvvtYqoBRXKmS7KlgHMewJSAykADnrf0N3nk,23267
632
- sglang/srt/models/kimi_vl.py,sha256=rMJezfEYaEjOaMZ7vt0rg9ZlbV9p1Ax6-kDsVWzf_bI,12868
621
+ sglang/srt/models/kimi_vl.py,sha256=oFmkPGaCW3QcrExie5o0fqnvk73w6K8zVbaRXw0kV3k,12811
633
622
  sglang/srt/models/kimi_vl_moonvit.py,sha256=M5L7AJOJ2Zh2pqLZAq8aRqhbTSlipr8XOoD3ix6o2sU,23908
634
- sglang/srt/models/llama.py,sha256=qLBfL77XG3pI-UDxg5HLcgJN1tUMeWNj9-AUR4fUVGg,27144
635
- sglang/srt/models/llama4.py,sha256=NwG0mBZQR4B6KVR-Xzp89UQYvVnFMOgkZKVWvtT7Jt4,19454
623
+ sglang/srt/models/llama.py,sha256=xUVXptse-TTTPaZGLPYf8OoL2giczzl9FGiNRjy1CWA,27505
624
+ sglang/srt/models/llama4.py,sha256=nF19fG2ZdT1bUX3pncckwJ9dRMSazNZx647EW__rBRo,18746
636
625
  sglang/srt/models/llama_classification.py,sha256=4QWTFaUZIFKYZvEzs8bx8VkOZNIwdYCLrnwrdAw4QK0,3108
637
626
  sglang/srt/models/llama_eagle.py,sha256=Ubh_jmtfiOnriwvHgQT0ZGID7JvYvdSi_QGHOIkEgPE,5028
638
- sglang/srt/models/llama_eagle3.py,sha256=KCvUrWn17t7T28G60HwMyy99iB9AbdbPnS2el9n3r6o,6804
627
+ sglang/srt/models/llama_eagle3.py,sha256=715soylDE3kOMWskbPy_70BFxaSc5ptaHCS1v3-ViA0,8579
639
628
  sglang/srt/models/llama_embedding.py,sha256=zq-_lNu35VBFc7eemiam0zdkGIE8fzrgk5OWYfirZnA,3254
640
629
  sglang/srt/models/llama_reward.py,sha256=LF2nqMV5XOrljGjAwJg43mBv3z6Q040I2EYlgZeCp8k,4681
641
- sglang/srt/models/llava.py,sha256=m0-qcEWEUyN7kIiCYJAZTi58MwL4ioqCAD99PSTpsuY,37496
630
+ sglang/srt/models/llava.py,sha256=r0nHLVRI7AcFEhruqdRXTLWeQ-Cx3uty9wIkHh3TxZs,37507
642
631
  sglang/srt/models/llavavid.py,sha256=q0lHlRnoYHKJZsWnkIQdd6dYAQ26t7XsmrqA0zDGmZc,12829
643
632
  sglang/srt/models/mimo.py,sha256=Mp-iFp4YHuiuq-H8enUF5K5QbMnVcvEa6mURH6vM3yM,6140
644
633
  sglang/srt/models/mimo_mtp.py,sha256=jSmqJAXu7G3OO7jW1oa2suI4H_Yl7u5ZT7w4lHFbHhg,7292
645
634
  sglang/srt/models/minicpm.py,sha256=m5HFsSJj0Po09LY9R6qj6K4gceqWDMOePz3NDGgMGT4,14691
646
635
  sglang/srt/models/minicpm3.py,sha256=6-gfHSfXwyB5zw7AIj-c5TzjpEKR6CM0H67MrD8LVUE,19347
647
- sglang/srt/models/minicpmo.py,sha256=IBMFTmak4qokNl8zBXHLYfS5slPf88ECwox6CKHbiAU,76081
636
+ sglang/srt/models/minicpmo.py,sha256=CwcogzxwTRAInBynhP3z_YAFVq4DC_YN3gG_95C6MQ8,76034
648
637
  sglang/srt/models/minicpmv.py,sha256=7YYWwk4LX0Z7lZegnsldctb-a9zGGgJUdjFeGo-oLv4,30426
649
- sglang/srt/models/mistral.py,sha256=z7q5NBVbQcboQTIwhULtsLpFvNferaIv49EzOXVgh7g,3487
638
+ sglang/srt/models/mistral.py,sha256=Ox07RJpTYl-4Pb25UIghL_66o9TTA6lPmsUyent_Flc,3480
650
639
  sglang/srt/models/mixtral.py,sha256=n-Pz7fyWE4m6Uh7sjzAYKNr5Wy4QUj5Yekl0qiCwQI8,17055
651
640
  sglang/srt/models/mixtral_quant.py,sha256=-kQw9r8KcLdO8SNN9RKXzrGq9Q2Al9l9cWHi1VrZSRM,15260
652
641
  sglang/srt/models/mllama.py,sha256=pkS0UWiqKJHRsFtSZzpSI9O6B5_j1OtI5pf_nyDPp3U,39707
653
- sglang/srt/models/mllama4.py,sha256=ejuhIVX0MDojdB5EPR-V-Qd_E9st8KYjnjyeArFbdFs,9084
642
+ sglang/srt/models/mllama4.py,sha256=4E7qGicVuTKAs3vHF2SnoNlQP1mm2eBrsLU7QK3x9ow,10519
654
643
  sglang/srt/models/olmo.py,sha256=7-q_fA6XXdG7kPUjpUzYkzMUWJobuSjhqjYw9xSUs_c,12671
655
644
  sglang/srt/models/olmo2.py,sha256=azmljhJF4ivcQfUtfsAUxq3ducE4tRKTL6iwe0IKYMg,14327
656
645
  sglang/srt/models/olmoe.py,sha256=TMzt-yB891bvA4X50xL0NjNnFYSx9imlA7N1EG8KNK0,15949
657
646
  sglang/srt/models/phi3_small.py,sha256=eJb8aS_3KLObrq3PNkoIyVHaQ6SZTAJe42rbpC54QKg,16012
658
- sglang/srt/models/phi4mm.py,sha256=pX1UYlvT6r8wdEbge-FrXh1CvNA2qQRvsg594uZtcLo,19162
659
- sglang/srt/models/pixtral.py,sha256=Iu7OTvM_nnApk1VjpUb1ucPBU2F1Kov5w6ddYn7gGqE,16983
647
+ sglang/srt/models/phi4mm.py,sha256=rBGRtTLGBJZGYXhvotBjJbAUpbLxsCZahDtrInP_FGM,19064
648
+ sglang/srt/models/pixtral.py,sha256=ZkZrV0mEfmbBdgRko2AvsMFZbAVskgp_5a5p1xCSRN0,16835
660
649
  sglang/srt/models/qwen.py,sha256=xYkVmMZS2uMqWhfndc8EYm0olpKFnggfuMp_6aobVi4,10758
661
- sglang/srt/models/qwen2.py,sha256=2_e20-4uKqZ8IK7_bz26SuSVDt8UD237jVzxaWIr530,19915
662
- sglang/srt/models/qwen2_5_vl.py,sha256=6DdLfONY3ZDSCzWFPWSR8jKwVnvJh2lMx5ZZbJy9xok,22661
650
+ sglang/srt/models/qwen2.py,sha256=uF71yk7ZbW4ENbfdq7Sf4dWwZjLT2JNLyzkcFtmLEoU,20983
651
+ sglang/srt/models/qwen2_5_vl.py,sha256=SuJe8YfRQkJJo_bBSgRodY2-hUl_evYdNuAal16jrxs,22563
652
+ sglang/srt/models/qwen2_audio.py,sha256=linjXOVGhjyKk5DUx9Uw-BJa1N-YcqCFUpsj0Zr_98A,7877
663
653
  sglang/srt/models/qwen2_classification.py,sha256=dGrMm4ebd30_lBhHOhaV57ig2iOTx3nqB4GEzsrRIM8,2747
664
654
  sglang/srt/models/qwen2_eagle.py,sha256=6spFg6JYQGeUXLv2Q5eMkVzZvnqGyvW6SdVBtFMxlTM,4806
665
- sglang/srt/models/qwen2_moe.py,sha256=mrmEwGclGpfW-9aIRKGlvi9peecYKIE0SMvdk8Ek4Zg,23319
655
+ sglang/srt/models/qwen2_moe.py,sha256=fmVDsb4ju0suMCZiDAhocPxO9gQecOWOxmdf-W1elvg,24239
666
656
  sglang/srt/models/qwen2_rm.py,sha256=-mQXDEv11p-I1HXgYLTtY6ROem6UYorO958WsDrzsgs,2837
667
- sglang/srt/models/qwen2_vl.py,sha256=A6YGktXkc9rvotLo0KcZpoUP60eUcFzoiDG65UzXZeI,20941
668
- sglang/srt/models/qwen3.py,sha256=L-m441pSsduaayMzILrN3isnNqK7jVraUmm_6bEJb1M,14989
669
- sglang/srt/models/qwen3_moe.py,sha256=2nOngjhOw93m6nNx0Rc3fM0Yh5lBz_GM1Ri-FCRB-s4,30824
657
+ sglang/srt/models/qwen2_vl.py,sha256=Xo7f-ChWZJNJpM0RNe-GsYU4_VXPR62ZNMSXBVYr4QY,20842
658
+ sglang/srt/models/qwen3.py,sha256=3alBwittpU5m44DnJZ5mjRM0x1UShepu2CREWotPYqA,17777
659
+ sglang/srt/models/qwen3_moe.py,sha256=qP_UlowZPOOB9sALkRtaK3-gpXlsmgEJMaJ17bycpJ0,32867
670
660
  sglang/srt/models/registry.py,sha256=bH9H0OiNV0Cn7FRBM30Oh6dxICTs9mJscdLtHYPJvxc,3783
671
661
  sglang/srt/models/roberta.py,sha256=3k53V2Gbezk3jU-D03thXx8csGn5DxFK01ZQ9WFiWPI,9828
672
662
  sglang/srt/models/siglip.py,sha256=DIVJRwdtpLD2QT1kVPIHw7Bn9BE40xJbkHujDNzkjgA,9892
673
663
  sglang/srt/models/stablelm.py,sha256=0x_31uIr3WcWwecdPAI3ek9KkyKBJS7VwknTk2y0gjY,12281
674
664
  sglang/srt/models/torch_native_llama.py,sha256=oTxxof5Wx2b2egIwWx56LeHjtPGQleQ2zM5jXHMiuOU,19293
675
665
  sglang/srt/models/transformers.py,sha256=_CL0npi-_HvqzxkLgFhv2EE3bfGvCLXPYAtPFywZOr0,10260
676
- sglang/srt/models/vila.py,sha256=DRGJXP6iSv0XjgHYIJpMzBDNYZb3__Gg_wFkmZ5D66Y,9865
666
+ sglang/srt/models/vila.py,sha256=Q8Z4q8DH3SAiaYocGys6AkEpw8zg3-l3pb5wLcyVves,9780
677
667
  sglang/srt/models/xverse.py,sha256=DsNVI9JpzN4jj0Ry6aTrj7r-xq5YLOoDX2kH4YLJA-I,14035
678
668
  sglang/srt/models/xverse_moe.py,sha256=7KCM2-j12towDMNvXkuuYiBOmNauH6NG4Ip40x0khqA,16782
679
669
  sglang/srt/models/yivl.py,sha256=oToK7-u5IGO7xwpJIQ7VtudlK6-zPqJX4bt6_wv0SH8,4850
670
+ sglang/srt/multimodal/mm_utils.py,sha256=7o4w1W0VAWgEquVIz7qw7-IxYbZY2g3MrXw9php90oY,12621
671
+ sglang/srt/multimodal/processors/base_processor.py,sha256=05moS0iDYUfI9CKzio5ip8cjsfUjqYi_S5fzArWJxw8,21539
672
+ sglang/srt/multimodal/processors/clip.py,sha256=chKReTXD4ETUQ0s7BOk_AmWHEZXR5no6fprrnHwSNIM,1271
673
+ sglang/srt/multimodal/processors/deepseek_vl_v2.py,sha256=VHrUbOTF_18fPYaEx_awS1UMhOy0nhTXoA17wakwyQ4,3281
674
+ sglang/srt/multimodal/processors/gemma3.py,sha256=11tIvfpUAc9E_dkZZ-5kupUCn2TJ9e-yBriCpF38Ino,2084
675
+ sglang/srt/multimodal/processors/gemma3n.py,sha256=FzwkaEhk4ATn4nV9zkGdBgcHTTTVK5CbnTx_vBr0QxI,3116
676
+ sglang/srt/multimodal/processors/internvl.py,sha256=ffLizY9v3jYIm026UZg6MHBNadyUWYgag8HbL3hFtis,9334
677
+ sglang/srt/multimodal/processors/janus_pro.py,sha256=TOxSQH8gVirAYZvcQ_3Gd2uvNMzzWwubF4ROKDWUO9g,1913
678
+ sglang/srt/multimodal/processors/kimi_vl.py,sha256=2KMB6iEXizHXzE6yjtzS7V1RFhsA2hhuxk3Bx0ySMDM,1653
679
+ sglang/srt/multimodal/processors/llava.py,sha256=tIjeDPYxvMWUMXXLcfzzuaLPvdBtPrRzM25QzP0cnaE,7962
680
+ sglang/srt/multimodal/processors/minicpm.py,sha256=9Y8KCo5eCX274CJIx1D8BVWgferjc0Uf6Zd_HR_IMnY,5316
681
+ sglang/srt/multimodal/processors/mlama.py,sha256=bW0hVPtRMqYz1RR2I19QtZLUTTPzInZv_6ZhVPJBieo,1406
682
+ sglang/srt/multimodal/processors/mllama4.py,sha256=V2Y3G-bv2wdqkgE_XGPLMJp_nSEEr-MD8_S4h8QTDDk,5752
683
+ sglang/srt/multimodal/processors/phi4mm.py,sha256=ZYH1fWTpbz6wLGyV6c51kd54vwPRm0qdZiQcc0GlXGI,2337
684
+ sglang/srt/multimodal/processors/pixtral.py,sha256=VsCIFJpIUM3pSGNe_uRd8NlH7zSokW4xHOrZSi70R1o,4055
685
+ sglang/srt/multimodal/processors/qwen_vl.py,sha256=lKVWvvtB4OWfyJ9YZLuJapiW93cGb4T3SoqSAsPc1S4,6874
686
+ sglang/srt/multimodal/processors/vila.py,sha256=cfBY1Lmlndb-aNLpOyAffi7QPCI6rIYCdAnuxfaNcnA,2176
680
687
  sglang/srt/sampling/custom_logit_processor.py,sha256=AwODYVJdRkcQ8PGtJrhzKsqAgn8XZLQbAmR9fGiQzmc,1608
681
- sglang/srt/sampling/sampling_batch_info.py,sha256=JOGU-Fa8wPtytEJ30BHg1PldeNytwy8u31azLH436kw,13450
688
+ sglang/srt/sampling/sampling_batch_info.py,sha256=m8m-mXu3N8hLYFhAkRopePDT5Ozkd4KAmWDgM_9_4iA,14536
682
689
  sglang/srt/sampling/sampling_params.py,sha256=L2cU3MhAo9OvfdEtTdJidp9nTOkD6tiwlegxQ5vgIfU,6127
683
690
  sglang/srt/sampling/penaltylib/__init__.py,sha256=mtN8grFEcaBUhl4yBHmw8NNirt_i6uKO2cDNLHOpZQE,496
684
691
  sglang/srt/sampling/penaltylib/frequency_penalty.py,sha256=Loc3qjJTksNc5s-DV7QZHjgqoo5pxk7-nZzxwyhD2tQ,2144
685
692
  sglang/srt/sampling/penaltylib/min_new_tokens.py,sha256=rdU_D7RoIcrQPhysNQEzmr4TO2OoEi___p-i3QdwkgU,3331
686
693
  sglang/srt/sampling/penaltylib/orchestrator.py,sha256=XM-Lm6u7gYPtMZrTIc0FR4QxNZxBH5s_Cj82umyCzYk,5721
687
694
  sglang/srt/sampling/penaltylib/presence_penalty.py,sha256=NRh10AJrrQlGJ6S-enGdRefrTrWpyqrSm-aNnyqQNQQ,2119
688
- sglang/srt/speculative/build_eagle_tree.py,sha256=lxfaTEOTY0N9QTlgXSUae3DVtPLqW8CcYXWcHsxCJp4,11632
695
+ sglang/srt/speculative/build_eagle_tree.py,sha256=O9LJNaBflgJdWT94D-rGH1gJFJ18nst2oOD8HnA2mZ4,12859
689
696
  sglang/srt/speculative/eagle_draft_cuda_graph_runner.py,sha256=fSNaHYJOQUgy2_AHRlZPYSQRIMgSiL_Pz5h53eothx4,14239
690
697
  sglang/srt/speculative/eagle_draft_extend_cuda_graph_runner.py,sha256=sdIHbcWwgsXDoo64-T5veDuYB5eHC9QBwu2Ns29SCSI,14930
691
698
  sglang/srt/speculative/eagle_utils.py,sha256=cBQYqryCr4is5E_16xIcUue0Q2_Mn4meY8NCyuu4RAg,45558
692
- sglang/srt/speculative/eagle_worker.py,sha256=fjYJmzz8vYCf3xod0dYoGmwyFWh6iTjnGfbV6SdY32M,38105
699
+ sglang/srt/speculative/eagle_worker.py,sha256=iOwloJqhYIrgBdnZQz9NV3zuiAe5dXJJa0QeSIg92x8,38180
693
700
  sglang/srt/speculative/spec_info.py,sha256=rhaKG0TzyF9XZYHEWp1jccwTBohSNsUDvxHFtAoOl18,709
694
701
  sglang/test/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
695
702
  sglang/test/few_shot_gsm8k.py,sha256=qnEejCyPHGEMBEiNc7T4-t9lvoo2DNN72RXw-ei_TnY,4300
696
703
  sglang/test/few_shot_gsm8k_engine.py,sha256=Yf1Dg0Tk-tY4v1oj_UTxJ7950CWn6kRMbQKDjT2Orgo,3902
697
704
  sglang/test/run_eval.py,sha256=K4Z3OdMPvLeuGJhWWTBD0F-MOUFeBYLvsPnDQ44bd18,4036
698
- sglang/test/runners.py,sha256=AOnCXNGO9AYWrUShCDoxYajiN5yVFF9b8fT6XnwAWew,32439
705
+ sglang/test/runners.py,sha256=BmIxB7H5N0ib1Tmc88L2gLuRYpat_lkxAewtjA1fjbE,32804
699
706
  sglang/test/send_one.py,sha256=XNZdfZs21tXDBwrDj2pq46WQd5smiKoYETY8U09c1Z8,5079
700
707
  sglang/test/simple_eval_common.py,sha256=OW4Z7O33QqDySRFuHIC4Ouidfup4eaOEuR9i7xJzkDY,12379
701
708
  sglang/test/simple_eval_gpqa.py,sha256=8Xt9Bw05c7SZTYrCZgB68OZUqUbLo69ywiyx0bTvSUk,3220
@@ -714,13 +721,13 @@ sglang/test/test_dynamic_grad_mode.py,sha256=L76yUCuk_ymNpXD2CmO8r2GiGjIvD_gtTsu
714
721
  sglang/test/test_fp4_moe.py,sha256=U4LHzpGl6pCiCZiENRPxVP6hxqkqRZ_0WXbB29vYeAo,8187
715
722
  sglang/test/test_layernorm.py,sha256=2GMWqqNDuGvSMSsEBF5eDCzwVSYA9E6hGhRo6s4ecKg,3764
716
723
  sglang/test/test_programs.py,sha256=DJIbTChloPwaDiEWHQoSTuKv3BGx0-K8Y5e1mDDTACM,18910
717
- sglang/test/test_utils.py,sha256=UfVq6snSqzomW0sDTql54Vbefl6kVovbFx1R79y_mqw,36243
724
+ sglang/test/test_utils.py,sha256=u3L0E_5Evrv7Wjss_ZMNnro4HwMStQcUvg6cQvL_eBY,36778
718
725
  sglang/test/attention/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
719
726
  sglang/test/attention/test_flashattn_backend.py,sha256=_rTG849FwQdVTyGKkqhczaOqngBmRWXFmkl5NnuK1GM,13914
720
727
  sglang/test/attention/test_flashattn_mla_backend.py,sha256=g4O50WblTpM7_Gq2b76k0i25_z01BOUBQ4i6PmyxpO4,10774
721
728
  sglang/test/attention/test_prefix_chunk_info.py,sha256=hpoDe2wfSa6RlUbfyri_c0iyBTb35UXGL9I2Xh6jamM,7772
722
- sglang-0.4.8.post1.dist-info/licenses/LICENSE,sha256=FJXh51fvTQklojUFY89XVLsjxRcBqOxPs8XNy-2uZ0c,11346
723
- sglang-0.4.8.post1.dist-info/METADATA,sha256=isDKzDsTthshFCkEmL3isGMcgn1uBG3M2mvGolPE_xc,26609
724
- sglang-0.4.8.post1.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
725
- sglang-0.4.8.post1.dist-info/top_level.txt,sha256=yxhh3pYQkcnA7v3Bg889C2jZhvtJdEincysO7PEB09M,7
726
- sglang-0.4.8.post1.dist-info/RECORD,,
729
+ sglang-0.4.9.dist-info/licenses/LICENSE,sha256=FJXh51fvTQklojUFY89XVLsjxRcBqOxPs8XNy-2uZ0c,11346
730
+ sglang-0.4.9.dist-info/METADATA,sha256=tH3lSIOqvezltkU9P2f6oqUauU_5S8qnLr3jYUIRiV0,27125
731
+ sglang-0.4.9.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
732
+ sglang-0.4.9.dist-info/top_level.txt,sha256=yxhh3pYQkcnA7v3Bg889C2jZhvtJdEincysO7PEB09M,7
733
+ sglang-0.4.9.dist-info/RECORD,,
sglang/math_utils.py DELETED
@@ -1,8 +0,0 @@
1
- # COPIED FROM DeepGEMM
2
- def align(x: int, y: int) -> int:
3
- return ceil_div(x, y) * y
4
-
5
-
6
- # COPIED FROM DeepGEMM
7
- def ceil_div(x: int, y: int) -> int:
8
- return (x + y - 1) // y