sglang 0.4.9__py3-none-any.whl → 0.4.9.post2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (99)
  1. sglang/bench_serving.py +2 -2
  2. sglang/srt/configs/model_config.py +36 -2
  3. sglang/srt/conversation.py +56 -3
  4. sglang/srt/disaggregation/ascend/__init__.py +6 -0
  5. sglang/srt/disaggregation/ascend/conn.py +44 -0
  6. sglang/srt/disaggregation/ascend/transfer_engine.py +58 -0
  7. sglang/srt/disaggregation/mooncake/conn.py +50 -18
  8. sglang/srt/disaggregation/mooncake/transfer_engine.py +17 -8
  9. sglang/srt/disaggregation/utils.py +25 -3
  10. sglang/srt/entrypoints/engine.py +1 -1
  11. sglang/srt/entrypoints/http_server.py +1 -0
  12. sglang/srt/entrypoints/http_server_engine.py +1 -1
  13. sglang/srt/entrypoints/openai/protocol.py +11 -0
  14. sglang/srt/entrypoints/openai/serving_chat.py +7 -0
  15. sglang/srt/function_call/function_call_parser.py +2 -0
  16. sglang/srt/function_call/kimik2_detector.py +220 -0
  17. sglang/srt/hf_transformers_utils.py +18 -0
  18. sglang/srt/jinja_template_utils.py +8 -0
  19. sglang/srt/layers/communicator.py +20 -5
  20. sglang/srt/layers/flashinfer_comm_fusion.py +3 -3
  21. sglang/srt/layers/layernorm.py +2 -2
  22. sglang/srt/layers/linear.py +12 -2
  23. sglang/srt/layers/moe/cutlass_w4a8_moe.py +215 -0
  24. sglang/srt/layers/moe/ep_moe/kernels.py +60 -1
  25. sglang/srt/layers/moe/ep_moe/layer.py +141 -2
  26. sglang/srt/layers/moe/fused_moe_triton/fused_moe.py +2 -0
  27. sglang/srt/layers/moe/fused_moe_triton/layer.py +141 -59
  28. sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py +176 -0
  29. sglang/srt/layers/moe/topk.py +8 -2
  30. sglang/srt/layers/parameter.py +19 -3
  31. sglang/srt/layers/quantization/__init__.py +2 -0
  32. sglang/srt/layers/quantization/fp8.py +28 -7
  33. sglang/srt/layers/quantization/fp8_kernel.py +2 -2
  34. sglang/srt/layers/quantization/modelopt_quant.py +244 -1
  35. sglang/srt/layers/quantization/moe_wna16.py +1 -2
  36. sglang/srt/layers/quantization/w4afp8.py +264 -0
  37. sglang/srt/layers/quantization/w8a8_int8.py +738 -14
  38. sglang/srt/layers/vocab_parallel_embedding.py +9 -3
  39. sglang/srt/lora/triton_ops/gate_up_lora_b.py +30 -19
  40. sglang/srt/lora/triton_ops/qkv_lora_b.py +30 -19
  41. sglang/srt/lora/triton_ops/sgemm_lora_a.py +27 -11
  42. sglang/srt/lora/triton_ops/sgemm_lora_b.py +27 -15
  43. sglang/srt/managers/cache_controller.py +41 -195
  44. sglang/srt/managers/io_struct.py +35 -3
  45. sglang/srt/managers/mm_utils.py +59 -96
  46. sglang/srt/managers/schedule_batch.py +17 -6
  47. sglang/srt/managers/scheduler.py +38 -6
  48. sglang/srt/managers/tokenizer_manager.py +16 -0
  49. sglang/srt/mem_cache/hiradix_cache.py +2 -0
  50. sglang/srt/mem_cache/memory_pool.py +176 -101
  51. sglang/srt/mem_cache/memory_pool_host.py +6 -109
  52. sglang/srt/mem_cache/radix_cache.py +8 -4
  53. sglang/srt/model_executor/forward_batch_info.py +13 -1
  54. sglang/srt/model_loader/loader.py +23 -12
  55. sglang/srt/models/deepseek_janus_pro.py +1 -1
  56. sglang/srt/models/deepseek_v2.py +78 -19
  57. sglang/srt/models/deepseek_vl2.py +1 -1
  58. sglang/srt/models/gemma3_mm.py +1 -1
  59. sglang/srt/models/gemma3n_mm.py +6 -3
  60. sglang/srt/models/internvl.py +8 -2
  61. sglang/srt/models/kimi_vl.py +8 -2
  62. sglang/srt/models/llama.py +2 -0
  63. sglang/srt/models/llava.py +3 -1
  64. sglang/srt/models/llavavid.py +1 -1
  65. sglang/srt/models/minicpmo.py +1 -2
  66. sglang/srt/models/minicpmv.py +1 -1
  67. sglang/srt/models/mixtral_quant.py +4 -0
  68. sglang/srt/models/mllama4.py +372 -82
  69. sglang/srt/models/phi4mm.py +8 -2
  70. sglang/srt/models/phimoe.py +553 -0
  71. sglang/srt/models/qwen2.py +2 -0
  72. sglang/srt/models/qwen2_5_vl.py +10 -7
  73. sglang/srt/models/qwen2_vl.py +12 -1
  74. sglang/srt/models/vila.py +8 -2
  75. sglang/srt/multimodal/mm_utils.py +2 -2
  76. sglang/srt/multimodal/processors/base_processor.py +197 -137
  77. sglang/srt/multimodal/processors/deepseek_vl_v2.py +1 -1
  78. sglang/srt/multimodal/processors/gemma3.py +4 -2
  79. sglang/srt/multimodal/processors/gemma3n.py +1 -1
  80. sglang/srt/multimodal/processors/internvl.py +1 -1
  81. sglang/srt/multimodal/processors/janus_pro.py +1 -1
  82. sglang/srt/multimodal/processors/kimi_vl.py +1 -1
  83. sglang/srt/multimodal/processors/minicpm.py +4 -3
  84. sglang/srt/multimodal/processors/mllama4.py +63 -61
  85. sglang/srt/multimodal/processors/phi4mm.py +1 -1
  86. sglang/srt/multimodal/processors/pixtral.py +1 -1
  87. sglang/srt/multimodal/processors/qwen_vl.py +203 -80
  88. sglang/srt/multimodal/processors/vila.py +1 -1
  89. sglang/srt/server_args.py +26 -4
  90. sglang/srt/two_batch_overlap.py +3 -0
  91. sglang/srt/utils.py +191 -48
  92. sglang/test/test_cutlass_w4a8_moe.py +281 -0
  93. sglang/utils.py +5 -5
  94. sglang/version.py +1 -1
  95. {sglang-0.4.9.dist-info → sglang-0.4.9.post2.dist-info}/METADATA +6 -4
  96. {sglang-0.4.9.dist-info → sglang-0.4.9.post2.dist-info}/RECORD +99 -90
  97. {sglang-0.4.9.dist-info → sglang-0.4.9.post2.dist-info}/WHEEL +0 -0
  98. {sglang-0.4.9.dist-info → sglang-0.4.9.post2.dist-info}/licenses/LICENSE +0 -0
  99. {sglang-0.4.9.dist-info → sglang-0.4.9.post2.dist-info}/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: sglang
3
- Version: 0.4.9
3
+ Version: 0.4.9.post2
4
4
  Summary: SGLang is yet another fast serving framework for large language models and vision language models.
5
5
  License: Apache License
6
6
  Version 2.0, January 2004
@@ -239,8 +239,10 @@ Requires-Dist: prometheus-client>=0.20.0; extra == "runtime-common"
239
239
  Requires-Dist: psutil; extra == "runtime-common"
240
240
  Requires-Dist: pydantic; extra == "runtime-common"
241
241
  Requires-Dist: pynvml; extra == "runtime-common"
242
+ Requires-Dist: pybase64; extra == "runtime-common"
242
243
  Requires-Dist: python-multipart; extra == "runtime-common"
243
244
  Requires-Dist: pyzmq>=25.1.2; extra == "runtime-common"
245
+ Requires-Dist: sentencepiece; extra == "runtime-common"
244
246
  Requires-Dist: soundfile==0.13.1; extra == "runtime-common"
245
247
  Requires-Dist: scipy; extra == "runtime-common"
246
248
  Requires-Dist: torchao==0.9.0; extra == "runtime-common"
@@ -248,10 +250,10 @@ Requires-Dist: transformers==4.53.0; extra == "runtime-common"
248
250
  Requires-Dist: timm==1.0.16; extra == "runtime-common"
249
251
  Requires-Dist: uvicorn; extra == "runtime-common"
250
252
  Requires-Dist: uvloop; extra == "runtime-common"
251
- Requires-Dist: xgrammar==0.1.19; extra == "runtime-common"
253
+ Requires-Dist: xgrammar==0.1.21; extra == "runtime-common"
252
254
  Provides-Extra: srt
253
255
  Requires-Dist: sglang[runtime_common]; extra == "srt"
254
- Requires-Dist: sgl-kernel==0.2.4; extra == "srt"
256
+ Requires-Dist: sgl-kernel==0.2.5; extra == "srt"
255
257
  Requires-Dist: torch==2.7.1; extra == "srt"
256
258
  Requires-Dist: torchaudio==2.7.1; extra == "srt"
257
259
  Requires-Dist: torchvision==0.22.1; extra == "srt"
@@ -419,7 +421,7 @@ Learn more in the release blogs: [v0.2 blog](https://lmsys.org/blog/2024-07-25-s
419
421
  [Development Roadmap (2025 H1)](https://github.com/sgl-project/sglang/issues/4042)
420
422
 
421
423
  ## Adoption and Sponsorship
422
- SGLang has been deployed at large scale, generating trillions of tokens in production every day. It is trusted and adopted by a broad range of leading enterprises and institutions, including xAI, NVIDIA, AMD, Google Cloud, Oracle Cloud, LinkedIn, Cursor, Voltage Park, Atlas Cloud, DataCrunch, Baseten, Nebius, Novita, InnoMatrix, RunPod, Stanford, UC Berkeley, UCLA, ETCHED, Jam & Tea Studios, Hyperbolic, as well as major technology organizations across North America and Asia. As an open-source LLM inference engine, SGLang has become the de facto standard in the industry, with production deployments running on over 100,000 GPUs worldwide.
424
+ SGLang has been deployed at large scale, generating trillions of tokens in production each day. It is trusted and adopted by a wide range of leading enterprises and institutions, including xAI, AMD, NVIDIA, Intel, LinkedIn, Cursor, Oracle Cloud, Google Cloud, Microsoft Azure, AWS, Atlas Cloud, Voltage Park, Nebius, DataCrunch, Novita, InnoMatrix, MIT, UCLA, the University of Washington, Stanford, UC Berkeley, Tsinghua University, Jam & Tea Studios, Baseten, and other major technology organizations across North America and Asia. As an open-source LLM inference engine, SGLang has become the de facto industry standard, with deployments running on over 1,000,000 GPUs worldwide.
423
425
 
424
426
  <img src="https://raw.githubusercontent.com/sgl-project/sgl-learning-materials/refs/heads/main/slides/adoption.png" alt="logo" width="800" margin="10px"></img>
425
427
 
@@ -3,14 +3,14 @@ sglang/api.py,sha256=rcp3GeoyZhmJ0GDLPRkuZNcxd0TBJy_wfUDpcmQoqW8,7210
3
3
  sglang/bench_offline_throughput.py,sha256=TwgXZYmwPaHVsdPtNU9LO0p1tr5OOKLy9wYgrfGAlFU,14056
4
4
  sglang/bench_one_batch.py,sha256=RJsXQ7pvq8y4yzW7svURtWZF5RiawxEMrsjV0OcKsrk,19388
5
5
  sglang/bench_one_batch_server.py,sha256=LS1BRmFwP67IpYlU5wmkWjqquiA5drvtWe-fwHnFSKI,14170
6
- sglang/bench_serving.py,sha256=sQKEgJZIfHRu3vNh8QWqIrTQzOfUMaoVidG05ewTVUE,71744
6
+ sglang/bench_serving.py,sha256=nOjDnqOKDezDvtCvEhC1_FAoWVkir38bSaEIcSGGVZg,71748
7
7
  sglang/check_env.py,sha256=qDMIG2rCNBH1yKnxQmF-Bp10oiFMUKMgfZLHZYOmdSY,8412
8
8
  sglang/compile_deep_gemm.py,sha256=H118s76CKdpZr-cDeFfBCePe7--c_teEBNVIzchYVSo,6243
9
9
  sglang/global_config.py,sha256=xzLdk8W53fneFblNh8iIjGF9C3-7mnzR1-LleD9Btxg,1495
10
10
  sglang/launch_server.py,sha256=mDXfwha8LHpWQJekcCosR98QhCQsbmilsBlI5jAIgg0,420
11
11
  sglang/profiler.py,sha256=tEHzHerXC-ymk4OrkoUcMbgcGHmb8VESthsNSP2Yx9w,4417
12
- sglang/utils.py,sha256=VH6zrnkjzcR3DE__WfVph6wswJ4JuzoQD47VmbZ38eI,16435
13
- sglang/version.py,sha256=LdxLMJM_JXsCQBeSvnxCNyGWmINE0yWfna3DQaT41Vs,22
12
+ sglang/utils.py,sha256=leKs-YyX1_Jk216yoKX-KRYx_EbLiuemsHbD31xSjMw,16445
13
+ sglang/version.py,sha256=2VQK7_pzesJW0_F_Vd4w5UmkEfHPeIjSBRrIXNIBvAU,28
14
14
  sglang/eval/llama3_eval.py,sha256=gWSboDchIGybIce88bJlrCG0yiLZ513mw4gcutJlzGM,10017
15
15
  sglang/eval/loogle_eval.py,sha256=pRPVA4fxGmT3_oXvXnlNE-UlPrcQGLBJF-OSE9YWJXM,4336
16
16
  sglang/lang/chat_template.py,sha256=HKlx7snSWFED8GKF5ex79sQrPWFw5TSXQM0_LsiD9Bc,20552
@@ -30,20 +30,20 @@ sglang/srt/_custom_ops.py,sha256=0lJRMTKTjoxJPh1qQnnMY02Z3SyBDi7LJI34IBLQsgQ,446
30
30
  sglang/srt/aio_rwlock.py,sha256=6LYtOdeTUY3hkfa1dmYkgsaF2ttrwIF3hUWz2AZ2fqw,2970
31
31
  sglang/srt/code_completion_parser.py,sha256=KFa95OU0TeVjJkOqIgS4xV3kaJ5dFWOmAAgISyc1oEc,3803
32
32
  sglang/srt/constants.py,sha256=0i-tEwG2BSYNDy96MxnGHV5HnBELkYcnsVGsE-R18o0,93
33
- sglang/srt/conversation.py,sha256=fFP6RxkRolz-YLl55o0juzp0Ov-78j89RCt7Cflzr2Q,38335
33
+ sglang/srt/conversation.py,sha256=NeXU0CFdx_b8gLvmNCXjbqllXTTNAfQCD7mr6JrVtHw,40360
34
34
  sglang/srt/custom_op.py,sha256=87r2PIgiGLREsIZQ8qsUD-zgI66_54y9GrE0buXzoCI,3076
35
35
  sglang/srt/debug_utils.py,sha256=slaFOY4BYDBFatkfu8FZlzai-u4LFS-5GUzdr-t50zE,2241
36
- sglang/srt/hf_transformers_utils.py,sha256=1Ku6POAyk1Hb4Q1VcHTE_2EjujVhPerPO9V9NAcHbOI,11997
37
- sglang/srt/jinja_template_utils.py,sha256=Jc6Vl-lYtUyMBSWWQGIMpJQ1O-ceU9c8DbOi_bN-oVk,6719
36
+ sglang/srt/hf_transformers_utils.py,sha256=X3lntqlG9h7zNvAonhj47St0AR8Nx5NUHjn0wWYxTlw,12457
37
+ sglang/srt/jinja_template_utils.py,sha256=0c6nQjkGukmyXsqQ9r85R5QK9CafnjqXyrXF4K3aFhE,7177
38
38
  sglang/srt/model_parallel.py,sha256=eLXZhvJ4wG6dh0FontNCIdVZvHYdWgaeY-5cu7TD9tE,6078
39
39
  sglang/srt/operations.py,sha256=ddQ8KO63L73OciaR8MZ9h2h83gKVY4-WuWgeEGowPJA,5346
40
40
  sglang/srt/operations_strategy.py,sha256=Pwd2sKeRtKh9WJXgzlNr2tU9y6YMcI3MDLbatHqlMws,7145
41
41
  sglang/srt/patch_torch.py,sha256=OUPCGQSQz3MVZB1zZ_Eq8lXiw0uIKJ_HWjqQolI8FsM,3088
42
42
  sglang/srt/reasoning_parser.py,sha256=DkZrFhkJ9qe7w46fTnM9sqhXwTDgZxD4qPdGka-Dly8,7579
43
- sglang/srt/server_args.py,sha256=Fg1CqO92iiKA5jLd9vqKZ59uwnw0l23DO6KL47kBJgY,75458
43
+ sglang/srt/server_args.py,sha256=HOwXUp6ver6xVZNaRJH-A9rtC_VpM7tPyMBF08JFOl4,76138
44
44
  sglang/srt/torch_memory_saver_adapter.py,sha256=K_eTx0UU84MHSTXI3iqYLdHV4IWtJMJ2FKdGFJR8v1E,2417
45
- sglang/srt/two_batch_overlap.py,sha256=kunhMhCF_ucK4EkthOUEUegd1C9j4aSbpBLYaIKYgas,28447
46
- sglang/srt/utils.py,sha256=pI-0YtHmQrC2B2Q_uK13qvje1y_ni6TNzqs8W7T3hts,85846
45
+ sglang/srt/two_batch_overlap.py,sha256=Pqqj4BzVbXCiOvWE20MGMo21AoAmEPd0R32DsPfD5c8,28562
46
+ sglang/srt/utils.py,sha256=mQE61yjzwgI8iwxrcaiZk4Zeyd69S3ErBuXQuYNita4,91714
47
47
  sglang/srt/warmup.py,sha256=zldxhMlXpclRAJXmfBjJNUJd1eDizVdysibBvQyTVuA,1782
48
48
  sglang/srt/configs/__init__.py,sha256=8EcVRP95epZ49DxBa6LgKWt7eO3Qe7Hrr3V1c6HkMnY,553
49
49
  sglang/srt/configs/chatglm.py,sha256=j-b0YkdYUmQm2y1kNmMJtKeACxWKmBbvNNkDWbs6kbI,2907
@@ -56,7 +56,7 @@ sglang/srt/configs/janus_pro.py,sha256=95qLFQ43n-q5MVEDnh9OBXCUNXOCofwBKYvd7LKPv
56
56
  sglang/srt/configs/kimi_vl.py,sha256=4W7VQI3pr888ZsFA2SqCQo4mI0seXTOrGQ-x3oTvWew,1358
57
57
  sglang/srt/configs/kimi_vl_moonvit.py,sha256=hx2Rt4JSFbvy2HUTeLjBpge87m8M6ITAhqsgdNf_Jd4,1163
58
58
  sglang/srt/configs/load_config.py,sha256=qs-AxuplouBx2tsv9KGBOLZPbwzuVA4vbktbGP_cRp8,3309
59
- sglang/srt/configs/model_config.py,sha256=EzF91fOMu97BxPFSrVU4r-RTuUS3pqoDObKAstnPxGE,26983
59
+ sglang/srt/configs/model_config.py,sha256=N-S1xKCEH-5LqVfL9VEGKUHRFAujFgczB6tIk5Jr-_Y,28333
60
60
  sglang/srt/configs/update_config.py,sha256=2EpDVocEpMv35g1V-iPLSaLjBgylC5vN0yYSlW49k5w,4664
61
61
  sglang/srt/configs/utils.py,sha256=3nHUfisMs_Ltuhv8OZTNCJp63YJKJVF43h1QZB1zqx8,670
62
62
  sglang/srt/connector/__init__.py,sha256=czLX5JOxuMhH-T9eSJzoc1qv1B4z9chyffDRL5I6wo4,1247
@@ -80,7 +80,10 @@ sglang/srt/disaggregation/kv_events.py,sha256=yFbtwOeblcCmOXTjg00TopxnyjkmCBQIVz
80
80
  sglang/srt/disaggregation/launch_lb.py,sha256=mcbAztN4gnHevw_T5R2_nWsymsDEY9vHkm7OJ1vr6cc,4211
81
81
  sglang/srt/disaggregation/mini_lb.py,sha256=BBeIdeZZxi7Ra5_hukHHX3TNdyfZ4tP1GBUxC-qrv_g,14401
82
82
  sglang/srt/disaggregation/prefill.py,sha256=3u6WCrjogZSqd6yWdBZe1HO4lf6w2e9M7sQtGHyax-Y,23512
83
- sglang/srt/disaggregation/utils.py,sha256=pKy2MDWqnfHmktc7bJg0hi_x92ellCtfWB-RJSg1jSw,11343
83
+ sglang/srt/disaggregation/utils.py,sha256=ql5p9yjBCRcR0YMgcgRK6tH0kPGvLNTUgeXBr_BUcoI,12198
84
+ sglang/srt/disaggregation/ascend/__init__.py,sha256=-lxnica6fZYmYNpKwmE8yESUpQ5Sxf2DiZoBHzboKc8,146
85
+ sglang/srt/disaggregation/ascend/conn.py,sha256=FOYrGtEhj58iTjhYT1eP96DpyxBLFFR87icqYCzWmCY,1215
86
+ sglang/srt/disaggregation/ascend/transfer_engine.py,sha256=_4PszsQL6wICdg5cqpR2N9TbZpUY6bBX8tgE3xeaYfc,2137
84
87
  sglang/srt/disaggregation/base/__init__.py,sha256=4VwUv0aWxwmVL1049XK82aLTNxmt0WY5RPy9li-wyVk,160
85
88
  sglang/srt/disaggregation/base/conn.py,sha256=CPDAoAkYaFtVPLa1QROfwipSVe7MH6omzIBHzo8TSYk,2811
86
89
  sglang/srt/disaggregation/common/__init__.py,sha256=7yl-EGLMVKRpBUaGF_7lwAsw2J_mqpRZV0238VGxD9o,126
@@ -89,8 +92,8 @@ sglang/srt/disaggregation/common/utils.py,sha256=SxRhAWisNK8seGhb5BXBJ5u53DF7yeK
89
92
  sglang/srt/disaggregation/fake/__init__.py,sha256=jJGWdXwaQiGIoR6atKqkQfkJmVyQ09l55VUN2WjwaeY,77
90
93
  sglang/srt/disaggregation/fake/conn.py,sha256=oD1DArn1yDFZCu-X6p93uSLlAXEkt9lYxERICMznxGw,2286
91
94
  sglang/srt/disaggregation/mooncake/__init__.py,sha256=0TgqkAdQI1YynbHY6c0QISvVoOSk-0SwCIq5rjPSmgE,156
92
- sglang/srt/disaggregation/mooncake/conn.py,sha256=MATJkiS_5Vh8fc8Gx6S6cI3zCYDbgKXVEAa1xkUsCKA,58879
93
- sglang/srt/disaggregation/mooncake/transfer_engine.py,sha256=JYB9T-EPdJNfv4I_sVpmMOZCOJ14itD97ws6tTvj240,4281
95
+ sglang/srt/disaggregation/mooncake/conn.py,sha256=GUC1LUuO-PI7TmiZg-KBXpyccYCwE5K5byoV2eHxIFw,60891
96
+ sglang/srt/disaggregation/mooncake/transfer_engine.py,sha256=a3pki0d7QauTn6slt7gVxjicABP6Uo4Ztt0wEXR9dZc,4687
94
97
  sglang/srt/disaggregation/nixl/__init__.py,sha256=qODVPIGWUXKXq4zsRIcMYoAoAeg6nBIN9vdQOlVMANE,136
95
98
  sglang/srt/disaggregation/nixl/conn.py,sha256=cXqWU2Gbi6E2LS0MznEcgFCrwONhYxBtD-zE9DU32z0,20333
96
99
  sglang/srt/distributed/__init__.py,sha256=jFOcyt-wFAPMBUAf9zkZalNQlt-4rqmT6pCKBz1E4qo,149
@@ -108,13 +111,13 @@ sglang/srt/distributed/device_communicators/pynccl_wrapper.py,sha256=LblisImY9d6
108
111
  sglang/srt/distributed/device_communicators/shm_broadcast.py,sha256=d8mykYmXM1lfbPm8GNtqCF0Un_pdXYjbNmsgoVFyyow,20874
109
112
  sglang/srt/distributed/device_communicators/xpu_communicator.py,sha256=ajW6132BvA6jkeipEIgN27TFycI0U06Ih2Z8WNjlA4s,1593
110
113
  sglang/srt/entrypoints/EngineBase.py,sha256=yKN76witT2jz1zhmLHmPNLGMpK2UiOTaKQ2KPD8l99U,2594
111
- sglang/srt/entrypoints/engine.py,sha256=o6sccP-gdeO6rOY9vbSqVmUNlBrK2YsinrDf42URg5A,31328
112
- sglang/srt/entrypoints/http_server.py,sha256=7q6TK02vkppIrW_oa_Xxhr-EV3SNaAwAt_pcnLNfC8w,37503
113
- sglang/srt/entrypoints/http_server_engine.py,sha256=ncN45ti9mawSOimPSedI6zugfoMhMQOYh4tmdfC9LcE,4936
114
+ sglang/srt/entrypoints/engine.py,sha256=zZGuZVdyCPf1WeCRb1Lde7fIlAT181IKT1CCmK8AHrk,31328
115
+ sglang/srt/entrypoints/http_server.py,sha256=pUZgA7ILuRynIY3Cs2nbFoXSnZ7ohsMauF_RBtl-V_s,37538
116
+ sglang/srt/entrypoints/http_server_engine.py,sha256=_--j4U04OeJLlnnv1f0XmCd_Ry0z1FlhkrbePX8rYV0,4938
114
117
  sglang/srt/entrypoints/openai/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
115
- sglang/srt/entrypoints/openai/protocol.py,sha256=qIwhokAlAVbp7Nin1eE4TCnUyrAhKcPS47kzHkhzZg4,18799
118
+ sglang/srt/entrypoints/openai/protocol.py,sha256=oAd5u_J6Wk9gzXVPS-Ps8VaxkhmMXyIuH1KZ73pEOvQ,19083
116
119
  sglang/srt/entrypoints/openai/serving_base.py,sha256=5NJ2S_6B2NFSwn4nLp6eaeJ5iC3IcQzMEY9lW_gPcdA,5246
117
- sglang/srt/entrypoints/openai/serving_chat.py,sha256=tWKWjspTpNnuk-Aqfl_S6OmpZe6gz5XxmSGEwfIvCsY,35935
120
+ sglang/srt/entrypoints/openai/serving_chat.py,sha256=QhHvqRjbzwsTQNtRhia7UJd2BlXnxWD-7udRsX_8H8s,36233
118
121
  sglang/srt/entrypoints/openai/serving_completions.py,sha256=emIutVmnJgOgGRuAqdB80-kVHUfQbE67n1VS-76o4QY,16690
119
122
  sglang/srt/entrypoints/openai/serving_embedding.py,sha256=hqPt2ELpT1yQ8sBXo801aLJ3sExoPXs_K5ZQtC2vpAs,6274
120
123
  sglang/srt/entrypoints/openai/serving_rerank.py,sha256=8n6y5kC6UhRpWrDtzH0eIp0dznW12FT60MLCR4bvD2U,3333
@@ -136,7 +139,8 @@ sglang/srt/function_call/base_format_detector.py,sha256=eMSqbx99YPm2m_ChLafFRuLO
136
139
  sglang/srt/function_call/core_types.py,sha256=wLUsW8mUA-i-ISz5QUDL7Ejq72W-K1HIhFa9Wm-_oA8,786
137
140
  sglang/srt/function_call/deepseekv3_detector.py,sha256=XudIiIt2Mejokg6qOkX7vYS-3XIFstOBHv-m-Q5fBLQ,8970
138
141
  sglang/srt/function_call/ebnf_composer.py,sha256=1r5UPEkUeMCug-P-c1mAZbJPgEXU8hR-fDLdYG5Q-wo,13585
139
- sglang/srt/function_call/function_call_parser.py,sha256=IB3QXZjedOFhXcLIOWSiceE_dOqGPcHqqnALu3w-_VY,7682
142
+ sglang/srt/function_call/function_call_parser.py,sha256=YqtfxJYu9kWZIJTtM20miH2duXIvG6CWintBZ3_7SfQ,7785
143
+ sglang/srt/function_call/kimik2_detector.py,sha256=wb--wnAp-ZtWeIJZM1dS33GNu-K9lGxvrFbtp-UmGVk,8978
140
144
  sglang/srt/function_call/llama32_detector.py,sha256=EHYGAy1NCIxFWKdSQByPxyJgFaFRCtGdgj4ntEAgi00,3619
141
145
  sglang/srt/function_call/mistral_detector.py,sha256=xNuVl2vDXVYbXyiXLkJZ9VM6njcwlS9EqryR1eJbMr4,4462
142
146
  sglang/srt/function_call/pythonic_detector.py,sha256=rtXSflE4w993a4OqphWG-WQzvwRz0v3dfgHOnte1fpI,8731
@@ -144,22 +148,22 @@ sglang/srt/function_call/qwen25_detector.py,sha256=9JfZem_5nw91Og2biwq8eIpUQjy_3
144
148
  sglang/srt/function_call/utils.py,sha256=__ImDF2kNyoLWsYO5RYoryvy1mmgEjnjXlCvLv-uLCM,1695
145
149
  sglang/srt/layers/activation.py,sha256=UDrJcnQoIOJjMzZ9XAy5JlEJ-do44tGMtcitY7I8kPQ,7327
146
150
  sglang/srt/layers/amx_utils.py,sha256=1mENgHK2B8mgaD1oMtgbZ15Jmy_Uu1QueBmo09Ff2iA,2865
147
- sglang/srt/layers/communicator.py,sha256=_aq6rDgDlRRVXO1EquSNtmMADuQJGdRZkbt0vCxTxqo,19314
151
+ sglang/srt/layers/communicator.py,sha256=yckTsQ_3SeADES7maU2bgIpzwbWu3Q3Qpxu8T8UpCoQ,20045
148
152
  sglang/srt/layers/dp_attention.py,sha256=V7m_PfvHHtRMJMviIqmoyqf5VFFJLYYcynDuI5dXtAU,10275
149
153
  sglang/srt/layers/elementwise.py,sha256=MyQUflyKEfPZ-BggW1Kd4hB53RFD6FXGc2S5LXjx_do,16026
150
- sglang/srt/layers/flashinfer_comm_fusion.py,sha256=IwI3VPHVZaWTgf_rsSH_5QROTcmoWnjlZ9annh7cYRs,5888
151
- sglang/srt/layers/layernorm.py,sha256=4KGaB4QSO5hBcr26TtPfspD3XZwr5X55Pkn5xN9eJrQ,8647
152
- sglang/srt/layers/linear.py,sha256=cxth3pvLGdud-ZoHrGFhrPeuhLnBX4IWohyBr2gCCv0,54890
154
+ sglang/srt/layers/flashinfer_comm_fusion.py,sha256=fkTcAB7qYwSWi95qI3Rqq0JUyDpJdcYkd4TYkWO01HI,5891
155
+ sglang/srt/layers/layernorm.py,sha256=ooqA-t-vY5erbKBwqnOotfDsJRTygP5E10CfzEAVF6M,8657
156
+ sglang/srt/layers/linear.py,sha256=7XQvKQL7oS1o8aw3i0XRj4JcV6OOwGycdYJZO21AXvE,55355
153
157
  sglang/srt/layers/logits_processor.py,sha256=tOPMYopEQuoLBzwbjSmU9OWFYh2mmy3ViJSbA_wpFOU,25619
154
158
  sglang/srt/layers/multimodal.py,sha256=YVR69WW-2aGDcZHT8IVJ6F_LRM7wraZr8VjrPDXqDmA,2104
155
- sglang/srt/layers/parameter.py,sha256=hu1l8Yzd38xQfkRaIOE1ouzxjG6Ro84pt6SfoUB61qU,16936
159
+ sglang/srt/layers/parameter.py,sha256=jCg0G-12GZqTa9gGOqEtVCsnnuBGnYg0VmF6pc6oCFg,17455
156
160
  sglang/srt/layers/pooler.py,sha256=uZ6WX1FLMEafZwusyZdm6KuVlIwSjbKrdwk2qzgqNGk,3812
157
161
  sglang/srt/layers/radix_attention.py,sha256=IlqRB4bk06FOH05_7zB8lik0xLpys7jFooLeCwdO0j8,3437
158
162
  sglang/srt/layers/rotary_embedding.py,sha256=EhxI0E8jcTWZ2COpnku7crbW8Hew5fe_ujMndj7hKvE,52246
159
163
  sglang/srt/layers/sampler.py,sha256=xNds1migup2s6b9_pS6ljkJUkvNtv7nmTGeIdOzoQ6w,11182
160
164
  sglang/srt/layers/torchao_utils.py,sha256=Ws24FdRBSkTpyeyA6bQrdDm-W5wfDxKvSIPUSahyMfA,4063
161
165
  sglang/srt/layers/utils.py,sha256=IWGg1Hb7c33Z3LHRPVJyUAzp3BnSid23ZWXAmJ_Jvp8,1204
162
- sglang/srt/layers/vocab_parallel_embedding.py,sha256=1Av2YHpx-Oa18-33ps0lpkOuUgnY-Y--Yt_I7YcpYBU,23438
166
+ sglang/srt/layers/vocab_parallel_embedding.py,sha256=i1Uoo8TE877jLNjAjwoyMD36W7J3WwFD402YWq0qTT0,23560
163
167
  sglang/srt/layers/attention/aiter_backend.py,sha256=7sEUgViw-xl3yok91yyOD9gTi8lQmME0g0ZiKVTCcyI,32851
164
168
  sglang/srt/layers/attention/ascend_backend.py,sha256=jPCsU9_gH1iZNoZHD9nCeDdVdXqBt31LI65N55BTJPg,8250
165
169
  sglang/srt/layers/attention/base_attn_backend.py,sha256=KXVcCguwXh-PSrY9Y2aUrlXXUhWdbVxqVEF2_xIMvm4,3466
@@ -184,16 +188,18 @@ sglang/srt/layers/attention/triton_ops/prefill_attention.py,sha256=waZsmpKIp8rTg
184
188
  sglang/srt/layers/attention/triton_ops/rocm_mla_decode_rope.py,sha256=664WnAJ91EiCUZOcnVDfbTQf4uGJ4ZDZB1CbxpEUFZc,13866
185
189
  sglang/srt/layers/moe/cutlass_moe.py,sha256=--bNTA2BGbHeULb_XXDoRUyWWbE-doHo5K5k1T0N0WA,14323
186
190
  sglang/srt/layers/moe/cutlass_moe_params.py,sha256=9NRCmgP_Ug3gGqCcpi-x-QRbLjCNpw8792gKXwZsbEU,6522
191
+ sglang/srt/layers/moe/cutlass_w4a8_moe.py,sha256=bc8s5Oc36pCF0VozxZuqFOOU2fov-4wGPlyduye3Imk,7296
187
192
  sglang/srt/layers/moe/fused_moe_native.py,sha256=bW3KWxxz9rxKMUQqfmAtF-7ptTODA1pwLydE05ABDJE,5030
188
193
  sglang/srt/layers/moe/router.py,sha256=UrPieRvemN7Ew48gtG7DA2xhNDBRSnZxzugTEBI-0_E,12006
189
- sglang/srt/layers/moe/topk.py,sha256=DhG8EIqyhn41erCKRwX2wGrYOOF-1VdBrCZwyyc1Ks0,18048
194
+ sglang/srt/layers/moe/topk.py,sha256=FxmdIdyMbRqIequtfwaLsz9Go-1lRooH8d8HBfQ0pvw,18426
190
195
  sglang/srt/layers/moe/ep_moe/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
191
- sglang/srt/layers/moe/ep_moe/kernels.py,sha256=bHn50WQ9K57wLxLWZ8ytNJrCi7bAQ6MegN2o7qxB_Mc,40690
192
- sglang/srt/layers/moe/ep_moe/layer.py,sha256=DjUSrRAiRzvuDRvF3JyTqupL3z7smzwXO9hQpQOK0Io,56658
196
+ sglang/srt/layers/moe/ep_moe/kernels.py,sha256=_pb2_5sNqbkImh4Ylv0hWhEQCOmItvPqB-b3dsfDHc4,42604
197
+ sglang/srt/layers/moe/ep_moe/layer.py,sha256=Jl1TolpjQMtpMC2QXq5X5IA3vkF9UlfxlLl8r6qqN2k,62485
193
198
  sglang/srt/layers/moe/ep_moe/token_dispatcher.py,sha256=aiBE3mjvWV3eBrFGH9J44tuJncQwOjRS_XeyBNCEtqM,24379
194
199
  sglang/srt/layers/moe/fused_moe_triton/__init__.py,sha256=h9yMFAL_bagUf-qBED8gSWdCOb7d8IdA-pE-L_nIg8E,842
195
- sglang/srt/layers/moe/fused_moe_triton/fused_moe.py,sha256=GQk0WVdPYI1lOsa0ItkiYcGHS_k8r5y7Mfy485MBZl8,63177
196
- sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=wsNUtzqE2Emi0RAwVzpFHUOVOqUMXr3pCMSJHqkc7EE,34126
200
+ sglang/srt/layers/moe/fused_moe_triton/fused_moe.py,sha256=Ffcu3Jvp7-nllybh5EWtG0MamWI9PqO8a6ESiMKWEB0,63292
201
+ sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=5NQh7_17xTtwSFClwgvpnzXrEO9iitl8aKfMm4jWJCo,37556
202
+ sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py,sha256=hoWVdf8ry8IDGH2bfk2WW-y2S5h5haLTGanBSwkkeE0,5848
197
203
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_1_0/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json",sha256=iNGsE2ZeVnQEnN4A8UJ9Jv0d3hbRF2MJ9oBgjup5Szk,2737
198
204
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_1_0/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB.json",sha256=JJN0hryyLr5Zv3dSS7C8cPFhAwTT6XxUVnBGMZvV6JA,2752
199
205
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_1_0/E=1,N=1792,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json",sha256=ouRyZ5PEMPP2njPftCNhs-1g1y6wueWLmhI7G1SjV1k,4131
@@ -356,24 +362,25 @@ sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=wsNUtzqE2Emi0RAwVzpFHUOVO
356
362
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=128,N=384,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=LNx1W_BsWZcpHomiScCRap46dV0-F7S_w3Htskoqlm8,3263
357
363
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=257,N=256,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=fo1akCuGoqcGwQgfh56hApgg-wLXfo9kHHksE_6m1F4,3262
358
364
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=8,N=7168,device_name=NVIDIA_H100_80GB_HBM3.json",sha256=a9XJZ0XudUTebAdN5guVq-3XSvZetHIRjatO1-_0xCk,3257
359
- sglang/srt/layers/quantization/__init__.py,sha256=isMl8LINJFMzEse4r2Ta_7JXT15eKCX4mDIikuwticM,12559
365
+ sglang/srt/layers/quantization/__init__.py,sha256=JHV4X982TW7_U7ZobQwNIdK-Z5saEH-R1xKWrF6jgRg,12650
360
366
  sglang/srt/layers/quantization/awq.py,sha256=KemDG55U3B6YZVjMV71awVAIj0islFvtxcUHmOBeGy0,6739
361
367
  sglang/srt/layers/quantization/base_config.py,sha256=jWk_egQrVNMYmQgbTI9vkcgzScLFjB5_sywFlAfE5J0,4776
362
368
  sglang/srt/layers/quantization/blockwise_int8.py,sha256=vWyPZsRLhdKtSmjvlT5fsowBK_nEebYbDAUh2yqseGw,15285
363
- sglang/srt/layers/quantization/fp8.py,sha256=fPzEIAYqiSgVjVTu6_CceyW-kemzSRGS_Q-FZ0eGAD0,46375
364
- sglang/srt/layers/quantization/fp8_kernel.py,sha256=vziHnk-gVbeY3z94216UDCU5kyev36ZrKldMgglSmpw,34718
369
+ sglang/srt/layers/quantization/fp8.py,sha256=X97n8M7Kqhv98JvVQsSW6oYJtI2Wwrnoix-LMtsaxu4,47468
370
+ sglang/srt/layers/quantization/fp8_kernel.py,sha256=PuDdACPV8xFQwcEAY57L465-yPJHbbJBKOlo1vuEOPM,34744
365
371
  sglang/srt/layers/quantization/fp8_utils.py,sha256=fsX1x17RwcK88N1WpF-YELQOpkpHvJnoLriZj27H2R8,25611
366
372
  sglang/srt/layers/quantization/gptq.py,sha256=B0J14a-OANM2uglnatukFMlvpDnUprV3-p_l4308WUQ,26838
367
373
  sglang/srt/layers/quantization/int8_kernel.py,sha256=GfRC9FOn9exNvK4QHbUeBj3Hhv32VcyGphapFPt5b84,12625
368
374
  sglang/srt/layers/quantization/int8_utils.py,sha256=YK9CS-lb_n91kNCTKK5o5apYF31V2giDg5G5VKrpcUA,2356
369
375
  sglang/srt/layers/quantization/kv_cache.py,sha256=_9pF5rwvB7ta6Gdc5YKVVGbNzYwqmhIx4TrX1-xnodQ,3261
370
- sglang/srt/layers/quantization/modelopt_quant.py,sha256=wW90ZS1ZrGOXf7l5svudmXqAi3JE2SkCV-fwqWeYfdg,30905
371
- sglang/srt/layers/quantization/moe_wna16.py,sha256=9w3TYF1aQ0N0zNBgcuyOX-z-zfq4it2ul_MjKk_fPCA,19680
376
+ sglang/srt/layers/quantization/modelopt_quant.py,sha256=0abOZfOyGYOQFiyMssZPey1YekQrAQBcMp-GQlrFXZY,40746
377
+ sglang/srt/layers/quantization/moe_wna16.py,sha256=Fb7qc4fHec9Qst1ne55YqNAJvO5D3JoMMkhYrYh8vzE,19646
372
378
  sglang/srt/layers/quantization/qoq.py,sha256=adhsCixRUTh1m8sfpRWNhh5oX3I1WJli3Elg8uexP6A,8222
373
379
  sglang/srt/layers/quantization/quant_utils.py,sha256=kBibCBK9DCambuPy2atB82Bmalb-Vs_wbQoVHT7h2Lw,5089
374
380
  sglang/srt/layers/quantization/utils.py,sha256=qHdWbLQD8teKhv2tOcuyGegpFonXygoJHwCAD7Ur5MA,5439
381
+ sglang/srt/layers/quantization/w4afp8.py,sha256=Rf8wMqtGUgLF8soOM16owfFI0AR1q1Ylzr5YpcdqyxU,9538
375
382
  sglang/srt/layers/quantization/w8a8_fp8.py,sha256=ZB6ydquyPOORDe9OCoEBRH6dsQhCeRWv1YIgm8UDQwQ,11622
376
- sglang/srt/layers/quantization/w8a8_int8.py,sha256=aPMm-sk5nBpHwHzkedvuAWXiqWpp_NPyVaPHxHnuhVg,10847
383
+ sglang/srt/layers/quantization/w8a8_int8.py,sha256=jXQiodlIShMWbivWPlnLFkg9W41eC-_5bWTzd5AMecA,37189
377
384
  sglang/srt/layers/quantization/compressed_tensors/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
378
385
  sglang/srt/layers/quantization/compressed_tensors/compressed_tensors.py,sha256=EaOKuIA0zXwqmH_eVhWeNdGJT9d1d9gVvFyYkgpdjDg,25665
379
386
  sglang/srt/layers/quantization/compressed_tensors/compressed_tensors_moe.py,sha256=w19mhCnOre3j6L2-Tc_sRtBPgwBOAKV4QmYLpzyU_Fk,26637
@@ -548,24 +555,24 @@ sglang/srt/lora/backend/base_backend.py,sha256=EIz8I-GIrdmK4fISw3ENhbJVVITaxKfyL
548
555
  sglang/srt/lora/backend/flashinfer_backend.py,sha256=el6IAB4kTgDTbwCggmqFuukliyoapN5X6FLksG-4wJ8,4151
549
556
  sglang/srt/lora/backend/triton_backend.py,sha256=uqwBGlguXX8EkCKjSPqac6SPTgcKA31u3u6HkKPQcos,2530
550
557
  sglang/srt/lora/triton_ops/__init__.py,sha256=JGOYPIn1XbGcyJTbt8A0qoc02PYONSGNNjGkC8yJpAM,283
551
- sglang/srt/lora/triton_ops/gate_up_lora_b.py,sha256=vOUDzC_Sq7UGnDbdF8F7ChKG12hDIOFwwMb7e62Lz9w,5280
552
- sglang/srt/lora/triton_ops/qkv_lora_b.py,sha256=qCpJAksCSXS3Znm-ABx1QfrdNqj9hrP61oaeW-n2RhU,5945
553
- sglang/srt/lora/triton_ops/sgemm_lora_a.py,sha256=yNBgl8jS76DPlGJg8puRkSnKkewf2_2oKfVZZRq4lYY,4351
554
- sglang/srt/lora/triton_ops/sgemm_lora_b.py,sha256=EoF9HymgQ1V9DwyOJOvbw1hCbEjprVOne_fC4VHgj-s,4518
555
- sglang/srt/managers/cache_controller.py,sha256=K00t5dSZU6gbAMHZWhNyj0ndgHISvelTl7UMI5KqBuE,19352
558
+ sglang/srt/lora/triton_ops/gate_up_lora_b.py,sha256=QURCYxHNR8Ls4SQtt3dvdgjvdDVhywI9tOzsK8SV9m8,5779
559
+ sglang/srt/lora/triton_ops/qkv_lora_b.py,sha256=iz5scFNo2YFTeiM8beWg9Z1oZI-6AM_T1wBMCQ6qp2Q,6485
560
+ sglang/srt/lora/triton_ops/sgemm_lora_a.py,sha256=Ksova04wgeGsFqGOXWqJtMYaHgyUYcx8VU42BZQOkVA,5129
561
+ sglang/srt/lora/triton_ops/sgemm_lora_b.py,sha256=VqCAFvUtq_l-0RGIkx3W_fzD55QcW2FAcqpvSHOBFp4,5115
562
+ sglang/srt/managers/cache_controller.py,sha256=HPQGLwjey6GeW60Vu6MVeLYtRsJrh99_-dqHYSzlBkE,13614
556
563
  sglang/srt/managers/configure_logging.py,sha256=8sNXZ2z9pBWOwn-X3wyz013Ob8Nbm1zDxRkxoZjH-l4,1633
557
564
  sglang/srt/managers/data_parallel_controller.py,sha256=PZ-wOcAFn3PQqMB6I2vjIsFmplf0nlNl5hqTDKTHTG8,12112
558
565
  sglang/srt/managers/detokenizer_manager.py,sha256=SpLxTsSPKBZfD-ZMhJ5zpPPGuUb8PmcYgFSL9CsurU4,10696
559
- sglang/srt/managers/io_struct.py,sha256=DQ2zg8InwXHgOa06n47rbwTzR5mYkj4OGQe5rZ0T77k,35137
560
- sglang/srt/managers/mm_utils.py,sha256=px_pMotzBLhuqw-mLXXzf8N1DthhDn9ILsIVIzW9y74,26582
566
+ sglang/srt/managers/io_struct.py,sha256=DaRJxXiIAhp0Dz4FxScZkoflf4CSc6SdO9YP1hbPY2c,36582
567
+ sglang/srt/managers/mm_utils.py,sha256=Pk6yWX7YThmulSjx7EWYuIKXm8Gvh0WdvPDsBHNApog,25500
561
568
  sglang/srt/managers/multimodal_processor.py,sha256=mzCrN-8H0bE0iMO8UzxmYmhE2M1qsbVJXGdhAYcjjYA,2016
562
- sglang/srt/managers/schedule_batch.py,sha256=3NF590tt4TJ99svwdrlsrFiICH_8X2DpSOj1ebEUSC8,73119
569
+ sglang/srt/managers/schedule_batch.py,sha256=T36ZokjgjzzV4VYKdxphY20O05j7DO7lrciknsW9-N0,73519
563
570
  sglang/srt/managers/schedule_policy.py,sha256=0T8URzQmLvEmG-42-SFBBl9WnsOSwYO8-_CcBpuD38M,20474
564
- sglang/srt/managers/scheduler.py,sha256=ZC49CVTsVlDh77QCq5UPhy04NM9FV5YHXuMg4M0cwEE,112191
571
+ sglang/srt/managers/scheduler.py,sha256=uaz-x3VrM77yeauYgVHYdu72iYK9Ct-qGY67j84ss5o,113502
565
572
  sglang/srt/managers/scheduler_output_processor_mixin.py,sha256=XAK2aeLleZBaLtzebEKdpaz9E7uKnHV7ywHSk_WPDYo,30148
566
573
  sglang/srt/managers/session_controller.py,sha256=dzlMNZlo20FTSl64QqK7y7pElsdCy8ICOWWBPTBVwgs,6040
567
574
  sglang/srt/managers/template_manager.py,sha256=RrwRA2oqId_PMQ98qJQGwIxMroOxiorl2sGC9ARou_0,8543
568
- sglang/srt/managers/tokenizer_manager.py,sha256=I2M8Hpj9T120rJYP5Hdu6cV72oPmsoRr829LiT7O4Dk,73655
575
+ sglang/srt/managers/tokenizer_manager.py,sha256=MK7k23sOWnuq4_slZt2a_yvr3xVG-66ZKIy5-eBwlMI,74364
569
576
  sglang/srt/managers/tp_worker.py,sha256=kyk2EVd3eP0gpgVETJ6J_BdxIDbiB76AfpN4_-Xqkrs,10896
570
577
  sglang/srt/managers/tp_worker_overlap_thread.py,sha256=EFbtichmZjMoBgRa0AMIGdKGur1i8bpd3JvaDi-SsK8,10663
571
578
  sglang/srt/managers/utils.py,sha256=9_VGE48EK0PXVJ26aYvbRJ6n7gIZALvCcf6uZCccCgM,1369
@@ -574,18 +581,18 @@ sglang/srt/mem_cache/allocator.py,sha256=MJUPQt4ECj4ReGeUVGVUNfwrwjHBbf3youdkyp3
574
581
  sglang/srt/mem_cache/base_prefix_cache.py,sha256=XHSzXKgBin-m1HsL47K-GobhLnajaGxqLqGtrLsWaZ0,2540
575
582
  sglang/srt/mem_cache/chunk_cache.py,sha256=MWo4DwRkHKOLKyow53YrGQdvn2dI7hVJuf2Gf-SPAr0,3110
576
583
  sglang/srt/mem_cache/flush_cache.py,sha256=GYcxmNXh4hsMpFfNOuCTpKilW7guZwTtAg_usVeM3J0,979
577
- sglang/srt/mem_cache/hiradix_cache.py,sha256=Z_XgbLBxI8SN7kgsi1R6iX6AfgDUF5-ynVnBVRF7KUw,17061
578
- sglang/srt/mem_cache/memory_pool.py,sha256=soOE9l5qZlWHFbqIHwSEW4l7NQXzmEjpJKk1rfehQZc,37055
579
- sglang/srt/mem_cache/memory_pool_host.py,sha256=9N34Y7P0aM2xkmhsEw2_W8xN897h-HEwzRPIu1REwac,13186
584
+ sglang/srt/mem_cache/hiradix_cache.py,sha256=0jZEWFP4k5LkKMiCc-G0G9GD7oPoP9zNWaAFPMeVFSw,17137
585
+ sglang/srt/mem_cache/memory_pool.py,sha256=EclwV8sNObkpw6lmIYwIFqq7jdTsbHS91H0Rt_IjPUo,40304
586
+ sglang/srt/mem_cache/memory_pool_host.py,sha256=G_vmKQFw6jvPnaxjltRLXueDUjlqYgIdxRqoM1kTj5Q,8863
580
587
  sglang/srt/mem_cache/multimodal_cache.py,sha256=wZl2KeEl3xeoEsYdH33UoM-FO8kqfLo_XUgereJVvoM,1348
581
- sglang/srt/mem_cache/radix_cache.py,sha256=ojr9_bUwnPocmpbGZXz8JKac4dS-PrfNYk8UqF4Gvi8,17936
588
+ sglang/srt/mem_cache/radix_cache.py,sha256=qZSsdlTVCZ3UCqkwe3IDYE07-QE72hYExIb2kbhyMmQ,18096
582
589
  sglang/srt/metrics/collector.py,sha256=C9QEJDOEdOPBwy2IJwFS3R6VbGzVzGs2xakKCCPvQDk,19903
583
590
  sglang/srt/metrics/func_timer.py,sha256=VFyNRrbnKVCwnQsrlLin1lITJfjQpf9m8sGPqL5LIsQ,3438
584
591
  sglang/srt/model_executor/cuda_graph_runner.py,sha256=3pc1_TpGmUAI51SxVubGGZIRuBmZrj8kOuch970RN2A,30505
585
- sglang/srt/model_executor/forward_batch_info.py,sha256=uzWEXYdVJie1xLikH6pmOnT64BDnZvJvfK7gCHH82x4,29572
592
+ sglang/srt/model_executor/forward_batch_info.py,sha256=w2U4at0aQGdj7niBf2__aYG_2qAR2yDFfzm3nl1s7qo,29901
586
593
  sglang/srt/model_executor/model_runner.py,sha256=kfFWWHMXJ6X9WEQgEj618mx8zIc9qvhXC5-K2ICDPJM,65709
587
594
  sglang/srt/model_loader/__init__.py,sha256=zGZkOBz1zx-pkaIy47BasL3fjDlAcxAXUTjInOhXHAE,919
588
- sglang/srt/model_loader/loader.py,sha256=oHIX6qiGfXDQWzP6NuPQfc_haFsWykbcVTKEGUwC_t0,59164
595
+ sglang/srt/model_loader/loader.py,sha256=xHeIiwhp26fOCkaegfWk_Gp6_E8eSAWvblY8xQKwGQ0,59562
589
596
  sglang/srt/model_loader/utils.py,sha256=zSZBPA9ErPmkf-HfCxJjhmiFwYueB15KUg7NFspLvPY,4454
590
597
  sglang/srt/model_loader/weight_utils.py,sha256=dfepjK1lhcFoxX6Vflb3imiHaj9_Tep_uZ7j3lfN9jE,38004
591
598
  sglang/srt/models/baichuan.py,sha256=HbvlErnkCSK4pRQYCSDxMcrn-1DQyfiNoeDcnRrJas8,15807
@@ -595,19 +602,19 @@ sglang/srt/models/clip.py,sha256=mkdSNhc2SgRHyeq9tCLEjUGdnA8yS2EMMbMKSpn5dMs,198
595
602
  sglang/srt/models/commandr.py,sha256=5Y_b3K0QY7D37nFGkyiGgY38RleRui_GJUYcHSuHUZo,15315
596
603
  sglang/srt/models/dbrx.py,sha256=4pn_fdoATg01VEqNnIAxNEsKV5XU7gwHyd289eydq1s,15598
597
604
  sglang/srt/models/deepseek.py,sha256=ZnN02HdgXCB23Vno5V9UMUoOxH5HC82vNTwsVulUJ-o,17206
598
- sglang/srt/models/deepseek_janus_pro.py,sha256=OeeI7vZbE4HGpxa8CwT6-Lbfs7J7WMQ3oBNpVJQpv3w,70450
605
+ sglang/srt/models/deepseek_janus_pro.py,sha256=nOUBFIpZpnQixcH6q18NPx7k2RSNdJOtEW1L6mnsCok,70423
599
606
  sglang/srt/models/deepseek_nextn.py,sha256=47fehxRdiOizr0rdLg5f1fzQEx6gGAOcDcWKtblloyk,5928
600
- sglang/srt/models/deepseek_v2.py,sha256=L0ewZPnxM6xCCB8tJxswwNKAjE-q_SCloJfZx8Y8LoU,100660
601
- sglang/srt/models/deepseek_vl2.py,sha256=F-nf2qRiiZNg9js__rYFEc9fNs_HVEfAi_Mh1jvqwkQ,13095
607
+ sglang/srt/models/deepseek_v2.py,sha256=KnGeJj_WEIntcQm67GK2NgYxyDNEurs3lTIOzDSsadQ,102964
608
+ sglang/srt/models/deepseek_vl2.py,sha256=5xyOXHKTk9GrnpfJhQCSExfzdtztyt4A0BuFsjr2dW4,13068
602
609
  sglang/srt/models/exaone.py,sha256=TpO-rtCpEZ8Ua7hGFnS8l2oAYhY0Pij50grc9WQ2mvc,13576
603
610
  sglang/srt/models/gemma.py,sha256=4cdrPISg1VKnsuI-QPTpYvet4BrX8BMKvCIN82iLskw,12641
604
611
  sglang/srt/models/gemma2.py,sha256=kqtwdo93GWKm2iBN29RoIRH2ggRm-K_80LM5btgfBLo,16395
605
612
  sglang/srt/models/gemma2_reward.py,sha256=V8U3_ADUHWPdOwvEe1jhGW-oJmBgL8t1TY3-67Ksv2A,2618
606
613
  sglang/srt/models/gemma3_causal.py,sha256=CJ2g08Ec7IeoObQIiGH0WIEtYOl05SbJ2g_pfJwSyBs,25130
607
- sglang/srt/models/gemma3_mm.py,sha256=b9YmkipsfVb5IXVeIVwW_PviXiCkRULhEsqNOvPoDxU,17221
614
+ sglang/srt/models/gemma3_mm.py,sha256=oJnfckeiMWyTy-pwq5sPhmrIEatO23T7xUbYefSySq8,17194
608
615
  sglang/srt/models/gemma3n_audio.py,sha256=isgKfjA5UieYawxU6medL2ssXlzYPqAbagDBnLcemC0,36405
609
616
  sglang/srt/models/gemma3n_causal.py,sha256=kBDlpSWAg6ZDmUPe08Q7sj5CbdVD_0h07zwJw8sKu7I,36335
610
- sglang/srt/models/gemma3n_mm.py,sha256=nCCnVbGvkYit6UXljZWRAQagGeSe0Ej9YnH0DbEaN8Q,18689
617
+ sglang/srt/models/gemma3n_mm.py,sha256=REq6a63hXpEuxJ59yJDtPIXZkvd-1YcAtirnauptwsw,18735
611
618
  sglang/srt/models/glm4.py,sha256=2VQzUqFkQTy_2nfkxP9SF6_9kKLTZUExGRjge7r99Es,11265
612
619
  sglang/srt/models/gpt2.py,sha256=kclhxEs8oJk1KCyhmAqo7rZqecVGGHYkc-a1WZi3aIk,9841
613
620
  sglang/srt/models/gpt_bigcode.py,sha256=1D6bi8Zu760gCRZkvdLHFcg8kCkY35ARwQYaMDtYhl4,10307
@@ -617,44 +624,45 @@ sglang/srt/models/hunyuan.py,sha256=YRx9Zafs8HVTNHxlMMKdbV3ELMn6rWi9GKlk94U_R7E,
617
624
  sglang/srt/models/idefics2.py,sha256=U3khd3hbdawJeRNXsxmaKHdssOCT5TPOZ1D-2_zHoQo,12079
618
625
  sglang/srt/models/internlm2.py,sha256=F_iNY1gUqzAjAuUatcE47gnrcoTh5_08PY2Rw9tKr9M,13150
619
626
  sglang/srt/models/internlm2_reward.py,sha256=ndfGmyqYZbVZ7C7rJ-v9oK3wa-EpoBGybS8MlyKZi2E,2522
620
- sglang/srt/models/internvl.py,sha256=fZ18eKFYvvtYqoBRXKmS7KlgHMewJSAykADnrf0N3nk,23267
621
- sglang/srt/models/kimi_vl.py,sha256=oFmkPGaCW3QcrExie5o0fqnvk73w6K8zVbaRXw0kV3k,12811
627
+ sglang/srt/models/internvl.py,sha256=ZM5I_Dp0jaG29WfZD_S0tKZUStQm1C2C8_0WGRA0T7w,23338
628
+ sglang/srt/models/kimi_vl.py,sha256=d1qOBRWmxKr-hywvF9Xl4UvW8lDDHS7zeGyZgjEZWEw,12882
622
629
  sglang/srt/models/kimi_vl_moonvit.py,sha256=M5L7AJOJ2Zh2pqLZAq8aRqhbTSlipr8XOoD3ix6o2sU,23908
623
- sglang/srt/models/llama.py,sha256=xUVXptse-TTTPaZGLPYf8OoL2giczzl9FGiNRjy1CWA,27505
630
+ sglang/srt/models/llama.py,sha256=Ok2Ombk80KQ8G17V2h2pz3XH_LBtO3TCW2aAAdN4k9E,27578
624
631
  sglang/srt/models/llama4.py,sha256=nF19fG2ZdT1bUX3pncckwJ9dRMSazNZx647EW__rBRo,18746
625
632
  sglang/srt/models/llama_classification.py,sha256=4QWTFaUZIFKYZvEzs8bx8VkOZNIwdYCLrnwrdAw4QK0,3108
626
633
  sglang/srt/models/llama_eagle.py,sha256=Ubh_jmtfiOnriwvHgQT0ZGID7JvYvdSi_QGHOIkEgPE,5028
627
634
  sglang/srt/models/llama_eagle3.py,sha256=715soylDE3kOMWskbPy_70BFxaSc5ptaHCS1v3-ViA0,8579
628
635
  sglang/srt/models/llama_embedding.py,sha256=zq-_lNu35VBFc7eemiam0zdkGIE8fzrgk5OWYfirZnA,3254
629
636
  sglang/srt/models/llama_reward.py,sha256=LF2nqMV5XOrljGjAwJg43mBv3z6Q040I2EYlgZeCp8k,4681
630
- sglang/srt/models/llava.py,sha256=r0nHLVRI7AcFEhruqdRXTLWeQ-Cx3uty9wIkHh3TxZs,37507
631
- sglang/srt/models/llavavid.py,sha256=q0lHlRnoYHKJZsWnkIQdd6dYAQ26t7XsmrqA0zDGmZc,12829
637
+ sglang/srt/models/llava.py,sha256=yx867BoTyWd_UPcVDbPhhDpHE243KfAtDHyUi5uAsec,37551
638
+ sglang/srt/models/llavavid.py,sha256=nBGPuzN9okPk8Zy2cIjMRmx7VPJWfkB3DGKeo09Y8XU,12823
632
639
  sglang/srt/models/mimo.py,sha256=Mp-iFp4YHuiuq-H8enUF5K5QbMnVcvEa6mURH6vM3yM,6140
633
640
  sglang/srt/models/mimo_mtp.py,sha256=jSmqJAXu7G3OO7jW1oa2suI4H_Yl7u5ZT7w4lHFbHhg,7292
634
641
  sglang/srt/models/minicpm.py,sha256=m5HFsSJj0Po09LY9R6qj6K4gceqWDMOePz3NDGgMGT4,14691
635
642
  sglang/srt/models/minicpm3.py,sha256=6-gfHSfXwyB5zw7AIj-c5TzjpEKR6CM0H67MrD8LVUE,19347
636
- sglang/srt/models/minicpmo.py,sha256=CwcogzxwTRAInBynhP3z_YAFVq4DC_YN3gG_95C6MQ8,76034
637
- sglang/srt/models/minicpmv.py,sha256=7YYWwk4LX0Z7lZegnsldctb-a9zGGgJUdjFeGo-oLv4,30426
643
+ sglang/srt/models/minicpmo.py,sha256=HbtJ-Ds5nqzZqNdicotL5OnRnyS34U4CwfjHbQHc2j0,75945
644
+ sglang/srt/models/minicpmv.py,sha256=W_ZlgT3BxB4PyTLhBdDyV_JAhTJgDQmDk8mxWI6c_mw,30399
638
645
  sglang/srt/models/mistral.py,sha256=Ox07RJpTYl-4Pb25UIghL_66o9TTA6lPmsUyent_Flc,3480
639
646
  sglang/srt/models/mixtral.py,sha256=n-Pz7fyWE4m6Uh7sjzAYKNr5Wy4QUj5Yekl0qiCwQI8,17055
640
- sglang/srt/models/mixtral_quant.py,sha256=-kQw9r8KcLdO8SNN9RKXzrGq9Q2Al9l9cWHi1VrZSRM,15260
647
+ sglang/srt/models/mixtral_quant.py,sha256=UUIq7lpUonD9IoGePyl59oJYEcVwT9wUXvtVp5tjQ9Y,15406
641
648
  sglang/srt/models/mllama.py,sha256=pkS0UWiqKJHRsFtSZzpSI9O6B5_j1OtI5pf_nyDPp3U,39707
642
- sglang/srt/models/mllama4.py,sha256=4E7qGicVuTKAs3vHF2SnoNlQP1mm2eBrsLU7QK3x9ow,10519
649
+ sglang/srt/models/mllama4.py,sha256=Zq9WIOmtdtRy68LwsRXJ0NgaIAqAyBBsUdTZoCsptSY,20216
643
650
  sglang/srt/models/olmo.py,sha256=7-q_fA6XXdG7kPUjpUzYkzMUWJobuSjhqjYw9xSUs_c,12671
644
651
  sglang/srt/models/olmo2.py,sha256=azmljhJF4ivcQfUtfsAUxq3ducE4tRKTL6iwe0IKYMg,14327
645
652
  sglang/srt/models/olmoe.py,sha256=TMzt-yB891bvA4X50xL0NjNnFYSx9imlA7N1EG8KNK0,15949
646
653
  sglang/srt/models/phi3_small.py,sha256=eJb8aS_3KLObrq3PNkoIyVHaQ6SZTAJe42rbpC54QKg,16012
647
- sglang/srt/models/phi4mm.py,sha256=rBGRtTLGBJZGYXhvotBjJbAUpbLxsCZahDtrInP_FGM,19064
654
+ sglang/srt/models/phi4mm.py,sha256=es6sQM6JOpfL1uR6DerK427Q4Hj7aE0RkIwhux3NZlU,19135
655
+ sglang/srt/models/phimoe.py,sha256=R3uA1e9XbH2e4XP_GiH8mb7_288BC94w2XQcoQrjyfM,19026
648
656
  sglang/srt/models/pixtral.py,sha256=ZkZrV0mEfmbBdgRko2AvsMFZbAVskgp_5a5p1xCSRN0,16835
649
657
  sglang/srt/models/qwen.py,sha256=xYkVmMZS2uMqWhfndc8EYm0olpKFnggfuMp_6aobVi4,10758
650
- sglang/srt/models/qwen2.py,sha256=uF71yk7ZbW4ENbfdq7Sf4dWwZjLT2JNLyzkcFtmLEoU,20983
651
- sglang/srt/models/qwen2_5_vl.py,sha256=SuJe8YfRQkJJo_bBSgRodY2-hUl_evYdNuAal16jrxs,22563
658
+ sglang/srt/models/qwen2.py,sha256=2G-aT1izwYsi60NObMXjbsJjyYy_Blo1kjkgI65bYZo,21056
659
+ sglang/srt/models/qwen2_5_vl.py,sha256=RxRDLV7F6J-q-QKKhvkafa8C0jc_PWohW9N25Rq46Mg,22737
652
660
  sglang/srt/models/qwen2_audio.py,sha256=linjXOVGhjyKk5DUx9Uw-BJa1N-YcqCFUpsj0Zr_98A,7877
653
661
  sglang/srt/models/qwen2_classification.py,sha256=dGrMm4ebd30_lBhHOhaV57ig2iOTx3nqB4GEzsrRIM8,2747
654
662
  sglang/srt/models/qwen2_eagle.py,sha256=6spFg6JYQGeUXLv2Q5eMkVzZvnqGyvW6SdVBtFMxlTM,4806
655
663
  sglang/srt/models/qwen2_moe.py,sha256=fmVDsb4ju0suMCZiDAhocPxO9gQecOWOxmdf-W1elvg,24239
656
664
  sglang/srt/models/qwen2_rm.py,sha256=-mQXDEv11p-I1HXgYLTtY6ROem6UYorO958WsDrzsgs,2837
657
- sglang/srt/models/qwen2_vl.py,sha256=Xo7f-ChWZJNJpM0RNe-GsYU4_VXPR62ZNMSXBVYr4QY,20842
665
+ sglang/srt/models/qwen2_vl.py,sha256=tm-k4vCWJa2lWppYrZxi_b6gCQm0HQKs-QTI13U0_tA,21383
658
666
  sglang/srt/models/qwen3.py,sha256=3alBwittpU5m44DnJZ5mjRM0x1UShepu2CREWotPYqA,17777
659
667
  sglang/srt/models/qwen3_moe.py,sha256=qP_UlowZPOOB9sALkRtaK3-gpXlsmgEJMaJ17bycpJ0,32867
660
668
  sglang/srt/models/registry.py,sha256=bH9H0OiNV0Cn7FRBM30Oh6dxICTs9mJscdLtHYPJvxc,3783
@@ -663,27 +671,27 @@ sglang/srt/models/siglip.py,sha256=DIVJRwdtpLD2QT1kVPIHw7Bn9BE40xJbkHujDNzkjgA,9
663
671
  sglang/srt/models/stablelm.py,sha256=0x_31uIr3WcWwecdPAI3ek9KkyKBJS7VwknTk2y0gjY,12281
664
672
  sglang/srt/models/torch_native_llama.py,sha256=oTxxof5Wx2b2egIwWx56LeHjtPGQleQ2zM5jXHMiuOU,19293
665
673
  sglang/srt/models/transformers.py,sha256=_CL0npi-_HvqzxkLgFhv2EE3bfGvCLXPYAtPFywZOr0,10260
666
- sglang/srt/models/vila.py,sha256=Q8Z4q8DH3SAiaYocGys6AkEpw8zg3-l3pb5wLcyVves,9780
674
+ sglang/srt/models/vila.py,sha256=7HJjYw85riD5JvQdTA-UmhPJaoI4kfQIHP7HbbW_B6U,9851
667
675
  sglang/srt/models/xverse.py,sha256=DsNVI9JpzN4jj0Ry6aTrj7r-xq5YLOoDX2kH4YLJA-I,14035
668
676
  sglang/srt/models/xverse_moe.py,sha256=7KCM2-j12towDMNvXkuuYiBOmNauH6NG4Ip40x0khqA,16782
669
677
  sglang/srt/models/yivl.py,sha256=oToK7-u5IGO7xwpJIQ7VtudlK6-zPqJX4bt6_wv0SH8,4850
670
- sglang/srt/multimodal/mm_utils.py,sha256=7o4w1W0VAWgEquVIz7qw7-IxYbZY2g3MrXw9php90oY,12621
671
- sglang/srt/multimodal/processors/base_processor.py,sha256=05moS0iDYUfI9CKzio5ip8cjsfUjqYi_S5fzArWJxw8,21539
678
+ sglang/srt/multimodal/mm_utils.py,sha256=6bV1_a7Iet9W0y3qdd0E-hFM78zalIzNZCYbLzJX2y8,12640
679
+ sglang/srt/multimodal/processors/base_processor.py,sha256=H3IospK9baMOtirUPnYFTA_FX3N7Uq4RlY2HGVSVHf0,24269
672
680
  sglang/srt/multimodal/processors/clip.py,sha256=chKReTXD4ETUQ0s7BOk_AmWHEZXR5no6fprrnHwSNIM,1271
673
- sglang/srt/multimodal/processors/deepseek_vl_v2.py,sha256=VHrUbOTF_18fPYaEx_awS1UMhOy0nhTXoA17wakwyQ4,3281
674
- sglang/srt/multimodal/processors/gemma3.py,sha256=11tIvfpUAc9E_dkZZ-5kupUCn2TJ9e-yBriCpF38Ino,2084
675
- sglang/srt/multimodal/processors/gemma3n.py,sha256=FzwkaEhk4ATn4nV9zkGdBgcHTTTVK5CbnTx_vBr0QxI,3116
676
- sglang/srt/multimodal/processors/internvl.py,sha256=ffLizY9v3jYIm026UZg6MHBNadyUWYgag8HbL3hFtis,9334
677
- sglang/srt/multimodal/processors/janus_pro.py,sha256=TOxSQH8gVirAYZvcQ_3Gd2uvNMzzWwubF4ROKDWUO9g,1913
678
- sglang/srt/multimodal/processors/kimi_vl.py,sha256=2KMB6iEXizHXzE6yjtzS7V1RFhsA2hhuxk3Bx0ySMDM,1653
681
+ sglang/srt/multimodal/processors/deepseek_vl_v2.py,sha256=OlkkeqMyaqfmxKDSIg-0Y3JKAKjzBDJfTx6p_UytleM,3275
682
+ sglang/srt/multimodal/processors/gemma3.py,sha256=Icn4wLs1JKiNXnZx7VFYDO88nk79Ht01GmsxSKfcv5A,2181
683
+ sglang/srt/multimodal/processors/gemma3n.py,sha256=sacfdl3sU6bgbD6fXFoLzrG5Ti5tzWewjaUh2wb4dlU,3119
684
+ sglang/srt/multimodal/processors/internvl.py,sha256=wy0fj4y9y7lUZo2hAACOb57eo5nmhJvSd1s2d-CpkNI,9328
685
+ sglang/srt/multimodal/processors/janus_pro.py,sha256=e5VBoL-adxdKFkkXgC9X70ESZXIhtBhUEq1i0pqrn90,1907
686
+ sglang/srt/multimodal/processors/kimi_vl.py,sha256=qLYonS4YwTB1yIz5D-dfZPJprtDzILueCAyMW6a7xLY,1656
679
687
  sglang/srt/multimodal/processors/llava.py,sha256=tIjeDPYxvMWUMXXLcfzzuaLPvdBtPrRzM25QzP0cnaE,7962
680
- sglang/srt/multimodal/processors/minicpm.py,sha256=9Y8KCo5eCX274CJIx1D8BVWgferjc0Uf6Zd_HR_IMnY,5316
688
+ sglang/srt/multimodal/processors/minicpm.py,sha256=_bejh4YQBuYy39IKzOgkQ0XRgmYqt9FhqXn5Z3d4wV8,5398
681
689
  sglang/srt/multimodal/processors/mlama.py,sha256=bW0hVPtRMqYz1RR2I19QtZLUTTPzInZv_6ZhVPJBieo,1406
682
- sglang/srt/multimodal/processors/mllama4.py,sha256=V2Y3G-bv2wdqkgE_XGPLMJp_nSEEr-MD8_S4h8QTDDk,5752
683
- sglang/srt/multimodal/processors/phi4mm.py,sha256=ZYH1fWTpbz6wLGyV6c51kd54vwPRm0qdZiQcc0GlXGI,2337
684
- sglang/srt/multimodal/processors/pixtral.py,sha256=VsCIFJpIUM3pSGNe_uRd8NlH7zSokW4xHOrZSi70R1o,4055
685
- sglang/srt/multimodal/processors/qwen_vl.py,sha256=lKVWvvtB4OWfyJ9YZLuJapiW93cGb4T3SoqSAsPc1S4,6874
686
- sglang/srt/multimodal/processors/vila.py,sha256=cfBY1Lmlndb-aNLpOyAffi7QPCI6rIYCdAnuxfaNcnA,2176
690
+ sglang/srt/multimodal/processors/mllama4.py,sha256=nAayC-mTpvooaqBC5pltaUMTXDgIpKFA8BzOXhptDZo,5597
691
+ sglang/srt/multimodal/processors/phi4mm.py,sha256=iT-fBClMecI52yQTpfjxowvpRnBo9FBjJ83ieCFVROc,2331
692
+ sglang/srt/multimodal/processors/pixtral.py,sha256=B8b30tiBClsALtgcqWDAgIGxd3uwr_8VqQx8xTvrsy8,4049
693
+ sglang/srt/multimodal/processors/qwen_vl.py,sha256=hniJbL7tt7DkMvjMHnxFH4PPdkXpwHRcanXgrlyGb-Q,10731
694
+ sglang/srt/multimodal/processors/vila.py,sha256=SL-O3WdBVIZcSO7NGnCRr_22KntPr6Qc-4jJbgvzN4M,2179
687
695
  sglang/srt/sampling/custom_logit_processor.py,sha256=AwODYVJdRkcQ8PGtJrhzKsqAgn8XZLQbAmR9fGiQzmc,1608
688
696
  sglang/srt/sampling/sampling_batch_info.py,sha256=m8m-mXu3N8hLYFhAkRopePDT5Ozkd4KAmWDgM_9_4iA,14536
689
697
  sglang/srt/sampling/sampling_params.py,sha256=L2cU3MhAo9OvfdEtTdJidp9nTOkD6tiwlegxQ5vgIfU,6127
@@ -716,6 +724,7 @@ sglang/test/test_block_fp8_deep_gemm_blackwell.py,sha256=Hnhq4kkyINHb4ONedkp5Kf7
716
724
  sglang/test/test_block_fp8_ep.py,sha256=Ufq6p32sb1RSbFKaSnsVF8RrqqwwAACBUgOJTEH2Lbc,10856
717
725
  sglang/test/test_custom_ops.py,sha256=2bSo9P5_rJZYFq8Y8IKRimDfFyZZGJluhL7Ngny0Pf4,5571
718
726
  sglang/test/test_cutlass_moe.py,sha256=beXdvpwpHh0O8fpLW-RV3Bx8Wu0lRFG_SNkL3Op5ITA,9905
727
+ sglang/test/test_cutlass_w4a8_moe.py,sha256=LmeSS7BrKO6-1mnksOqmo0nvJ_y3oeeiT5ytRkHk2A0,8780
719
728
  sglang/test/test_deepep_utils.py,sha256=749ysTBGNzh6rYUCJhhZBtZpeD15eWTeNHYCytcvZtc,7448
720
729
  sglang/test/test_dynamic_grad_mode.py,sha256=L76yUCuk_ymNpXD2CmO8r2GiGjIvD_gtTsuFDs2NolI,1638
721
730
  sglang/test/test_fp4_moe.py,sha256=U4LHzpGl6pCiCZiENRPxVP6hxqkqRZ_0WXbB29vYeAo,8187
@@ -726,8 +735,8 @@ sglang/test/attention/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3h
726
735
  sglang/test/attention/test_flashattn_backend.py,sha256=_rTG849FwQdVTyGKkqhczaOqngBmRWXFmkl5NnuK1GM,13914
727
736
  sglang/test/attention/test_flashattn_mla_backend.py,sha256=g4O50WblTpM7_Gq2b76k0i25_z01BOUBQ4i6PmyxpO4,10774
728
737
  sglang/test/attention/test_prefix_chunk_info.py,sha256=hpoDe2wfSa6RlUbfyri_c0iyBTb35UXGL9I2Xh6jamM,7772
729
- sglang-0.4.9.dist-info/licenses/LICENSE,sha256=FJXh51fvTQklojUFY89XVLsjxRcBqOxPs8XNy-2uZ0c,11346
730
- sglang-0.4.9.dist-info/METADATA,sha256=tH3lSIOqvezltkU9P2f6oqUauU_5S8qnLr3jYUIRiV0,27125
731
- sglang-0.4.9.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
732
- sglang-0.4.9.dist-info/top_level.txt,sha256=yxhh3pYQkcnA7v3Bg889C2jZhvtJdEincysO7PEB09M,7
733
- sglang-0.4.9.dist-info/RECORD,,
738
+ sglang-0.4.9.post2.dist-info/licenses/LICENSE,sha256=FJXh51fvTQklojUFY89XVLsjxRcBqOxPs8XNy-2uZ0c,11346
739
+ sglang-0.4.9.post2.dist-info/METADATA,sha256=_Z1MAQxdNmJPXSJy0-sGf6MKxRciuhUY4BWxIDVqqCM,27276
740
+ sglang-0.4.9.post2.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
741
+ sglang-0.4.9.post2.dist-info/top_level.txt,sha256=yxhh3pYQkcnA7v3Bg889C2jZhvtJdEincysO7PEB09M,7
742
+ sglang-0.4.9.post2.dist-info/RECORD,,