sglang 0.5.1.post3__py3-none-any.whl → 0.5.2rc1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (93) hide show
  1. sglang/bench_one_batch.py +3 -0
  2. sglang/srt/configs/__init__.py +2 -0
  3. sglang/srt/configs/longcat_flash.py +104 -0
  4. sglang/srt/configs/model_config.py +14 -1
  5. sglang/srt/connector/__init__.py +1 -1
  6. sglang/srt/connector/base_connector.py +1 -2
  7. sglang/srt/connector/redis.py +2 -2
  8. sglang/srt/connector/serde/__init__.py +1 -1
  9. sglang/srt/connector/serde/safe_serde.py +4 -3
  10. sglang/srt/disaggregation/ascend/conn.py +75 -0
  11. sglang/srt/disaggregation/launch_lb.py +0 -13
  12. sglang/srt/disaggregation/mini_lb.py +33 -8
  13. sglang/srt/disaggregation/prefill.py +1 -1
  14. sglang/srt/distributed/parallel_state.py +27 -15
  15. sglang/srt/entrypoints/engine.py +19 -12
  16. sglang/srt/entrypoints/http_server.py +174 -34
  17. sglang/srt/entrypoints/openai/protocol.py +60 -0
  18. sglang/srt/eplb/eplb_manager.py +26 -2
  19. sglang/srt/eplb/expert_distribution.py +29 -2
  20. sglang/srt/hf_transformers_utils.py +10 -0
  21. sglang/srt/layers/activation.py +12 -0
  22. sglang/srt/layers/attention/ascend_backend.py +240 -109
  23. sglang/srt/layers/attention/hybrid_attn_backend.py +53 -21
  24. sglang/srt/layers/attention/trtllm_mla_backend.py +25 -10
  25. sglang/srt/layers/layernorm.py +28 -3
  26. sglang/srt/layers/linear.py +3 -2
  27. sglang/srt/layers/logits_processor.py +1 -1
  28. sglang/srt/layers/moe/cutlass_w4a8_moe.py +1 -9
  29. sglang/srt/layers/moe/ep_moe/kernels.py +74 -0
  30. sglang/srt/layers/moe/ep_moe/layer.py +14 -13
  31. sglang/srt/layers/moe/fused_moe_triton/__init__.py +5 -3
  32. sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=129,N=352,device_name=NVIDIA_B200,dtype=fp8_w8a8.json +146 -0
  33. sglang/srt/layers/moe/fused_moe_triton/fused_moe.py +5 -1048
  34. sglang/srt/layers/moe/fused_moe_triton/fused_moe_triton_config.py +212 -0
  35. sglang/srt/layers/moe/fused_moe_triton/fused_moe_triton_kernels.py +796 -0
  36. sglang/srt/layers/moe/fused_moe_triton/layer.py +5 -2
  37. sglang/srt/layers/moe/fused_moe_triton/moe_align_block_size.py +87 -0
  38. sglang/srt/layers/moe/topk.py +35 -12
  39. sglang/srt/layers/quantization/deep_gemm_wrapper/compile_utils.py +9 -1
  40. sglang/srt/layers/quantization/deep_gemm_wrapper/configurer.py +0 -3
  41. sglang/srt/layers/quantization/modelopt_quant.py +7 -0
  42. sglang/srt/layers/quantization/mxfp4.py +9 -4
  43. sglang/srt/layers/quantization/utils.py +13 -0
  44. sglang/srt/layers/quantization/w4afp8.py +30 -25
  45. sglang/srt/layers/quantization/w8a8_int8.py +7 -3
  46. sglang/srt/layers/rotary_embedding.py +28 -1
  47. sglang/srt/layers/sampler.py +29 -5
  48. sglang/srt/managers/cache_controller.py +62 -96
  49. sglang/srt/managers/detokenizer_manager.py +9 -2
  50. sglang/srt/managers/io_struct.py +27 -0
  51. sglang/srt/managers/mm_utils.py +5 -1
  52. sglang/srt/managers/multi_tokenizer_mixin.py +629 -0
  53. sglang/srt/managers/scheduler.py +39 -2
  54. sglang/srt/managers/scheduler_output_processor_mixin.py +20 -18
  55. sglang/srt/managers/scheduler_update_weights_mixin.py +8 -1
  56. sglang/srt/managers/tokenizer_manager.py +86 -39
  57. sglang/srt/mem_cache/chunk_cache.py +1 -1
  58. sglang/srt/mem_cache/hicache_storage.py +20 -3
  59. sglang/srt/mem_cache/hiradix_cache.py +94 -71
  60. sglang/srt/mem_cache/lora_radix_cache.py +1 -1
  61. sglang/srt/mem_cache/memory_pool.py +4 -0
  62. sglang/srt/mem_cache/memory_pool_host.py +4 -4
  63. sglang/srt/mem_cache/radix_cache.py +5 -4
  64. sglang/srt/mem_cache/radix_cache_cpp.py +1 -1
  65. sglang/srt/mem_cache/storage/hf3fs/mini_3fs_metadata_server.py +61 -34
  66. sglang/srt/mem_cache/storage/hf3fs/storage_hf3fs.py +56 -9
  67. sglang/srt/mem_cache/storage/mooncake_store/mooncake_store.py +2 -1
  68. sglang/srt/mem_cache/swa_radix_cache.py +1 -1
  69. sglang/srt/model_executor/model_runner.py +5 -4
  70. sglang/srt/model_loader/loader.py +15 -24
  71. sglang/srt/model_loader/utils.py +12 -0
  72. sglang/srt/models/deepseek_v2.py +31 -10
  73. sglang/srt/models/gpt_oss.py +5 -18
  74. sglang/srt/models/llama_eagle3.py +4 -0
  75. sglang/srt/models/longcat_flash.py +1026 -0
  76. sglang/srt/models/longcat_flash_nextn.py +699 -0
  77. sglang/srt/models/qwen2.py +26 -3
  78. sglang/srt/models/qwen2_5_vl.py +65 -41
  79. sglang/srt/models/qwen2_moe.py +22 -2
  80. sglang/srt/models/transformers.py +1 -1
  81. sglang/srt/multimodal/processors/base_processor.py +4 -2
  82. sglang/srt/sampling/penaltylib/orchestrator.py +14 -2
  83. sglang/srt/server_args.py +112 -55
  84. sglang/srt/speculative/eagle_worker.py +28 -8
  85. sglang/srt/utils.py +4 -0
  86. sglang/test/attention/test_trtllm_mla_backend.py +12 -3
  87. sglang/test/test_cutlass_w4a8_moe.py +24 -9
  88. sglang/version.py +1 -1
  89. {sglang-0.5.1.post3.dist-info → sglang-0.5.2rc1.dist-info}/METADATA +5 -5
  90. {sglang-0.5.1.post3.dist-info → sglang-0.5.2rc1.dist-info}/RECORD +93 -85
  91. {sglang-0.5.1.post3.dist-info → sglang-0.5.2rc1.dist-info}/WHEEL +0 -0
  92. {sglang-0.5.1.post3.dist-info → sglang-0.5.2rc1.dist-info}/licenses/LICENSE +0 -0
  93. {sglang-0.5.1.post3.dist-info → sglang-0.5.2rc1.dist-info}/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  sglang/__init__.py,sha256=CK60u1J439CJZaPihWqlDjFZ8doIC-5YgIYz-E1PIh4,1823
2
2
  sglang/bench_offline_throughput.py,sha256=Bge0KG4Uiv9CHsxDnqKdXJmG_TcxM4blz3CmvLmDRvM,14815
3
- sglang/bench_one_batch.py,sha256=8Aic1FibvTpRtxtZx0fK97v8n7MQYLzg9Hg4t64iorQ,23041
3
+ sglang/bench_one_batch.py,sha256=ITGCBFPksSyoXPEgAqZruGY2ZUPyOoc111jf1nil0go,23137
4
4
  sglang/bench_one_batch_server.py,sha256=d-XnTgyUzsEeOHyuc-DGZDeW4ZB4V59aV9Ojr3H43SE,14676
5
5
  sglang/bench_serving.py,sha256=TcT-yEO9bJW4VASIrfJaDZwKepBcerBUmVPeKbWoruI,78205
6
6
  sglang/check_env.py,sha256=qDMIG2rCNBH1yKnxQmF-Bp10oiFMUKMgfZLHZYOmdSY,8412
@@ -9,7 +9,7 @@ sglang/global_config.py,sha256=ZMTux_PsGnvkyJ0kTFwhTdbnFwIjjpGDogut_9Lu4Vo,1732
9
9
  sglang/launch_server.py,sha256=mDXfwha8LHpWQJekcCosR98QhCQsbmilsBlI5jAIgg0,420
10
10
  sglang/profiler.py,sha256=JCpZzlDhahoiPlPi5IG3n7GFrQHxfHEB6ELie3Ck55w,4397
11
11
  sglang/utils.py,sha256=dC2PNkKYTgDHsNrWdZJ74GvaXGSHCeIk_aZ-TA89OhY,16380
12
- sglang/version.py,sha256=_jbt9dYNR7pmoDsN781ZGkqYq_dZ7gNo3S1g-kmR8DM,28
12
+ sglang/version.py,sha256=Yk9OPhzYNwVtFzj5deHSdkGtcxF0FXLnKJ9OFFikW9M,25
13
13
  sglang/eval/llama3_eval.py,sha256=mLNRZJIqV4CfqrY8UGnJEcHw2Xsyr1eyYZgFSUFYr1g,9997
14
14
  sglang/eval/loogle_eval.py,sha256=-CC2s2kh5qUoDrHRkQVkC_jNvBgNojXbf456ny5s78s,4557
15
15
  sglang/lang/api.py,sha256=rcp3GeoyZhmJ0GDLPRkuZNcxd0TBJy_wfUDpcmQoqW8,7210
@@ -33,7 +33,7 @@ sglang/srt/constants.py,sha256=0i-tEwG2BSYNDy96MxnGHV5HnBELkYcnsVGsE-R18o0,93
33
33
  sglang/srt/conversation.py,sha256=cmVT4SCqRYxprYvmftUC_z_TkhXCqYC9B2rVZsmQe30,38869
34
34
  sglang/srt/custom_op.py,sha256=7OPQAZe3PqDXk-xM0Wxl7pm9cazilNJfkNiYIWztWgI,3198
35
35
  sglang/srt/harmony_parser.py,sha256=YweG4azWm5jmzYGaAHEXSaORpgWctPpSGQk_jp5H-CE,23227
36
- sglang/srt/hf_transformers_utils.py,sha256=YXaapaY6N8ETS0vTQBwcFERG5eMt3nsdN6GYeiEK9wM,15201
36
+ sglang/srt/hf_transformers_utils.py,sha256=XifKc8JTPr_CkQtdLZ5-OvsNzapGgny_JJSIkYaiJYo,15674
37
37
  sglang/srt/host_shared_memory.py,sha256=00TgVm3PNCl4rTPJZChG5uu4I5hd_Xf587r39tibmIg,2274
38
38
  sglang/srt/jinja_template_utils.py,sha256=XCuqi6iHQrtziUvhy22ePdh8WcS42O9sKxuXpM_bMXc,7836
39
39
  sglang/srt/model_parallel.py,sha256=eLXZhvJ4wG6dh0FontNCIdVZvHYdWgaeY-5cu7TD9tE,6078
@@ -43,12 +43,12 @@ sglang/srt/operations_strategy.py,sha256=-w6GI2VgSGvORy3pUWRAJo6244ykSW1ZBV1Dx0f
43
43
  sglang/srt/patch_torch.py,sha256=OUPCGQSQz3MVZB1zZ_Eq8lXiw0uIKJ_HWjqQolI8FsM,3088
44
44
  sglang/srt/poll_based_barrier.py,sha256=9vjn32ROlSueEk7EuZjWKUrrL7XVR9KJsSVliGTYB_4,937
45
45
  sglang/srt/reasoning_parser.py,sha256=HEWAeFzPA_Jn3a44BYCz61QNV6kAvX46Y0tR8csAUg4,11152
46
- sglang/srt/server_args.py,sha256=ywi3C49ixZneuJ7EXjTu4E1EMn0M6-jlQfHfU77ksLQ,102532
46
+ sglang/srt/server_args.py,sha256=qEh8ykOglDMHh3GvyUhG0oOSJq_tH8vUYtDzSukoOtk,104043
47
47
  sglang/srt/torch_memory_saver_adapter.py,sha256=K_eTx0UU84MHSTXI3iqYLdHV4IWtJMJ2FKdGFJR8v1E,2417
48
48
  sglang/srt/two_batch_overlap.py,sha256=UykF5nC2rja3Hvmu0D9glqKdVRIEhQGPV84Jm7veopQ,34150
49
- sglang/srt/utils.py,sha256=hgJ3PsNL07eOe4uvIdq50_Aiq2WJo0783FSJJ_L9xwk,95170
49
+ sglang/srt/utils.py,sha256=3qKij1k6uj0Ch-gErdsfXJFUiCU941L0ePoqnIqxZvk,95252
50
50
  sglang/srt/warmup.py,sha256=zldxhMlXpclRAJXmfBjJNUJd1eDizVdysibBvQyTVuA,1782
51
- sglang/srt/configs/__init__.py,sha256=gas3cKYVgZp7qF4m8FejX4EUUmdQd_w5WDTm7fo7yM0,743
51
+ sglang/srt/configs/__init__.py,sha256=3GdmJ2DUiNq1zNs3yOILwZzL0J8fK-h8k2P5YVgxEI0,833
52
52
  sglang/srt/configs/chatglm.py,sha256=j-b0YkdYUmQm2y1kNmMJtKeACxWKmBbvNNkDWbs6kbI,2907
53
53
  sglang/srt/configs/dbrx.py,sha256=tdhIkXAQl1yr0MxqFmsDG1E0e2puRTTKm6UTyANBLac,11005
54
54
  sglang/srt/configs/deepseekvl2.py,sha256=sYMmoy5_LlDXht7MTi4QGYOaiE8iMGUO44bnuOu4i8I,23683
@@ -59,17 +59,18 @@ sglang/srt/configs/janus_pro.py,sha256=yI2c_aWBIKiTcK6RZxK6hq8CIxyYRH_NN8uaSNKsr
59
59
  sglang/srt/configs/kimi_vl.py,sha256=4W7VQI3pr888ZsFA2SqCQo4mI0seXTOrGQ-x3oTvWew,1358
60
60
  sglang/srt/configs/kimi_vl_moonvit.py,sha256=hx2Rt4JSFbvy2HUTeLjBpge87m8M6ITAhqsgdNf_Jd4,1163
61
61
  sglang/srt/configs/load_config.py,sha256=qs-AxuplouBx2tsv9KGBOLZPbwzuVA4vbktbGP_cRp8,3309
62
- sglang/srt/configs/model_config.py,sha256=TbXN5Vne86gmaIq5E5In30nVvcuPms8mCi7Cn2b6sQw,30967
62
+ sglang/srt/configs/longcat_flash.py,sha256=Qp25xJVLq2K72Z80cXhcJxtqhagAdiPySDoevuT0Sno,3589
63
+ sglang/srt/configs/model_config.py,sha256=0oEbC4bxtfPckBuY_p6uXHB1vDXxhkvJCpr9cPbExwI,31712
63
64
  sglang/srt/configs/step3_vl.py,sha256=_Otgnym57DVgB_kZ__8c1_Ys5gSalA_K0ZuVjcG51T0,4845
64
65
  sglang/srt/configs/update_config.py,sha256=GEf-XhL8JPrbX9-Hz8V7S3M6YTg76DVdIhc_4YdMDtc,6291
65
66
  sglang/srt/configs/utils.py,sha256=3nHUfisMs_Ltuhv8OZTNCJp63YJKJVF43h1QZB1zqx8,670
66
- sglang/srt/connector/__init__.py,sha256=czLX5JOxuMhH-T9eSJzoc1qv1B4z9chyffDRL5I6wo4,1247
67
- sglang/srt/connector/base_connector.py,sha256=i6i1TIzsz4NbSEkrdMPq-urb2sN2aLAx8dazga4gB9U,2833
68
- sglang/srt/connector/redis.py,sha256=KoLLUSY4Lu9zUrRJy2yYdtf1yanTaS0bQP8V0t95DB0,2552
67
+ sglang/srt/connector/__init__.py,sha256=7sKpAYPdW9NC0A3sbUmDVgLuMf9b2jwifnVMs2Q7Ow4,1243
68
+ sglang/srt/connector/base_connector.py,sha256=LCKsTX_yWHclPrzNNB1fLwVCN8rIDKZaZhqHQ54B9MU,2774
69
+ sglang/srt/connector/redis.py,sha256=K3fJSm2rZsd0R_KkICV3jIWKtrwxXE1tYktWnovLbz4,2514
69
70
  sglang/srt/connector/s3.py,sha256=hn5Ow9Y6ItS8RMJDwnTQe5QaiQ7HKMgiwggE9QnUewM,3743
70
71
  sglang/srt/connector/utils.py,sha256=isTvxauz1_8no5MW6p8Bwj2H9mQkweaRO_RSwAPA7R8,983
71
- sglang/srt/connector/serde/__init__.py,sha256=MvBJ7FBJtnou-AD-EdsCdAIDCcA8kWvUNuRViILVJ-0,718
72
- sglang/srt/connector/serde/safe_serde.py,sha256=Iv_mFsDvk-cXuw0WTykBZ2yGxW0jb82DwVqC7r3RmAU,750
72
+ sglang/srt/connector/serde/__init__.py,sha256=zuleyYN-jrDyiPiXjTbQKA27llb4H7HuDTZcBwrLk1U,707
73
+ sglang/srt/connector/serde/safe_serde.py,sha256=XSjb9mRv1HqeG6Jiw633EOQYlrcI23Q21UluYqPZaWA,760
73
74
  sglang/srt/connector/serde/serde.py,sha256=n59I2MXLa7WCyN_8pEd8L-scJk7lMhmEX-GOUIhF0ZA,1004
74
75
  sglang/srt/constrained/base_grammar_backend.py,sha256=ATWX1LKp3GjUDVkauEaSc3MnS8Bt6hOiHUgeYDZtgNo,7059
75
76
  sglang/srt/constrained/llguidance_backend.py,sha256=Au8G8x4EB39w7k9-GFLP2hOPETyeAPw53RRZYdLimpA,6191
@@ -85,12 +86,12 @@ sglang/srt/debug_utils/text_comparator.py,sha256=pg58q3fzsnd3rJKRgZTdcOviOtAv8pS
85
86
  sglang/srt/disaggregation/decode.py,sha256=EELA3krHp4YtRIpUYU0-9LSFd7XQuvKn3yiHGrK7gaI,34598
86
87
  sglang/srt/disaggregation/decode_schedule_batch_mixin.py,sha256=Iu7ehHGAfYIVATtClwX6y-6zxWs-JyDlMotYo_5yuUc,6598
87
88
  sglang/srt/disaggregation/kv_events.py,sha256=yFbtwOeblcCmOXTjg00TopxnyjkmCBQIVz46KB8jetY,13555
88
- sglang/srt/disaggregation/launch_lb.py,sha256=pmHwo1GWbpHZn4IDKnOEHYVcfdKpsYuTHUMowNo3TrE,3891
89
- sglang/srt/disaggregation/mini_lb.py,sha256=4l3W2COZuX8DbLg8AQvAhv5EncH9FkEv2HF5fhn3GQM,14630
90
- sglang/srt/disaggregation/prefill.py,sha256=CLoixMP1qRWO-VEsvVbjfQOu4ggqF0KeuHhxZC-NSvU,36272
89
+ sglang/srt/disaggregation/launch_lb.py,sha256=x355ULx1tUOkSSDae5INMQoG8sPC-l-hMh4FBk9MAaI,3439
90
+ sglang/srt/disaggregation/mini_lb.py,sha256=pZ4MYR0DE_DJpINTcckbJTBdz8Y9NAOjOqPqbHPThJo,15599
91
+ sglang/srt/disaggregation/prefill.py,sha256=gf8ju_REf5FxPg_QtmlMEipeo1N5muUcZHRkaKtfMhY,36286
91
92
  sglang/srt/disaggregation/utils.py,sha256=evdv4AkQxJzTqdO0jrdAr7vHUbBSCEXMzNREh0FoRLc,12294
92
93
  sglang/srt/disaggregation/ascend/__init__.py,sha256=-lxnica6fZYmYNpKwmE8yESUpQ5Sxf2DiZoBHzboKc8,146
93
- sglang/srt/disaggregation/ascend/conn.py,sha256=oBhEQ83SbIlYc7QSG6Cqk48QqdYSlxcSMWbc-2KXlXM,1191
94
+ sglang/srt/disaggregation/ascend/conn.py,sha256=EuCsFMxwxDp7jt8K2uyTtRlIk0Vi5A_VBz6hKYwybhU,4119
94
95
  sglang/srt/disaggregation/ascend/transfer_engine.py,sha256=_4PszsQL6wICdg5cqpR2N9TbZpUY6bBX8tgE3xeaYfc,2137
95
96
  sglang/srt/disaggregation/base/__init__.py,sha256=4VwUv0aWxwmVL1049XK82aLTNxmt0WY5RPy9li-wyVk,160
96
97
  sglang/srt/disaggregation/base/conn.py,sha256=xQ-UB_brdn9vHr-NSbzuR6BysDPGh0Pt9h836iUgbX8,2901
@@ -107,7 +108,7 @@ sglang/srt/disaggregation/nixl/conn.py,sha256=eSof87fG21Dd4COszfnbeXIxne3TWvw0mS
107
108
  sglang/srt/distributed/__init__.py,sha256=jFOcyt-wFAPMBUAf9zkZalNQlt-4rqmT6pCKBz1E4qo,149
108
109
  sglang/srt/distributed/communication_op.py,sha256=IBnFUdMftK_VSTMMMitGveonorFUUVNL4guqO31cMSc,1130
109
110
  sglang/srt/distributed/naive_distributed.py,sha256=5Kcfapzz61G3TtScTZrHoWa4bf6Vr27GlMcBAGMz7tQ,3260
110
- sglang/srt/distributed/parallel_state.py,sha256=ic89h9Ze1yKMnY5s-mpO23LP-DH0zLXmvxDkRWgxILg,65200
111
+ sglang/srt/distributed/parallel_state.py,sha256=NsWEw341ew7dElC9BQ3vBLzaLVTDKCmCkKIl37b72dg,65717
111
112
  sglang/srt/distributed/utils.py,sha256=aaCxATncLGnVgB0WlGpBdee0behKW8Dy_dakqcuKSaQ,8497
112
113
  sglang/srt/distributed/device_communicators/cuda_wrapper.py,sha256=3jvPG-Ow5UBLiXhfx8T8snR7crSZbPpARAggsDPWq7k,7038
113
114
  sglang/srt/distributed/device_communicators/custom_all_reduce.py,sha256=Q1kkKPKFPV0QMmKLyjOBlOnX8-Pr4UeGBZYkG6j0gc0,16570
@@ -123,13 +124,13 @@ sglang/srt/distributed/device_communicators/shm_broadcast.py,sha256=IrSrnpZnii0E
123
124
  sglang/srt/distributed/device_communicators/xpu_communicator.py,sha256=ajW6132BvA6jkeipEIgN27TFycI0U06Ih2Z8WNjlA4s,1593
124
125
  sglang/srt/entrypoints/EngineBase.py,sha256=yKN76witT2jz1zhmLHmPNLGMpK2UiOTaKQ2KPD8l99U,2594
125
126
  sglang/srt/entrypoints/context.py,sha256=aD-94xkD0komuGO5gtYUoJKCHdc4hAipMxQt04yVRGA,8030
126
- sglang/srt/entrypoints/engine.py,sha256=Dt84ZOeuNKqjlC_PNU6dt6Cr4pFJxXwHdkYEjInmaz4,33151
127
+ sglang/srt/entrypoints/engine.py,sha256=wNEYxQTVFHt9EvMzQr5zutX9Cb7RDDn64c8Xckuwhsg,33490
127
128
  sglang/srt/entrypoints/harmony_utils.py,sha256=01T-A5GBUm2b306PcxNEg2rfx4cykBcqNYrzcXTWBlc,13590
128
- sglang/srt/entrypoints/http_server.py,sha256=B_nV6dqQWOHj2t_r0_rip30AMfJ8ZTgnIUJLeVt3qQw,44249
129
+ sglang/srt/entrypoints/http_server.py,sha256=_GEk6RgxlMWYUNXOx9he2OIFOs1-Qan1NrSm0EAGJ3M,49649
129
130
  sglang/srt/entrypoints/http_server_engine.py,sha256=_--j4U04OeJLlnnv1f0XmCd_Ry0z1FlhkrbePX8rYV0,4938
130
131
  sglang/srt/entrypoints/tool.py,sha256=aAXEjBqkr5j6_IgRL8fZCKgoDPY2TikM20-LQXU9TaI,2709
131
132
  sglang/srt/entrypoints/openai/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
132
- sglang/srt/entrypoints/openai/protocol.py,sha256=Tm2dVpIHozcxXVyQuPxI6WTofdz0UfOpA9VeIvMExRU,26740
133
+ sglang/srt/entrypoints/openai/protocol.py,sha256=jnHSYMJfCSTDCcIQpF1rWhJmU_It01CeiwiPlDd5-Vo,28673
133
134
  sglang/srt/entrypoints/openai/serving_base.py,sha256=epD6J7K72p6TP8o2dGYf-a76nXeF80vFhPRpWts6684,5445
134
135
  sglang/srt/entrypoints/openai/serving_chat.py,sha256=t5rZ0LxB1VXeclKex3cbzik4zmJ4ke1XyDmZOtRdJIk,43120
135
136
  sglang/srt/entrypoints/openai/serving_completions.py,sha256=7aamrEWd7hu57c9mJ86Oe8AeI9qHF8TM74T6Gy-Efzw,17844
@@ -141,8 +142,8 @@ sglang/srt/entrypoints/openai/tool_server.py,sha256=rRNGELPV5RHONp55MYkO4_b0NPsP
141
142
  sglang/srt/entrypoints/openai/usage_processor.py,sha256=9LTB5rqdRuMKyZrIXiUBuF_WKaSg9X45YdzERDxbtCY,2746
142
143
  sglang/srt/entrypoints/openai/utils.py,sha256=DT9quW0F1DX1P9NAuMxpERgXcNYKKtm7rd7J1m7EaDQ,2112
143
144
  sglang/srt/eplb/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
144
- sglang/srt/eplb/eplb_manager.py,sha256=Wt7w4L5g1BSsXx1mqoGo8WjkB55f4nGB4KqC3y_ijl8,3394
145
- sglang/srt/eplb/expert_distribution.py,sha256=HSv7kA8qeq25NJW0BcSRTNWQHF-YQsS82XhQMEqw7f8,31665
145
+ sglang/srt/eplb/eplb_manager.py,sha256=MRYyI3A2NgFvpv2R9lHXy_XS_KwZiZWPDxjpckh-H3A,4334
146
+ sglang/srt/eplb/expert_distribution.py,sha256=r7tqDZM-Ez2r6Wq7EnikoyB7fEAuPU60XI16r8DGa10,32705
146
147
  sglang/srt/eplb/expert_location.py,sha256=SIinJLiDhS4mctTiMdIQzQZFchwrrvES0ufEVJ4OGeg,17076
147
148
  sglang/srt/eplb/expert_location_dispatch.py,sha256=vA0o-7bXf847BQAVCqElWKEpofZLAIsir_d0pew2KNQ,4178
148
149
  sglang/srt/eplb/expert_location_updater.py,sha256=eMtJVMCRklfvKPbFiDKy85f5J9s_krJbpRCSArYZjVs,21157
@@ -167,26 +168,26 @@ sglang/srt/function_call/qwen25_detector.py,sha256=nv83_sipZMU6Vie3J4HeNiZVCSRU5
167
168
  sglang/srt/function_call/qwen3_coder_detector.py,sha256=wRsGBH3TUdI3cubWEAmHDFYGojfHyt2bPpV2RCbKsyg,14297
168
169
  sglang/srt/function_call/step3_detector.py,sha256=SAibrispu0peDQzqOG2-V93KGHtV6Ud7a38vlnhTunA,17442
169
170
  sglang/srt/function_call/utils.py,sha256=__ImDF2kNyoLWsYO5RYoryvy1mmgEjnjXlCvLv-uLCM,1695
170
- sglang/srt/layers/activation.py,sha256=uhfhh10N5iLoLEBCvFPRjCfDxu5jXe1ehHJb3ISIjig,7840
171
+ sglang/srt/layers/activation.py,sha256=mAa6E8xTDs6RyuBO0kNXaIuWxOlKfu8jQH5YG9PblhY,8213
171
172
  sglang/srt/layers/amx_utils.py,sha256=1mENgHK2B8mgaD1oMtgbZ15Jmy_Uu1QueBmo09Ff2iA,2865
172
173
  sglang/srt/layers/communicator.py,sha256=RAP_oBwHBZdc5Knnb9FRozStODWc4toqDjU4wvekzHc,22625
173
174
  sglang/srt/layers/dp_attention.py,sha256=35GQIpO8HpF9mtLQSJe2RW2a5rblTLvzAbr1CL0PbSg,15286
174
175
  sglang/srt/layers/elementwise.py,sha256=PjYv7Sk-zKbG9WiGlYDKsxvNrnxT2N1Q8bA2BWvA1Uo,18771
175
176
  sglang/srt/layers/flashinfer_comm_fusion.py,sha256=hnVVS_VsWukTYhREubWs2KcJ1GjVMEI9ECqxqOMXZv8,6729
176
- sglang/srt/layers/layernorm.py,sha256=3qanS30lgBGO8tiR5XaIW3ejJzB-8oYAD420Zjql2sw,9803
177
- sglang/srt/layers/linear.py,sha256=f5BZqcbM-6qILXn9nDN2_Vd1Oy8THk0-5z1iw40jRxs,53397
178
- sglang/srt/layers/logits_processor.py,sha256=jFWv46U6EkH7HLAlpGeC80iump5Kv2QZhHdj35RlQhc,26865
177
+ sglang/srt/layers/layernorm.py,sha256=hvfU36Q_SpHR7renSbXuI5WnENE_i5Z7TuU4dxRN7fw,10614
178
+ sglang/srt/layers/linear.py,sha256=evhlZ_aPFce-m89zYDeEfSrYAOoaMk5BC18vDjGPzjM,53508
179
+ sglang/srt/layers/logits_processor.py,sha256=jCLgKuU8r-T0ZdSjWEWNhtmx408f_NTKVCW20_dn2ZQ,26969
179
180
  sglang/srt/layers/multimodal.py,sha256=vNswe0J0maeBiN8ehlmxfs-YYlrmMllYl6Nc_Y57Neg,5114
180
181
  sglang/srt/layers/parameter.py,sha256=jCg0G-12GZqTa9gGOqEtVCsnnuBGnYg0VmF6pc6oCFg,17455
181
182
  sglang/srt/layers/pooler.py,sha256=uZ6WX1FLMEafZwusyZdm6KuVlIwSjbKrdwk2qzgqNGk,3812
182
183
  sglang/srt/layers/radix_attention.py,sha256=MpugwaqiY2zPTeg7FVW41OljljCXmYVvHZ2MvneF6PI,3745
183
- sglang/srt/layers/rotary_embedding.py,sha256=MZ-P1wcVSr2YA0Iz-4qKIyL8G5p_-nVJU2EA5MVISgM,73102
184
- sglang/srt/layers/sampler.py,sha256=cgtAtsxcllqhlrxk5ktiBEAeeVLZb-5wWb9NlGzkNYg,11199
184
+ sglang/srt/layers/rotary_embedding.py,sha256=lhGVkJpMtuWT_dLbYzgq6J7hXGIdvWiMWxWcww6oWv4,73927
185
+ sglang/srt/layers/sampler.py,sha256=RIcvSriJaHpFhjNPX3CzJzn4Lwy9H3MTPBeZjqAZq9o,11762
185
186
  sglang/srt/layers/torchao_utils.py,sha256=Ws24FdRBSkTpyeyA6bQrdDm-W5wfDxKvSIPUSahyMfA,4063
186
187
  sglang/srt/layers/utils.py,sha256=E7PHisGiD9ZmLS4RWqCUZWxAQJbfc0WaTfRZ37gUlPI,1077
187
188
  sglang/srt/layers/vocab_parallel_embedding.py,sha256=x0421kNUgnAb5LnkJR6O67vGZ0ikSD-ThluV3QGsZ_8,22673
188
189
  sglang/srt/layers/attention/aiter_backend.py,sha256=XfZKrPFL1feerRMRL4jFoBGtbtoOD9gzKFCx8BomfJ4,43146
189
- sglang/srt/layers/attention/ascend_backend.py,sha256=3I6ZCvDMs0QO9ahcg6egt1xLHVD0oLKtcyBG1mU1ciI,18158
190
+ sglang/srt/layers/attention/ascend_backend.py,sha256=zmEz1NfytWADYFmCGBVIGXhVAT5GX_z5fnC8-1r5pK4,23334
190
191
  sglang/srt/layers/attention/base_attn_backend.py,sha256=_vM05ddWy6SaoqWYPR8w5lflSE4MhcVFR271Q9EKK8E,3600
191
192
  sglang/srt/layers/attention/cutlass_mla_backend.py,sha256=PB5BjbJHhmTg_t0kXfarTI6C3pPvKhBAqvCSGGajou0,9846
192
193
  sglang/srt/layers/attention/double_sparsity_backend.py,sha256=2ZRL_gYz14idoVqQzeQ6N77nXer0f_8_TUYw40XUUz0,9161
@@ -195,14 +196,14 @@ sglang/srt/layers/attention/flashattention_backend.py,sha256=3Jgapx8tVh2PbPVi6e5
195
196
  sglang/srt/layers/attention/flashinfer_backend.py,sha256=KLN2t7qn0UtRMeNO9OPLgwyhj23KPAwx_z_OmJSN4uQ,54197
196
197
  sglang/srt/layers/attention/flashinfer_mla_backend.py,sha256=GNHvib_PaUO-JFmUcwRADzF7-4v61KFbvk0yEExMdhk,39556
197
198
  sglang/srt/layers/attention/flashmla_backend.py,sha256=5iSic5ho-lkXNas9mR3uLbXbEl-do31gc8gjR7-a79k,20711
198
- sglang/srt/layers/attention/hybrid_attn_backend.py,sha256=dwbxscTGMOnwfxxPpmGdbSiQ0kQRHnH0pdpKHA-_vqc,3181
199
+ sglang/srt/layers/attention/hybrid_attn_backend.py,sha256=e5P0RxuS5tCfQe4S54WI5vuKjgDvTi4FcvPxgLsIk9k,4451
199
200
  sglang/srt/layers/attention/intel_amx_backend.py,sha256=hH9lxXs_o66_IVs58oPhRCOXGUrHbXSz82FKtHr9GO8,4092
200
201
  sglang/srt/layers/attention/merge_state.py,sha256=OnWmNV6LYTUj0y8SCy_IK7A9q6v9bZwR4_XiLOIvbrk,1423
201
202
  sglang/srt/layers/attention/tbo_backend.py,sha256=CBnSDUmDvT-Tbhi9NHNo1LLkgUAcIsWMJgKa-sAIKW8,9318
202
203
  sglang/srt/layers/attention/torch_native_backend.py,sha256=RsI4lYiQJAj-Xy0vKkzbyKOWHAVPOD9b0n0dEehwlos,9496
203
204
  sglang/srt/layers/attention/triton_backend.py,sha256=fvcJLaJaM8JE9Q9Nkmn0dzdYnnYlwELCoxQGMoqS9Gk,41858
204
205
  sglang/srt/layers/attention/trtllm_mha_backend.py,sha256=8MxCAzqsNuvO3mhFqTMXCJ0Tt0_82kFbBHie6m0ieDA,27588
205
- sglang/srt/layers/attention/trtllm_mla_backend.py,sha256=pkXARtA9ISC3RL82mqjY7vzfsK-u1rvMRBcOn2n0J_o,19101
206
+ sglang/srt/layers/attention/trtllm_mla_backend.py,sha256=NBfuORA0oUlS_uB0I_ikHvUSVKsPbVVNdbvakyCQ3XY,19830
206
207
  sglang/srt/layers/attention/utils.py,sha256=lx_jNw2VwlBe2VnDb1eXRRdN9WArw9rdWHTHqndUEFk,3174
207
208
  sglang/srt/layers/attention/vision.py,sha256=PZUJuswPWvJ34NTtxJkcXnusojDv0pO0UhrsjL4SWYU,20268
208
209
  sglang/srt/layers/attention/vision_utils.py,sha256=6hPPAt8p3SOm7tgHNUesnMLxvQiKbaOM5EK6K-ig5dI,2771
@@ -219,18 +220,21 @@ sglang/srt/layers/attention/wave_ops/prefill_attention.py,sha256=viTUit0rxjVV5Ua
219
220
  sglang/srt/layers/moe/__init__.py,sha256=63TxUpSiUpVg1SDY1zdlTg3WFJzAc7WSndOViOmUv4E,835
220
221
  sglang/srt/layers/moe/cutlass_moe.py,sha256=JKJED-4709ndP5AwhQ7Vi04GJjw5d9Xl_mWOsZPZ3U4,14298
221
222
  sglang/srt/layers/moe/cutlass_moe_params.py,sha256=9NRCmgP_Ug3gGqCcpi-x-QRbLjCNpw8792gKXwZsbEU,6522
222
- sglang/srt/layers/moe/cutlass_w4a8_moe.py,sha256=rWyHMg0kYZhIdLWTJeC7pqRG9ywfeKqi47-OekNeF4Y,7306
223
+ sglang/srt/layers/moe/cutlass_w4a8_moe.py,sha256=pUvYkbm3kD5IBjVuJeehU_hvEvdNcYcO2eRZXDc6iLI,7005
223
224
  sglang/srt/layers/moe/fused_moe_native.py,sha256=8SAToE4B-22H5JsENZgJ1Io6QfE5-D9ItWLtbGksFQQ,3372
224
225
  sglang/srt/layers/moe/rocm_moe_utils.py,sha256=07Z99bTV3B-b2Cbm-odhGpx2twxtnVpYvaDMBE1K3LM,4555
225
226
  sglang/srt/layers/moe/router.py,sha256=eUNu_Uz5VB2FOZzZyYuZo5pokCVBS17_fcjHQbmvDSE,12181
226
- sglang/srt/layers/moe/topk.py,sha256=wxCkMzm4FdCQM5-Gr5eS0qTTbKxntU6dFKU4Qn9DQYc,30377
227
+ sglang/srt/layers/moe/topk.py,sha256=r8pE6eJ8dprfZxaw8VcfrRvSp6_xDNPkr0tajmG_CZc,31349
227
228
  sglang/srt/layers/moe/utils.py,sha256=omh9E6sF-KtrELEsE9y01Ash7FfQlstyE-97UtpH8qk,5998
228
229
  sglang/srt/layers/moe/ep_moe/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
229
- sglang/srt/layers/moe/ep_moe/kernels.py,sha256=7MieYfBctQjqfBoKun_QUyfloIrrgt5tjzmMkMoY5Ys,44107
230
- sglang/srt/layers/moe/ep_moe/layer.py,sha256=Ro4SQ9peGw4-1oHFHsw8HvFb2yEdTkB8JH7MnSV1hoM,27816
231
- sglang/srt/layers/moe/fused_moe_triton/__init__.py,sha256=4NXZHbCw-G-uSnNUj4up0yh3xBDPnT-x0pdoIr0lku8,831
232
- sglang/srt/layers/moe/fused_moe_triton/fused_moe.py,sha256=JKp89Cdl8a85tKzmJa4ah5VtxZzRNBSbY4cnsAtnvio,60803
233
- sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=jub7moptP9UjyRYJ2gPvY8HEnE41d_oFbZgjVvNsJxQ,39409
230
+ sglang/srt/layers/moe/ep_moe/kernels.py,sha256=Acg6dW-zVDQ95vuBVuzxb5SUFFxhLCewk_tVSZeuma8,46158
231
+ sglang/srt/layers/moe/ep_moe/layer.py,sha256=uAHuiAILb3XQi9t1JGMElfzvsG9cKIDMXs6ezEGhGvY,27776
232
+ sglang/srt/layers/moe/fused_moe_triton/__init__.py,sha256=tis0ZJmih7gKHCurbLtY_o-bY3K4MOzQLYLC3ftIOf0,977
233
+ sglang/srt/layers/moe/fused_moe_triton/fused_moe.py,sha256=q_L-eZh9pBP3KZLipv9cRe2WpezNrHMz8NzMy97TV0Q,23178
234
+ sglang/srt/layers/moe/fused_moe_triton/fused_moe_triton_config.py,sha256=fFnRcXA6r0gnD_7EQmb8NacQJRJ8YHsmMZw2khlClTQ,7687
235
+ sglang/srt/layers/moe/fused_moe_triton/fused_moe_triton_kernels.py,sha256=z10ZJLrFFhgB5_cEFrvMt6bnwe46T5Vzz4nvMl4ErGU,27776
236
+ sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=TI3p8FOJJjpoyE7VMngs9BPeiiN9M9XHZJRWVTWtiH0,39637
237
+ sglang/srt/layers/moe/fused_moe_triton/moe_align_block_size.py,sha256=U93mxPPU2RP7d3QRSvoG3OCtUQIK8YhQfHf1ZGeREmY,3284
234
238
  sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py,sha256=Ai06BZ7uxMnk0nPWQelgvi1rV9Z72FetRo6p7E3rsYs,10986
235
239
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_1_0/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json",sha256=iNGsE2ZeVnQEnN4A8UJ9Jv0d3hbRF2MJ9oBgjup5Szk,2737
236
240
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_1_0/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB.json",sha256=JJN0hryyLr5Zv3dSS7C8cPFhAwTT6XxUVnBGMZvV6JA,2752
@@ -417,6 +421,7 @@ sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py,sha256=Ai06BZ7uxMnk
417
421
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=8,N=7168,device_name=NVIDIA_H100_80GB_HBM3.json",sha256=a9XJZ0XudUTebAdN5guVq-3XSvZetHIRjatO1-_0xCk,3257
418
422
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=128,N=384,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=6JYGN4imwzIrQAEgboSO93wWYBuguzTgBjfTedq2c_Q,3250
419
423
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=128,N=768,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=dPe_9-JH0wF8q7Mhec4WWSLSGRE2gj_AQT3dnR3FREI,3257
424
+ "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=129,N=352,device_name=NVIDIA_B200,dtype=fp8_w8a8.json",sha256=ClPogINm5AsnjDqx6Hz_rHrmnnCdUPid-jYIdIgjZxs,3250
420
425
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=129,N=352,device_name=NVIDIA_RTX_PRO_6000_Blackwell_Max-Q_Workstation_Edition,dtype=fp8_w8a8.json",sha256=RMYwqtB7hYeaCyuZ1feVnRhBGlN4jMcmNQX2hqUqBlk,3254
421
426
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=129,N=704,device_name=NVIDIA_B200,dtype=fp8_w8a8.json",sha256=W8C1GtP4K43SK9128U52DD5WWofvPleAJE4us2Qju1k,3251
422
427
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=161,N=384,device_name=NVIDIA_RTX_PRO_6000_Blackwell_Max-Q_Workstation_Edition,dtype=fp8_w8a8.json",sha256=RMYwqtB7hYeaCyuZ1feVnRhBGlN4jMcmNQX2hqUqBlk,3254
@@ -444,18 +449,18 @@ sglang/srt/layers/quantization/int8_utils.py,sha256=YK9CS-lb_n91kNCTKK5o5apYF31V
444
449
  sglang/srt/layers/quantization/kv_cache.py,sha256=_9pF5rwvB7ta6Gdc5YKVVGbNzYwqmhIx4TrX1-xnodQ,3261
445
450
  sglang/srt/layers/quantization/marlin_utils.py,sha256=aM3GU7b7rHNZE-tZjRSrtOaPWzSaMcLxck4he8MlEVI,26344
446
451
  sglang/srt/layers/quantization/marlin_utils_fp8.py,sha256=iSjq-ikPOTU5plrWNTW4MletKLySIrNl5NhQmY6FyAo,12508
447
- sglang/srt/layers/quantization/modelopt_quant.py,sha256=k0F6b-bG5wv3zL7kipqCrQHEZ8QjfIDThnU9Y3mFNTA,52566
452
+ sglang/srt/layers/quantization/modelopt_quant.py,sha256=jWo_RzjZ993x7ZkV4c2MLBVMCqaL7lqaAlJpm9EDajU,52979
448
453
  sglang/srt/layers/quantization/moe_wna16.py,sha256=brU0nG6StgjGuuhOjpeoh-wJVZ1SUgbuHhiDR1hibbw,18905
449
- sglang/srt/layers/quantization/mxfp4.py,sha256=xCTaEtL9KLMzHjMP4snItR4sXKACTk1TCNQryRzmaXE,31195
454
+ sglang/srt/layers/quantization/mxfp4.py,sha256=-HL6fBteyLSIc_y48kiroY1-OXpe7oJ8918hLiiON6s,31374
450
455
  sglang/srt/layers/quantization/mxfp4_tensor.py,sha256=bGeCXlIOhmFZFGWp_lITkIRDEgGUaLpawDvMy1cTOmA,5389
451
456
  sglang/srt/layers/quantization/petit.py,sha256=74Jn0eICq23v_b4rEctDaYTINtbqkdM6IXycT-_FbbI,8954
452
457
  sglang/srt/layers/quantization/petit_utils.py,sha256=-gy4zMhqNoIA1R0n7-5C0efV54jHonCUgPDUUFjGsyM,3245
453
458
  sglang/srt/layers/quantization/qoq.py,sha256=jM96uJfKz3vo1B6SSIrQXNT3vnD3UJrepK2eY-tSQU4,8139
454
459
  sglang/srt/layers/quantization/unquant.py,sha256=CxsOEYqYIfanKHo0ooFArbVz2ueX3vBWnYHE8gtnzdQ,12996
455
- sglang/srt/layers/quantization/utils.py,sha256=DdsHXkB5R8YlzhOIEz9QqxAE8swrH0V9DKsNPrk8GSQ,17969
456
- sglang/srt/layers/quantization/w4afp8.py,sha256=345w-gCDes3dGqCUAmjyzXZemsIEWc_swJ7FyJyzFTI,11392
460
+ sglang/srt/layers/quantization/utils.py,sha256=d4eaS4-Z4q3GRgb4HDMr2EoWEdQCefrVdJufK6n_NQY,18509
461
+ sglang/srt/layers/quantization/w4afp8.py,sha256=Cm_KjJQu-XKqSKh6usJ5tNXARm6F5n_C2P1c1NuYdC0,11720
457
462
  sglang/srt/layers/quantization/w8a8_fp8.py,sha256=wzJi5jeTnbf-01iehOVTTCu_262rlMh9AQ2rogKWBmo,9981
458
- sglang/srt/layers/quantization/w8a8_int8.py,sha256=33Q_pWBj3l5MoLyrJ0i5hZvn-mCyeskzgS8oRoh72eQ,35138
463
+ sglang/srt/layers/quantization/w8a8_int8.py,sha256=cOKbhWxFlv6hw5dSs8ExPBXFcTwudwR26m3CAoOhCSs,35342
459
464
  sglang/srt/layers/quantization/compressed_tensors/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
460
465
  sglang/srt/layers/quantization/compressed_tensors/compressed_tensors.py,sha256=DsPCI82A4rqI6mjKo-WorIKUweppFV7-16Qku-zW9_g,25897
461
466
  sglang/srt/layers/quantization/compressed_tensors/compressed_tensors_moe.py,sha256=jWgfDtg5r6IRKJUpYXf5Tp13pWekoUCnYi8LMZ33PcU,25940
@@ -617,8 +622,8 @@ sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a
617
622
  "sglang/srt/layers/quantization/configs/N=7168,K=256,device_name=NVIDIA_H20,dtype=int8_w8a8,block_shape=[128, 128].json",sha256=FImA-TJ_tQDjqwoNWxS--sRDoKDXf9gamlME3tkxH58,3252
618
623
  "sglang/srt/layers/quantization/configs/N=7168,K=256,device_name=NVIDIA_H200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=FFBjSWlpKXMxfAUUYUqXbOK_Hd7qBeBsfbcaa9uB4qY,3249
619
624
  sglang/srt/layers/quantization/deep_gemm_wrapper/__init__.py,sha256=esJMd0Yuj68t6QYOpmIFuiWP2J2dxTMC4bRBNH0Xk6I,26
620
- sglang/srt/layers/quantization/deep_gemm_wrapper/compile_utils.py,sha256=x5CcDGvfvJStt2yS1tlfOup7UcG_0L7iHPMF33mR9-U,7908
621
- sglang/srt/layers/quantization/deep_gemm_wrapper/configurer.py,sha256=WAMl4vrG6fXw2ar-svT-UO-mgUzwGV6dumkUiUxuTaY,876
625
+ sglang/srt/layers/quantization/deep_gemm_wrapper/compile_utils.py,sha256=PI9r3PHCMK9EgpoFuBgR4jvokA5sBz8zyC47ps3wet4,8164
626
+ sglang/srt/layers/quantization/deep_gemm_wrapper/configurer.py,sha256=8C4xyO58N3Zl8h-fYddUpXDs3mnSqjYbaLt12cPB2XA,778
622
627
  sglang/srt/layers/quantization/deep_gemm_wrapper/entrypoint.py,sha256=vCj5vdAshEB9mAgSUYXhgJ0bd1Ithmu_n4-m_IWUbd4,2531
623
628
  sglang/srt/layers/quantization/quark/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
624
629
  sglang/srt/layers/quantization/quark/quark.py,sha256=EqQvWzAc6nd_yl6UIMIwmozKif4I8fRNfBum040UUEQ,14613
@@ -641,49 +646,50 @@ sglang/srt/lora/triton_ops/gate_up_lora_b.py,sha256=QURCYxHNR8Ls4SQtt3dvdgjvdDVh
641
646
  sglang/srt/lora/triton_ops/qkv_lora_b.py,sha256=z9BB84Xu_MjwCu5v9Yvji-FkIzfEjDySAFybc4WYv7A,6483
642
647
  sglang/srt/lora/triton_ops/sgemm_lora_a.py,sha256=Ksova04wgeGsFqGOXWqJtMYaHgyUYcx8VU42BZQOkVA,5129
643
648
  sglang/srt/lora/triton_ops/sgemm_lora_b.py,sha256=VqCAFvUtq_l-0RGIkx3W_fzD55QcW2FAcqpvSHOBFp4,5115
644
- sglang/srt/managers/cache_controller.py,sha256=iSGfeS3IATQ6bcYEoDVZZvybP7KAJZGTX_SXw46JalU,34560
649
+ sglang/srt/managers/cache_controller.py,sha256=WEaM01U0al13oSU7AHvwEBcmOy-1SmtPWbikgrPAx6g,33130
645
650
  sglang/srt/managers/configure_logging.py,sha256=8sNXZ2z9pBWOwn-X3wyz013Ob8Nbm1zDxRkxoZjH-l4,1633
646
651
  sglang/srt/managers/data_parallel_controller.py,sha256=VvEkidmYCGAFTv6upEHf_tyTvkM8xLhCyOnLJGWL6BQ,14592
647
- sglang/srt/managers/detokenizer_manager.py,sha256=I1V4PqQo23stteiwyJXQryP2pAauNNq-pbeffhTDgQI,11244
648
- sglang/srt/managers/io_struct.py,sha256=xXMgXavOnQAPA3vI801nzZ9ha6QYMNmai5uSWcLQ-zU,40023
649
- sglang/srt/managers/mm_utils.py,sha256=0Kr3VJKINr9o4k2Tg2KN0Zb9kxRYBd4dxd0ImTbKHw4,29351
652
+ sglang/srt/managers/detokenizer_manager.py,sha256=mVEzkaCTu0MUe8QuwQC9uReOJgTWVQYXcItlDS2gYK4,11594
653
+ sglang/srt/managers/io_struct.py,sha256=ebAKRqBYj4slW25-dWs51JAW6caPcvuIMlSoJJZd8wo,40503
654
+ sglang/srt/managers/mm_utils.py,sha256=J5hahCJ7HAKhJtGzV6PRa5HB9B2NjYwWGYMqIgiGC60,29444
655
+ sglang/srt/managers/multi_tokenizer_mixin.py,sha256=5HbUePDkWeEua_500sEJdKYp9CfRITKUAeFEBp8OR7k,24706
650
656
  sglang/srt/managers/multimodal_processor.py,sha256=cnWpu2G79v1a6FJB_FriLxESgGUbfC3GptLmeRVVgew,1801
651
657
  sglang/srt/managers/schedule_batch.py,sha256=9lhBnf-siQjsThD8FRyhiF50N-LOE7dfoPr1uzklnjQ,77170
652
658
  sglang/srt/managers/schedule_policy.py,sha256=vh9BQW9tBv80LW4JApLE6smU2m4gy6cAEI25HVXiS60,22383
653
- sglang/srt/managers/scheduler.py,sha256=RQuW5MrfSkl1F7TbioVuIeYujiRp_leANRhzxyRhTHU,109467
659
+ sglang/srt/managers/scheduler.py,sha256=Ipdj1_nDJDUNWb9Hx2W4NNndvhwRkn6B9rBGmJhDklc,111243
654
660
  sglang/srt/managers/scheduler_input_blocker.py,sha256=zP8xU_UmU2H0AB6sEqvivDcDB1QDgTauNDYDIJ7Nez4,3683
655
661
  sglang/srt/managers/scheduler_metrics_mixin.py,sha256=31BbukSyUUPMNHLqRlS5sEiAv7Gi5VHFQ1TgxvcAdcw,10054
656
- sglang/srt/managers/scheduler_output_processor_mixin.py,sha256=e_l5TRm05liINSAeZU-YPRpJXcutmEWYV30F1vPaxbs,31345
662
+ sglang/srt/managers/scheduler_output_processor_mixin.py,sha256=CLwF58GTV7PkyYUoC-R7ROA-cZt8di9_9n2pajacxUY,31511
657
663
  sglang/srt/managers/scheduler_profiler_mixin.py,sha256=A67lC_U7HUCf_znatXK51orC8xeFNGouJ866HH_Y-yc,11402
658
664
  sglang/srt/managers/scheduler_recv_skipper.py,sha256=8rVQCBjn9f26Th4XbeUS3fEsvo1GI029Me28wMjcKRY,1103
659
- sglang/srt/managers/scheduler_update_weights_mixin.py,sha256=R81fU-0aIJoi5URm9IA-n2sEjvn3phGXOhzJALZjiOM,5467
665
+ sglang/srt/managers/scheduler_update_weights_mixin.py,sha256=uk7Dusr8EJBDRdcuQNIoedj0oP4tmSWrUbEqmjclwnk,5813
660
666
  sglang/srt/managers/session_controller.py,sha256=FGADRGSkRmS76o_BQ2fivpgw0Q5Q-K0Ws3aezH41YSc,6041
661
667
  sglang/srt/managers/template_manager.py,sha256=m_cy_KY5bOkDlh6IB9ocisy8N5r7abp4nfFnhruNxFg,11947
662
- sglang/srt/managers/tokenizer_manager.py,sha256=xW3fNwocCtHPAjc1EEegpzYqpeMfOd-SFvIDfUn0pKw,86156
668
+ sglang/srt/managers/tokenizer_manager.py,sha256=YaWYZ_FWjVPY1PaUqRBUgsREWgJ4YcN0n2CKaCXXhRw,88266
663
669
  sglang/srt/managers/tp_worker.py,sha256=n_DqSD4JqOJYjdZrchOpmpuTazRw-AUrs6RPQYuAPyQ,11933
664
670
  sglang/srt/managers/tp_worker_overlap_thread.py,sha256=NXjrBT7lvdUlDDNFzEQyFYCerpqj92sNl2YynGhQj-Y,11118
665
671
  sglang/srt/managers/utils.py,sha256=WbUdADEdiSOoQNfwjfU64mNaXoskEveBO1HP_t0FJtQ,5687
666
672
  sglang/srt/mem_cache/allocator.py,sha256=5cLql3bTIFElYn9S6baBmKCO5L88W_sPC-TsTMZrk_g,18216
667
673
  sglang/srt/mem_cache/allocator_ascend.py,sha256=i0KPCcFlzGkCIjW8ph3IPkBXAWTqq4-AeaoG1wR--lw,4471
668
674
  sglang/srt/mem_cache/base_prefix_cache.py,sha256=hLS2ncTMAz7Kpdk5pNwn5c6g8b61_K9OCBL4Vj1xsYc,2801
669
- sglang/srt/mem_cache/chunk_cache.py,sha256=xQjfmpijkkNRuqfwYMhoiV2nJAviABX4uOSLE-yyVus,3184
675
+ sglang/srt/mem_cache/chunk_cache.py,sha256=jbJeEEZ5_WYEF_AnDZIAu2sMD4hAGAd_24F980fjVwU,3199
670
676
  sglang/srt/mem_cache/flush_cache.py,sha256=GYcxmNXh4hsMpFfNOuCTpKilW7guZwTtAg_usVeM3J0,979
671
- sglang/srt/mem_cache/hicache_storage.py,sha256=hs8jp88UEOJKsNVsqp_z0GbmRrWs5oQSZDGMUGAUDDk,6974
672
- sglang/srt/mem_cache/hiradix_cache.py,sha256=yhBuVZKqpko0Vd55aJd34Fqk-xeCbo6woD5EMOoeA54,28574
673
- sglang/srt/mem_cache/lora_radix_cache.py,sha256=FCA1d-TSqXYPrz9-m-cRrxse9RtwALXltGNuzR-PnB8,14354
674
- sglang/srt/mem_cache/memory_pool.py,sha256=md3W5lWoa5-g0XLHyYI_EIqcW6yijN7usnbmbD_C_GY,39396
675
- sglang/srt/mem_cache/memory_pool_host.py,sha256=cXNn4C0m-MXM6g36uF1Dx5Ld9zP9ZAhlTngohQGpfUc,26215
677
+ sglang/srt/mem_cache/hicache_storage.py,sha256=eidtVRRsT8efqaEECXRLcxwJ7OomstzOctbqTucOLNg,7307
678
+ sglang/srt/mem_cache/hiradix_cache.py,sha256=k7P_MHQnFfvFj41T3WseTQQR0Hpun4VXrqtqnjKZHtI,29155
679
+ sglang/srt/mem_cache/lora_radix_cache.py,sha256=4NbK0Rc15kTiCOSsthyM6WsZarMK2MNhtsNqYMakJ5k,14369
680
+ sglang/srt/mem_cache/memory_pool.py,sha256=EGZtQsgXDOuySeEBdV6jBIt9ZDvqMsErNPe6P5ifHh8,39540
681
+ sglang/srt/mem_cache/memory_pool_host.py,sha256=Uy2sGFEVupj7ZBWRFBgnkn0s5Yb8NzmKre9IbBQ-ut8,26189
676
682
  sglang/srt/mem_cache/multimodal_cache.py,sha256=zPnQLQhBZ6zsUpCQPSoNkrB9EEvpoDQS4mU7c3sRWjE,2171
677
- sglang/srt/mem_cache/radix_cache.py,sha256=MdX_gYcrif6HJQTIGTD9sA1zOLIn8920lbqTO96TpgQ,19085
678
- sglang/srt/mem_cache/radix_cache_cpp.py,sha256=1V-XxYC2jxQYUMJBLrlcSMcqhCBo8TC7wRTTVbOaMkY,9269
679
- sglang/srt/mem_cache/swa_radix_cache.py,sha256=4qt_gS7GuHiekd6VvKkx54dB2GHJzNA_kj71Np6jTDA,40300
683
+ sglang/srt/mem_cache/radix_cache.py,sha256=U0KEjQNcwhdFWnXYTMhDkxpiazAD1ttbADEkGPHiiTU,19116
684
+ sglang/srt/mem_cache/radix_cache_cpp.py,sha256=YuYt4xNzfmNNSkwaAk3VLWcZI74_XQobIyEgt96f7Qs,9284
685
+ sglang/srt/mem_cache/swa_radix_cache.py,sha256=hV5OOmAqu4UT80BVsu7lhGewcbq-u__JKx5T1lgxJyQ,40315
680
686
  sglang/srt/mem_cache/cpp_radix_tree/radix_tree.py,sha256=tQZpz-H6HxNAQe9mYqt6aX8mfDZyu_fbJTcCNK-Ns1M,7179
681
687
  sglang/srt/mem_cache/storage/hf3fs/client_hf3fs.py,sha256=WV5M9UPPLUMMjU3Mpp6HBqyCQpGBuMyj-N5PwQcNo5k,5178
682
688
  sglang/srt/mem_cache/storage/hf3fs/hf3fs_utils.cpp,sha256=dDYPtxmL6OFhEyv_GuTgzkTDpBjcD0EK8kphnn7eaGc,1133
683
- sglang/srt/mem_cache/storage/hf3fs/mini_3fs_metadata_server.py,sha256=OfQMFwbbQg0pbC7rJktg5wz3YFhNsNOjsXCsAjrh6iU,16738
684
- sglang/srt/mem_cache/storage/hf3fs/storage_hf3fs.py,sha256=MlN9RLhd2W81RDSvaPtGm_AP_QKwO_KWUSKXMi_rnL8,12918
689
+ sglang/srt/mem_cache/storage/hf3fs/mini_3fs_metadata_server.py,sha256=lJ9Jp2kOgQQaUihxlO9l-W8fYfOMa1h1y0WAtzzFGLM,17850
690
+ sglang/srt/mem_cache/storage/hf3fs/storage_hf3fs.py,sha256=2sa0fgXRB0rkOqGbewRtO11A8ES0DhlKZi7nZmD330I,14873
685
691
  sglang/srt/mem_cache/storage/hf3fs/test_hf3fs_utils.py,sha256=g2h0Woa2CK39pRTigHCVR_hq095dTaC70lCIAIs9THM,1089
686
- sglang/srt/mem_cache/storage/mooncake_store/mooncake_store.py,sha256=TevMG2cd05-uUxDfW1LDk35pLwOwiTfVDdVyw-4lsZs,9951
692
+ sglang/srt/mem_cache/storage/mooncake_store/mooncake_store.py,sha256=S0UAG86sVMDc4-LvzSZrLKeW0fec5D7py_sqe3JtXEk,10000
687
693
  sglang/srt/mem_cache/storage/mooncake_store/unit_test.py,sha256=jMdJgU41VscKS-mn_AVZE8LQbb_3MWQ57i9V3OCWLI4,1007
688
694
  sglang/srt/mem_cache/storage/nixl/hicache_nixl.py,sha256=bau9Jsp50lpEiy_osgb-dYzeoUkPWM03x7Q8z2BpKaU,9920
689
695
  sglang/srt/mem_cache/storage/nixl/nixl_utils.py,sha256=KXkwMrbWwIOUOASINnUo4HyheiMd-93smmwGLv0CacU,7463
@@ -692,11 +698,11 @@ sglang/srt/metrics/collector.py,sha256=IfFr4RaamT3TPj9DjuEnvkdiBGKcIUCQSIIwd9GeZ
692
698
  sglang/srt/metrics/func_timer.py,sha256=VFyNRrbnKVCwnQsrlLin1lITJfjQpf9m8sGPqL5LIsQ,3438
693
699
  sglang/srt/model_executor/cuda_graph_runner.py,sha256=fZT_CQwhfu7kdnliKu5lYM2tunU0u3wBoIlCxm4FXCA,33920
694
700
  sglang/srt/model_executor/forward_batch_info.py,sha256=2KBu9SChR-YwSNbw1mO3WR0P_EGQjFUC5rQfBx6js90,40707
695
- sglang/srt/model_executor/model_runner.py,sha256=VlSgaKfGa7E14wF18xOKte-PPHzgxVczPVzEQ646nwQ,78533
701
+ sglang/srt/model_executor/model_runner.py,sha256=z24KnHB_GLD1XRtk9y_bLbN_T6ASWV8U-mV8u20Dkbw,78474
696
702
  sglang/srt/model_executor/npu_graph_runner.py,sha256=isp2Plkf4b_gdjptYxJhTJk7JL21Jg-Md3hAYIuSVxM,3424
697
703
  sglang/srt/model_loader/__init__.py,sha256=zGZkOBz1zx-pkaIy47BasL3fjDlAcxAXUTjInOhXHAE,919
698
- sglang/srt/model_loader/loader.py,sha256=GPKjMkulnIqlX7gdSSpSselsXLpbEtCLscleC85-1jM,60879
699
- sglang/srt/model_loader/utils.py,sha256=svSrPQxViBz_-0_sByu4coCYrzJ51-4FCi_bFqa6rDo,4474
704
+ sglang/srt/model_loader/loader.py,sha256=RGcqzjQnOK2W-M3IURnmocNm8vZRG3ly_-76nye79Tg,60189
705
+ sglang/srt/model_loader/utils.py,sha256=KrOpyd_eefZC3zFnhnwxIKNTx9G-MmA6jIK3NQbTW0E,5002
700
706
  sglang/srt/model_loader/weight_utils.py,sha256=dHEkm0c4w-lyhJBzktvmop-Psmkpb2KoTu7Azgw7VgU,38555
701
707
  sglang/srt/models/arcee.py,sha256=Q6fujRESEnljzs8ls3XGsPtWxzfKfUa0QAvAekYzeBY,18981
702
708
  sglang/srt/models/baichuan.py,sha256=HbvlErnkCSK4pRQYCSDxMcrn-1DQyfiNoeDcnRrJas8,15807
@@ -709,7 +715,7 @@ sglang/srt/models/dbrx.py,sha256=117gwrB_o8VlACwDH5YlXkPfuS7t2Mh-nyJvpNpIYxs,159
709
715
  sglang/srt/models/deepseek.py,sha256=M7nyHcAbTIs8vc1g6u00oy22-pp704Xp4T3clBzu4xM,17460
710
716
  sglang/srt/models/deepseek_janus_pro.py,sha256=td8xGs6ARfJ8AQCYwUhMOZoWigrAs7m3trF5-kXCqik,70418
711
717
  sglang/srt/models/deepseek_nextn.py,sha256=uoiJxAVl9DX7bQcjyuouAZz6W-cB1HMubcirTBghyR4,6115
712
- sglang/srt/models/deepseek_v2.py,sha256=hgz0N6iX1oIRo0iR5apPA6nVMAmtlQLJHh3OOLR9Vuw,106961
718
+ sglang/srt/models/deepseek_v2.py,sha256=IOSLn1PV3GUsNmP10nd661EOlDI3ThGZBjHS7fSEnIE,107953
713
719
  sglang/srt/models/deepseek_vl2.py,sha256=7X3gI4DE7guUtNJvMLf06jO8MUHKa2Aan8evZg5hsXc,13061
714
720
  sglang/srt/models/ernie4.py,sha256=7dP7_d0i86tv8Mp21Ew9RdsFr6TskIkm8UtUd8zFo00,16067
715
721
  sglang/srt/models/ernie4_eagle.py,sha256=E7f-ygCcY8pIoyTMKFyVC2uRcG59-_RaQTO4gd5_uWI,7223
@@ -729,7 +735,7 @@ sglang/srt/models/glm4v.py,sha256=WtDvH4691H6IKrcGBrkBpweSm_iFK61bMEfvqpbblmc,23
729
735
  sglang/srt/models/glm4v_moe.py,sha256=qgJtWyRI0dy9qcTMXHxhBZp-ghfghV3PLhpOXgSAW60,17313
730
736
  sglang/srt/models/gpt2.py,sha256=kclhxEs8oJk1KCyhmAqo7rZqecVGGHYkc-a1WZi3aIk,9841
731
737
  sglang/srt/models/gpt_bigcode.py,sha256=1D6bi8Zu760gCRZkvdLHFcg8kCkY35ARwQYaMDtYhl4,10307
732
- sglang/srt/models/gpt_oss.py,sha256=bSi0135zmMDtmKDcMiq1UKHa7hGaUfmx3R_ky8jkuto,44934
738
+ sglang/srt/models/gpt_oss.py,sha256=6g7PE6EiOLDipmhV-XKmBcuoCGbhH6SU6NwsSoB_FJM,44469
733
739
  sglang/srt/models/granite.py,sha256=8q92shxVPAp_cJDohJATffSGd7Z0Oi-vF5jpY6DlK4s,19840
734
740
  sglang/srt/models/granitemoe.py,sha256=j1rgZ62CbBioECjUblDCw_NneDQgY_QJODsI0fqXVO8,13779
735
741
  sglang/srt/models/grok.py,sha256=8KCR13LtdnhswJrIwgb0sdFW0OxCA8GQ0fbN8gb856E,40518
@@ -745,11 +751,13 @@ sglang/srt/models/llama.py,sha256=tdyUon6icwzqo4XTAkFxVA2f82g80AGr9ZezK1uXmkM,28
745
751
  sglang/srt/models/llama4.py,sha256=Fp5kqnk1v9Q1TOZH6uXkFKOOZLjV-B6FGoWpw7icO9I,19598
746
752
  sglang/srt/models/llama_classification.py,sha256=4QWTFaUZIFKYZvEzs8bx8VkOZNIwdYCLrnwrdAw4QK0,3108
747
753
  sglang/srt/models/llama_eagle.py,sha256=Ubh_jmtfiOnriwvHgQT0ZGID7JvYvdSi_QGHOIkEgPE,5028
748
- sglang/srt/models/llama_eagle3.py,sha256=715soylDE3kOMWskbPy_70BFxaSc5ptaHCS1v3-ViA0,8579
754
+ sglang/srt/models/llama_eagle3.py,sha256=Rwije5WiCollXFfv4KPIshorboNozLk1NZI3MqVPGjU,8786
749
755
  sglang/srt/models/llama_embedding.py,sha256=zq-_lNu35VBFc7eemiam0zdkGIE8fzrgk5OWYfirZnA,3254
750
756
  sglang/srt/models/llama_reward.py,sha256=LF2nqMV5XOrljGjAwJg43mBv3z6Q040I2EYlgZeCp8k,4681
751
757
  sglang/srt/models/llava.py,sha256=xzYip_BAwpzSIdZre43LZiyTpFISa0ZCLdO6LUSbaCg,37702
752
758
  sglang/srt/models/llavavid.py,sha256=-CSk0RJ2MQeb81sh-RISeVJFaI-XWY6nR6_I594MkME,12818
759
+ sglang/srt/models/longcat_flash.py,sha256=gyElibQ9q_qq4tBA7eah0f3bLSzvMEpgD_n6CcRyG9M,41055
760
+ sglang/srt/models/longcat_flash_nextn.py,sha256=oVy776-AE5z43C472oqHlcl9NfzDDEaQgGB1msZNdgc,29644
753
761
  sglang/srt/models/mimo.py,sha256=Mp-iFp4YHuiuq-H8enUF5K5QbMnVcvEa6mURH6vM3yM,6140
754
762
  sglang/srt/models/mimo_mtp.py,sha256=jSmqJAXu7G3OO7jW1oa2suI4H_Yl7u5ZT7w4lHFbHhg,7292
755
763
  sglang/srt/models/minicpm.py,sha256=CzBJyZtfMpp8jvlEl29DHI7HLVq-CxuqP1UHwxIbaUI,14567
@@ -774,12 +782,12 @@ sglang/srt/models/phi4mm_utils.py,sha256=bW3un4x3SHDvSkAOHQEFO286FGdOPeKhBpJCOmN
774
782
  sglang/srt/models/phimoe.py,sha256=EGaKFi02MZP20qFrILA4o2SJ0wb1HoJagFTSqVUbJcQ,19223
775
783
  sglang/srt/models/pixtral.py,sha256=ZkZrV0mEfmbBdgRko2AvsMFZbAVskgp_5a5p1xCSRN0,16835
776
784
  sglang/srt/models/qwen.py,sha256=j0OU3JjznWi_TbayI09yYGM-Obov6mQzJO82Hs0qBGw,11868
777
- sglang/srt/models/qwen2.py,sha256=TuKblSvilyVoq9en9e9YpwzLGkpDeOA6IWJELOYSzZA,22733
778
- sglang/srt/models/qwen2_5_vl.py,sha256=1FpowSDKjuxvPYppOybnMAAh8mgrWJTPJ8d3qjkbriA,22913
785
+ sglang/srt/models/qwen2.py,sha256=kHNZCtT0jnQXC2aJN7Bp1DzaEzKWuhUAGL3hAmt8OU8,23598
786
+ sglang/srt/models/qwen2_5_vl.py,sha256=NBoGulAvr2dKk6sfTJQ3NAOIFtBvncbLi_nsUOhnGuA,24084
779
787
  sglang/srt/models/qwen2_audio.py,sha256=SOOsspU7J6eM-iSkms5op0nWhoxJd6QxmwXU2aQBEEQ,7776
780
788
  sglang/srt/models/qwen2_classification.py,sha256=dGrMm4ebd30_lBhHOhaV57ig2iOTx3nqB4GEzsrRIM8,2747
781
789
  sglang/srt/models/qwen2_eagle.py,sha256=6spFg6JYQGeUXLv2Q5eMkVzZvnqGyvW6SdVBtFMxlTM,4806
782
- sglang/srt/models/qwen2_moe.py,sha256=lyaNhrUsmg6OyF9LAe4J1csQIWOTzNNihRkdjMEw8CE,25971
790
+ sglang/srt/models/qwen2_moe.py,sha256=0Na7Zy6ukQl6IPCzQajunP2GYySm_NWuqCD-fQdWWX0,26756
783
791
  sglang/srt/models/qwen2_rm.py,sha256=-mQXDEv11p-I1HXgYLTtY6ROem6UYorO958WsDrzsgs,2837
784
792
  sglang/srt/models/qwen2_vl.py,sha256=ZRAL32Ymt4ZCBqB0JorXAm4ZBrECZ9EbaXKaTSikkQM,21366
785
793
  sglang/srt/models/qwen3.py,sha256=xw-OsNRsC3nO5IR2OG7nSfupIiKQOxC_0VFQ4lKcbfc,19123
@@ -791,13 +799,13 @@ sglang/srt/models/siglip.py,sha256=DIVJRwdtpLD2QT1kVPIHw7Bn9BE40xJbkHujDNzkjgA,9
791
799
  sglang/srt/models/stablelm.py,sha256=0x_31uIr3WcWwecdPAI3ek9KkyKBJS7VwknTk2y0gjY,12281
792
800
  sglang/srt/models/step3_vl.py,sha256=joJmGukbGThLvwwbwrI4mCEVONH_U1dzFLWdpeJFoKo,35654
793
801
  sglang/srt/models/torch_native_llama.py,sha256=C1WpLn47q0l7IQa0k-Gvbs914FBcpKzqTIX-uvibq-w,18320
794
- sglang/srt/models/transformers.py,sha256=ChqRbUq5YD9oXnXwVP81XRoZmsKc44ouYDNgRsH6zmk,10249
802
+ sglang/srt/models/transformers.py,sha256=laA2h39MPeiAWKv4DEg0ydre-1pyXWFSRga-nwy1HUk,10244
795
803
  sglang/srt/models/vila.py,sha256=3NiRHWOqXnCRjXmswAldsNtiE5zRILbScEsbhUzLZF4,9846
796
804
  sglang/srt/models/xverse.py,sha256=DsNVI9JpzN4jj0Ry6aTrj7r-xq5YLOoDX2kH4YLJA-I,14035
797
805
  sglang/srt/models/xverse_moe.py,sha256=nBtG_PAK8wcp1tW2l2Zby2oEOmtWAYzH5COH-_N5IAM,17072
798
806
  sglang/srt/models/yivl.py,sha256=oToK7-u5IGO7xwpJIQ7VtudlK6-zPqJX4bt6_wv0SH8,4850
799
807
  sglang/srt/multimodal/mm_utils.py,sha256=6bV1_a7Iet9W0y3qdd0E-hFM78zalIzNZCYbLzJX2y8,12640
800
- sglang/srt/multimodal/processors/base_processor.py,sha256=ZLLNjSUaiDCujQQmGhIO8kHXAQT8Acux7CRR2Y-Yjik,24464
808
+ sglang/srt/multimodal/processors/base_processor.py,sha256=G25SF9bIyoQ13v7Qsb2ZDWTBq-BJ8Sa9okGZPPsS2TM,24518
801
809
  sglang/srt/multimodal/processors/clip.py,sha256=5nXZuQYbyf-5mlqPwjhQrlWqxvswImWZQXivChsiHfQ,1057
802
810
  sglang/srt/multimodal/processors/deepseek_vl_v2.py,sha256=Pymag9f0U5L_bBOTFs2q94BbuPJ-VwqSixs3meO0nsM,2569
803
811
  sglang/srt/multimodal/processors/gemma3.py,sha256=7aD6cR60iSC_MqjzdCDMAgtrb_cmy9YJyqLgVRClBT8,1986
@@ -822,13 +830,13 @@ sglang/srt/sampling/sampling_params.py,sha256=HbVcCeSXgPW19MRB-v0FTG1D-zHDAY6-to
822
830
  sglang/srt/sampling/penaltylib/__init__.py,sha256=mtN8grFEcaBUhl4yBHmw8NNirt_i6uKO2cDNLHOpZQE,496
823
831
  sglang/srt/sampling/penaltylib/frequency_penalty.py,sha256=Loc3qjJTksNc5s-DV7QZHjgqoo5pxk7-nZzxwyhD2tQ,2144
824
832
  sglang/srt/sampling/penaltylib/min_new_tokens.py,sha256=rdU_D7RoIcrQPhysNQEzmr4TO2OoEi___p-i3QdwkgU,3331
825
- sglang/srt/sampling/penaltylib/orchestrator.py,sha256=XM-Lm6u7gYPtMZrTIc0FR4QxNZxBH5s_Cj82umyCzYk,5721
833
+ sglang/srt/sampling/penaltylib/orchestrator.py,sha256=Romk41ahToaVlNMnnd1Enko7_kRA4KdMGO94qnEbDHA,6061
826
834
  sglang/srt/sampling/penaltylib/presence_penalty.py,sha256=NRh10AJrrQlGJ6S-enGdRefrTrWpyqrSm-aNnyqQNQQ,2119
827
835
  sglang/srt/speculative/build_eagle_tree.py,sha256=O9LJNaBflgJdWT94D-rGH1gJFJ18nst2oOD8HnA2mZ4,12859
828
836
  sglang/srt/speculative/eagle_draft_cuda_graph_runner.py,sha256=jOIQDXsZ_CbxiTXnJjKtzYfOpc7-67dWwCaNcrv1Ebc,13938
829
837
  sglang/srt/speculative/eagle_draft_extend_cuda_graph_runner.py,sha256=QuPI0S85KirTlJArLpJXpywv7XQLborDGLFYwLUBnwk,15459
830
838
  sglang/srt/speculative/eagle_utils.py,sha256=H-2aqm3REztUXLnmhi31ck3TWPPMVKc2CUkWBPsFK44,47785
831
- sglang/srt/speculative/eagle_worker.py,sha256=tvRV7JNvIeOFb3CTF756kRxQm8SZwfA7rCmm39feMiA,41451
839
+ sglang/srt/speculative/eagle_worker.py,sha256=7tjpKhFxColzlUZ-sONDYGMvto5uInzFxGBcj8IY6dM,42197
832
840
  sglang/srt/speculative/spec_info.py,sha256=rhaKG0TzyF9XZYHEWp1jccwTBohSNsUDvxHFtAoOl18,709
833
841
  sglang/srt/tokenizer/tiktoken_tokenizer.py,sha256=KJwr6Xlc7AdHegMTnAVKJlPpW59Z7AE27GTzFL78GwI,6222
834
842
  sglang/srt/weight_sync/tensor_bucket.py,sha256=vp_LRrhULNnxiw9Tf56FcEckgUg07lifgv1lasG6y7o,3695
@@ -852,7 +860,7 @@ sglang/test/test_block_fp8_deep_gemm_blackwell.py,sha256=Hnhq4kkyINHb4ONedkp5Kf7
852
860
  sglang/test/test_block_fp8_ep.py,sha256=n4X6ZKwuUUbV5Ofjg64ptlaFGI1LbRXDfFiJW1ELHgY,10546
853
861
  sglang/test/test_custom_ops.py,sha256=PenQ8zM1wj5xwiVEPVzD37pO-x90aOfFMpCRZenaKsY,5709
854
862
  sglang/test/test_cutlass_moe.py,sha256=ax-IYPm5tZjkZft0q8swHnzerOI4LB4JOLFaKGJVE-k,9629
855
- sglang/test/test_cutlass_w4a8_moe.py,sha256=E0ffQOR84bEFz6KFNbczH2LRhQqkeC9HPp76u0vzdwo,8809
863
+ sglang/test/test_cutlass_w4a8_moe.py,sha256=Ku9VCXEMJ3BwXtvb1A3FzY-zek-S-A4thWyX6m-1v-A,9219
856
864
  sglang/test/test_deepep_utils.py,sha256=749ysTBGNzh6rYUCJhhZBtZpeD15eWTeNHYCytcvZtc,7448
857
865
  sglang/test/test_dynamic_grad_mode.py,sha256=L76yUCuk_ymNpXD2CmO8r2GiGjIvD_gtTsuFDs2NolI,1638
858
866
  sglang/test/test_fp4_moe.py,sha256=rJLkKW3glBMvI5Ed0LltOHi8zCReMa-WB50p5zGm6J4,10189
@@ -865,9 +873,9 @@ sglang/test/attention/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3h
865
873
  sglang/test/attention/test_flashattn_backend.py,sha256=_rTG849FwQdVTyGKkqhczaOqngBmRWXFmkl5NnuK1GM,13914
866
874
  sglang/test/attention/test_flashattn_mla_backend.py,sha256=g4O50WblTpM7_Gq2b76k0i25_z01BOUBQ4i6PmyxpO4,10774
867
875
  sglang/test/attention/test_prefix_chunk_info.py,sha256=hpoDe2wfSa6RlUbfyri_c0iyBTb35UXGL9I2Xh6jamM,7772
868
- sglang/test/attention/test_trtllm_mla_backend.py,sha256=ilrX20-1hVo0nmKN0GTqzKoUmDarTXGS8nWJ6c8RHVY,41792
869
- sglang-0.5.1.post3.dist-info/licenses/LICENSE,sha256=FJXh51fvTQklojUFY89XVLsjxRcBqOxPs8XNy-2uZ0c,11346
870
- sglang-0.5.1.post3.dist-info/METADATA,sha256=5F018jFs9QId3jVlqacEYemDaNTGhkFtp_80TEVv_6I,28168
871
- sglang-0.5.1.post3.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
872
- sglang-0.5.1.post3.dist-info/top_level.txt,sha256=yxhh3pYQkcnA7v3Bg889C2jZhvtJdEincysO7PEB09M,7
873
- sglang-0.5.1.post3.dist-info/RECORD,,
876
+ sglang/test/attention/test_trtllm_mla_backend.py,sha256=quZ6SYuEH7J1YMcF8YO1_bwSNMz1gecpWRGauYjbUeA,42055
877
+ sglang-0.5.2rc1.dist-info/licenses/LICENSE,sha256=FJXh51fvTQklojUFY89XVLsjxRcBqOxPs8XNy-2uZ0c,11346
878
+ sglang-0.5.2rc1.dist-info/METADATA,sha256=mMYLEpjZJzf_6puNSLlKkwaPpNRJ9nJ7mAsmRgSvb3k,28151
879
+ sglang-0.5.2rc1.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
880
+ sglang-0.5.2rc1.dist-info/top_level.txt,sha256=yxhh3pYQkcnA7v3Bg889C2jZhvtJdEincysO7PEB09M,7
881
+ sglang-0.5.2rc1.dist-info/RECORD,,