sglang 0.4.6.post4__py3-none-any.whl → 0.4.6.post5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (130) hide show
  1. sglang/bench_offline_throughput.py +6 -6
  2. sglang/bench_one_batch.py +5 -4
  3. sglang/bench_one_batch_server.py +23 -15
  4. sglang/bench_serving.py +133 -57
  5. sglang/compile_deep_gemm.py +4 -4
  6. sglang/srt/configs/model_config.py +39 -28
  7. sglang/srt/conversation.py +1 -1
  8. sglang/srt/disaggregation/decode.py +122 -133
  9. sglang/srt/disaggregation/decode_schedule_batch_mixin.py +142 -0
  10. sglang/srt/disaggregation/fake/conn.py +3 -13
  11. sglang/srt/disaggregation/kv_events.py +357 -0
  12. sglang/srt/disaggregation/mini_lb.py +57 -24
  13. sglang/srt/disaggregation/mooncake/conn.py +11 -2
  14. sglang/srt/disaggregation/mooncake/transfer_engine.py +2 -1
  15. sglang/srt/disaggregation/nixl/conn.py +9 -19
  16. sglang/srt/disaggregation/prefill.py +126 -44
  17. sglang/srt/disaggregation/utils.py +116 -5
  18. sglang/srt/distributed/utils.py +3 -3
  19. sglang/srt/entrypoints/EngineBase.py +5 -0
  20. sglang/srt/entrypoints/engine.py +28 -8
  21. sglang/srt/entrypoints/http_server.py +6 -4
  22. sglang/srt/entrypoints/http_server_engine.py +5 -2
  23. sglang/srt/function_call/base_format_detector.py +250 -0
  24. sglang/srt/function_call/core_types.py +34 -0
  25. sglang/srt/function_call/deepseekv3_detector.py +157 -0
  26. sglang/srt/function_call/ebnf_composer.py +234 -0
  27. sglang/srt/function_call/function_call_parser.py +175 -0
  28. sglang/srt/function_call/llama32_detector.py +74 -0
  29. sglang/srt/function_call/mistral_detector.py +84 -0
  30. sglang/srt/function_call/pythonic_detector.py +163 -0
  31. sglang/srt/function_call/qwen25_detector.py +67 -0
  32. sglang/srt/function_call/utils.py +35 -0
  33. sglang/srt/hf_transformers_utils.py +46 -7
  34. sglang/srt/layers/attention/aiter_backend.py +513 -0
  35. sglang/srt/layers/attention/flashattention_backend.py +63 -17
  36. sglang/srt/layers/attention/flashinfer_mla_backend.py +8 -4
  37. sglang/srt/layers/attention/flashmla_backend.py +340 -78
  38. sglang/srt/layers/attention/triton_backend.py +3 -0
  39. sglang/srt/layers/attention/utils.py +2 -2
  40. sglang/srt/layers/attention/vision.py +1 -1
  41. sglang/srt/layers/communicator.py +451 -0
  42. sglang/srt/layers/dp_attention.py +0 -10
  43. sglang/srt/layers/moe/cutlass_moe.py +207 -0
  44. sglang/srt/layers/moe/ep_moe/kernels.py +33 -11
  45. sglang/srt/layers/moe/ep_moe/layer.py +104 -50
  46. sglang/srt/layers/moe/ep_moe/token_dispatcher.py +82 -7
  47. sglang/srt/layers/moe/fused_moe_triton/layer.py +14 -0
  48. sglang/srt/layers/moe/topk.py +66 -9
  49. sglang/srt/layers/multimodal.py +70 -0
  50. sglang/srt/layers/quantization/__init__.py +7 -2
  51. sglang/srt/layers/quantization/deep_gemm.py +5 -3
  52. sglang/srt/layers/quantization/fp8.py +90 -0
  53. sglang/srt/layers/quantization/fp8_utils.py +6 -0
  54. sglang/srt/layers/quantization/gptq.py +298 -6
  55. sglang/srt/layers/quantization/int8_kernel.py +18 -5
  56. sglang/srt/layers/quantization/qoq.py +244 -0
  57. sglang/srt/lora/lora_manager.py +1 -3
  58. sglang/srt/managers/deepseek_eplb.py +278 -0
  59. sglang/srt/managers/eplb_manager.py +55 -0
  60. sglang/srt/managers/expert_distribution.py +704 -56
  61. sglang/srt/managers/expert_location.py +394 -0
  62. sglang/srt/managers/expert_location_dispatch.py +91 -0
  63. sglang/srt/managers/io_struct.py +16 -3
  64. sglang/srt/managers/mm_utils.py +293 -139
  65. sglang/srt/managers/multimodal_processors/base_processor.py +127 -42
  66. sglang/srt/managers/multimodal_processors/deepseek_vl_v2.py +6 -1
  67. sglang/srt/managers/multimodal_processors/gemma3.py +31 -6
  68. sglang/srt/managers/multimodal_processors/internvl.py +14 -5
  69. sglang/srt/managers/multimodal_processors/janus_pro.py +7 -1
  70. sglang/srt/managers/multimodal_processors/kimi_vl.py +7 -6
  71. sglang/srt/managers/multimodal_processors/llava.py +3 -3
  72. sglang/srt/managers/multimodal_processors/minicpm.py +25 -31
  73. sglang/srt/managers/multimodal_processors/mllama4.py +6 -0
  74. sglang/srt/managers/multimodal_processors/pixtral.py +9 -9
  75. sglang/srt/managers/multimodal_processors/qwen_vl.py +58 -16
  76. sglang/srt/managers/schedule_batch.py +49 -21
  77. sglang/srt/managers/schedule_policy.py +4 -5
  78. sglang/srt/managers/scheduler.py +92 -50
  79. sglang/srt/managers/session_controller.py +1 -1
  80. sglang/srt/managers/tokenizer_manager.py +99 -24
  81. sglang/srt/mem_cache/base_prefix_cache.py +3 -0
  82. sglang/srt/mem_cache/chunk_cache.py +3 -1
  83. sglang/srt/mem_cache/hiradix_cache.py +4 -4
  84. sglang/srt/mem_cache/memory_pool.py +74 -52
  85. sglang/srt/mem_cache/multimodal_cache.py +45 -0
  86. sglang/srt/mem_cache/radix_cache.py +58 -5
  87. sglang/srt/metrics/collector.py +2 -2
  88. sglang/srt/mm_utils.py +10 -0
  89. sglang/srt/model_executor/cuda_graph_runner.py +20 -9
  90. sglang/srt/model_executor/expert_location_updater.py +422 -0
  91. sglang/srt/model_executor/forward_batch_info.py +4 -0
  92. sglang/srt/model_executor/model_runner.py +144 -54
  93. sglang/srt/model_loader/loader.py +10 -6
  94. sglang/srt/models/clip.py +5 -1
  95. sglang/srt/models/deepseek_v2.py +297 -343
  96. sglang/srt/models/exaone.py +8 -3
  97. sglang/srt/models/gemma3_mm.py +70 -33
  98. sglang/srt/models/llama4.py +10 -2
  99. sglang/srt/models/llava.py +26 -18
  100. sglang/srt/models/mimo_mtp.py +220 -0
  101. sglang/srt/models/minicpmo.py +5 -12
  102. sglang/srt/models/mistral.py +71 -1
  103. sglang/srt/models/mllama.py +3 -3
  104. sglang/srt/models/qwen2.py +95 -26
  105. sglang/srt/models/qwen2_5_vl.py +8 -0
  106. sglang/srt/models/qwen2_moe.py +330 -60
  107. sglang/srt/models/qwen2_vl.py +6 -0
  108. sglang/srt/models/qwen3.py +52 -10
  109. sglang/srt/models/qwen3_moe.py +411 -48
  110. sglang/srt/models/siglip.py +294 -0
  111. sglang/srt/openai_api/adapter.py +28 -16
  112. sglang/srt/openai_api/protocol.py +6 -0
  113. sglang/srt/operations.py +154 -0
  114. sglang/srt/operations_strategy.py +31 -0
  115. sglang/srt/server_args.py +134 -24
  116. sglang/srt/speculative/eagle_utils.py +131 -0
  117. sglang/srt/speculative/eagle_worker.py +47 -2
  118. sglang/srt/utils.py +68 -12
  119. sglang/test/test_cutlass_moe.py +278 -0
  120. sglang/test/test_utils.py +2 -36
  121. sglang/utils.py +2 -2
  122. sglang/version.py +1 -1
  123. {sglang-0.4.6.post4.dist-info → sglang-0.4.6.post5.dist-info}/METADATA +20 -11
  124. {sglang-0.4.6.post4.dist-info → sglang-0.4.6.post5.dist-info}/RECORD +128 -102
  125. {sglang-0.4.6.post4.dist-info → sglang-0.4.6.post5.dist-info}/WHEEL +1 -1
  126. sglang/srt/function_call_parser.py +0 -858
  127. sglang/srt/platforms/interface.py +0 -371
  128. /sglang/srt/models/{xiaomi_mimo.py → mimo.py} +0 -0
  129. {sglang-0.4.6.post4.dist-info → sglang-0.4.6.post5.dist-info}/licenses/LICENSE +0 -0
  130. {sglang-0.4.6.post4.dist-info → sglang-0.4.6.post5.dist-info}/top_level.txt +0 -0
@@ -1,15 +1,15 @@
1
1
  sglang/__init__.py,sha256=T-fZEjKP66Q1q3PB56oREs5U3zf6bL0fNcdIbW8jMhE,1652
2
2
  sglang/api.py,sha256=vHiKBg8wwIdmrpnGclop5BzJ-1Q88emrlrfLwNCHg98,7010
3
- sglang/bench_offline_throughput.py,sha256=G1lLm5F-ZE9HCb7tBi7GqhlZaDelgG4or4HgUSAD0sE,13877
4
- sglang/bench_one_batch.py,sha256=4XysFhY3fbJmVXVaIAvwb0dx5TYTtO8ONAAzTFT-ixQ,19222
5
- sglang/bench_one_batch_server.py,sha256=XJNBXYEuhU3vuSXJ2BRDAwlSPUmnC-gLCCJ1FSpuC9A,10894
6
- sglang/bench_serving.py,sha256=JkPLvFxCax5EKw-0DSoGxuFte2loApCIW7fGI_MuWsI,62931
3
+ sglang/bench_offline_throughput.py,sha256=j-h1Bk7zkI74EgFahfJnxe6aWtpdgKDfiN7qKmNN-0w,13895
4
+ sglang/bench_one_batch.py,sha256=fCxRRk14uQqTxpriBkrUkvrOUjNT7TZgDeGGWJQzhgw,19328
5
+ sglang/bench_one_batch_server.py,sha256=qFgN7tZwX4tK7KJeInrPvEtgF8DCQhTWr_l4jW0zH8w,11201
6
+ sglang/bench_serving.py,sha256=BdCY8iT5jM0s0T4DO8WmZaRyd2vKncALRx26Ptx3Yd0,64974
7
7
  sglang/check_env.py,sha256=qDMIG2rCNBH1yKnxQmF-Bp10oiFMUKMgfZLHZYOmdSY,8412
8
- sglang/compile_deep_gemm.py,sha256=XaKt2M4BMSiV8gx3ERzX5YwwEoE7suvUqgoi_wYlNpQ,6211
8
+ sglang/compile_deep_gemm.py,sha256=H118s76CKdpZr-cDeFfBCePe7--c_teEBNVIzchYVSo,6243
9
9
  sglang/global_config.py,sha256=xzLdk8W53fneFblNh8iIjGF9C3-7mnzR1-LleD9Btxg,1495
10
10
  sglang/launch_server.py,sha256=mDXfwha8LHpWQJekcCosR98QhCQsbmilsBlI5jAIgg0,420
11
- sglang/utils.py,sha256=6Zpzw96ZDrZcBAI-OFmWtKvXcLBVLiHok0B42pK3kKs,16160
12
- sglang/version.py,sha256=Rr2NlJlI5ama66BpRjzDUs7DOzgB59i8o_MYW0YO2X8,28
11
+ sglang/utils.py,sha256=LJQksRakIH624rHwOfe9j91g1HzSOEiF0kymUGwMXu8,16176
12
+ sglang/version.py,sha256=B_ux4x0ePtuRu-TrL0kt2lDB2SlCBrlbrPC2KwVy6DY,28
13
13
  sglang/eval/llama3_eval.py,sha256=gWSboDchIGybIce88bJlrCG0yiLZ513mw4gcutJlzGM,10017
14
14
  sglang/eval/loogle_eval.py,sha256=pRPVA4fxGmT3_oXvXnlNE-UlPrcQGLBJF-OSE9YWJXM,4336
15
15
  sglang/lang/chat_template.py,sha256=HKlx7snSWFED8GKF5ex79sQrPWFw5TSXQM0_LsiD9Bc,20552
@@ -28,17 +28,18 @@ sglang/lang/backend/vertexai.py,sha256=gz0uNYyBb88jbPYz6ZIJ774fefrcbuVdoK33bphUZ
28
28
  sglang/srt/_custom_ops.py,sha256=L7NuEaRD_Q6Q54n0NZnLXgWZURbnn8Tkg4NQedE6zgA,3616
29
29
  sglang/srt/aio_rwlock.py,sha256=6LYtOdeTUY3hkfa1dmYkgsaF2ttrwIF3hUWz2AZ2fqw,2970
30
30
  sglang/srt/code_completion_parser.py,sha256=vafJqdTTreD9kvCsoMuxP_fFmoue7pOA1ibI9KXg4mE,5405
31
- sglang/srt/conversation.py,sha256=569K5QEjnZGF45GjFGVZfP1n8RqmpcwxuVbgWRNFyis,35295
31
+ sglang/srt/conversation.py,sha256=q2qX5plROHDwZYKDHhB4Cp1_xNQjolISaHCn1zdohIk,35297
32
32
  sglang/srt/custom_op.py,sha256=J1PUcGaeJJjfAjp06BQsLpUkKyR1zsh9MvDiDlqqJsg,1129
33
- sglang/srt/function_call_parser.py,sha256=W3ZBbYP1Eg5z70sc1-HVhT_b1TJg5oxZDuGOppgMrA8,33378
34
- sglang/srt/hf_transformers_utils.py,sha256=97J396flSaelvOIn0zO8Ji3bvFWUiL2mhLgxnup-d-M,10054
35
- sglang/srt/mm_utils.py,sha256=1ScBunw_x4W8ebM_AcJ62-1T2mfT8NlMJqdAhkF1lb0,12367
33
+ sglang/srt/hf_transformers_utils.py,sha256=NmsiIL2KvmPLX3QQYv4SuH5TM-WVB4En8WI-KUEWf7U,11733
34
+ sglang/srt/mm_utils.py,sha256=7o4w1W0VAWgEquVIz7qw7-IxYbZY2g3MrXw9php90oY,12621
36
35
  sglang/srt/model_parallel.py,sha256=eLXZhvJ4wG6dh0FontNCIdVZvHYdWgaeY-5cu7TD9tE,6078
36
+ sglang/srt/operations.py,sha256=LMxv7ZW5sFj4qGya3xmV_8uL95hUc0CjpMxEhWOgZsU,4252
37
+ sglang/srt/operations_strategy.py,sha256=_ml_3xdu6ytebCJ96an26Ys3mmLnlPETaXkUenpX6Kw,800
37
38
  sglang/srt/patch_torch.py,sha256=OUPCGQSQz3MVZB1zZ_Eq8lXiw0uIKJ_HWjqQolI8FsM,3088
38
39
  sglang/srt/reasoning_parser.py,sha256=lZN5b1TJp3EK2GzxcICQhp0tRQjQw3ROOrjRgQe6Bsc,6341
39
- sglang/srt/server_args.py,sha256=gW3mDnnRqrtpZTZOmjeWPfdnDNr070tSpUMrl7Qlc_Y,59525
40
+ sglang/srt/server_args.py,sha256=YRr8CxIQAAiWxIDVxjTmXDyPxOvehSof9ylCd62Qix4,64106
40
41
  sglang/srt/torch_memory_saver_adapter.py,sha256=HYlgYJ2sgmjs2RSjU2KbCaXijRg3mTDZ0ZcCB5Bt6Ps,2211
41
- sglang/srt/utils.py,sha256=8xEOCR2aw4InlcwrdIN9EFfR-1FU26T_VylU5FQJ4-s,66467
42
+ sglang/srt/utils.py,sha256=ttLnrJ69dyppmRx8bIHrL4c6u9KY-xc_hj2kvjcRLk8,67598
42
43
  sglang/srt/warmup.py,sha256=FmJiYfjRr3X_eAe7ojQaPoN17LvHpjDmRWRnO-k86AQ,1469
43
44
  sglang/srt/configs/__init__.py,sha256=8EcVRP95epZ49DxBa6LgKWt7eO3Qe7Hrr3V1c6HkMnY,553
44
45
  sglang/srt/configs/chatglm.py,sha256=j-b0YkdYUmQm2y1kNmMJtKeACxWKmBbvNNkDWbs6kbI,2907
@@ -51,7 +52,7 @@ sglang/srt/configs/janus_pro.py,sha256=Rrb7kQsNaUP-TiZrjNk8Lr1momFrql8ScEunnrH0_
51
52
  sglang/srt/configs/kimi_vl.py,sha256=4W7VQI3pr888ZsFA2SqCQo4mI0seXTOrGQ-x3oTvWew,1358
52
53
  sglang/srt/configs/kimi_vl_moonvit.py,sha256=hx2Rt4JSFbvy2HUTeLjBpge87m8M6ITAhqsgdNf_Jd4,1163
53
54
  sglang/srt/configs/load_config.py,sha256=qs-AxuplouBx2tsv9KGBOLZPbwzuVA4vbktbGP_cRp8,3309
54
- sglang/srt/configs/model_config.py,sha256=MONwgieC5BZ2fPq31a-xTTx-RzPu1OGUBaEkcpdFkjU,23896
55
+ sglang/srt/configs/model_config.py,sha256=7qXt85m6dDp9qouFRSIN7mc0mWTTvOMNL5BgVYi1bUU,23843
55
56
  sglang/srt/configs/utils.py,sha256=3nHUfisMs_Ltuhv8OZTNCJp63YJKJVF43h1QZB1zqx8,670
56
57
  sglang/srt/connector/__init__.py,sha256=czLX5JOxuMhH-T9eSJzoc1qv1B4z9chyffDRL5I6wo4,1247
57
58
  sglang/srt/connector/base_connector.py,sha256=i6i1TIzsz4NbSEkrdMPq-urb2sN2aLAx8dazga4gB9U,2833
@@ -68,23 +69,25 @@ sglang/srt/constrained/outlines_jump_forward.py,sha256=Gyubp-FVetxd6wP4FA_kD6cCX
68
69
  sglang/srt/constrained/reasoner_grammar_backend.py,sha256=YFxWuOTTo4e6cGhxnaBwuwli6f8FTUJtszib8dBq_8I,3207
69
70
  sglang/srt/constrained/xgrammar_backend.py,sha256=FKWrMb1QSgtCTCyk6pQZ5NS-5T3M6dvdxN7OOPCYc8A,7837
70
71
  sglang/srt/constrained/triton_ops/bitmask_ops.py,sha256=WjTen9iuuFWLzkE1mAHQZB9_7aIy5QH8Wjf-lB-Fams,4614
71
- sglang/srt/disaggregation/decode.py,sha256=WDaXASJn2cp35r6ySPDdm5oXXg-3kR714CXX5xG28fY,25378
72
- sglang/srt/disaggregation/mini_lb.py,sha256=SROT_-_OdZSD3R7ar2g90vL5WX5Ijc-K99zz7ewWD7w,12389
73
- sglang/srt/disaggregation/prefill.py,sha256=Sf8wRv7BDBv0QQTahXR5wMTCiqOddhymx7L7vQbswXE,15527
74
- sglang/srt/disaggregation/utils.py,sha256=W3Fe_MwJrSxHC1eMZRkD7C09VWFKRwfoM9_XXY-n2s0,5054
72
+ sglang/srt/disaggregation/decode.py,sha256=SpKHH8xdG1_5XAgrd9YxOFVErmkp7e8gbRTCrsVYTys,25011
73
+ sglang/srt/disaggregation/decode_schedule_batch_mixin.py,sha256=cUfd3-5lRHqWpwkrj4xdGMV2Hus08hdQbobTLNoCXlo,5569
74
+ sglang/srt/disaggregation/kv_events.py,sha256=SSB0zMeAwU2enA2YoEbWYdwUC3TJqEBo_V9SjqrmZHY,11380
75
+ sglang/srt/disaggregation/mini_lb.py,sha256=r7oT02JtktxngiAA-uiW35EwUemBFRLqLrUsPZbQipg,14011
76
+ sglang/srt/disaggregation/prefill.py,sha256=M9sbLsHjVgJC6YRyGnQUfL7AZvviyot2d_aXSzc95nI,19591
77
+ sglang/srt/disaggregation/utils.py,sha256=vl5wY3wN6_4YAZ_8mH7EF-pop6EJJfrPVBCiFm2xCHU,9487
75
78
  sglang/srt/disaggregation/base/__init__.py,sha256=KR8xXoRCDAy2U623mfP6ujXu42m1_F9EiudjrKu2I_A,130
76
79
  sglang/srt/disaggregation/base/conn.py,sha256=hEOuR6kXrc7fRSYE9RAH53DLGHGaCcYWod6IkmtNttg,2491
77
80
  sglang/srt/disaggregation/fake/__init__.py,sha256=zmfeKYXjonRhfFOck1c_mP7Q4cW5G0f1RsTwRivKu0s,47
78
- sglang/srt/disaggregation/fake/conn.py,sha256=N9y0ZBhfPkrhaKN3gsRxqb2wWpiioaANtFqO9wVl2Ec,2553
81
+ sglang/srt/disaggregation/fake/conn.py,sha256=BzxFGjU87RgOeM_eV5S06RlB78DclpcYPlOAbcZKU2Y,2168
79
82
  sglang/srt/disaggregation/mooncake/__init__.py,sha256=1vacEHmWjf7zgbMPzsXKB08FqNKNCquJdUiDlO41BOk,122
80
- sglang/srt/disaggregation/mooncake/conn.py,sha256=MF2N1FbBdI5mh5Btl6gkX6Dw8MqjKPMVe9NvwdspEdY,33652
81
- sglang/srt/disaggregation/mooncake/transfer_engine.py,sha256=MxDAB9ZetRF1pFS2LP3FVHPtQ1HjIt_SK3UMaYHZ94o,2604
83
+ sglang/srt/disaggregation/mooncake/conn.py,sha256=31JWY7-xPqfQOsopP-3i8V8OUhwQP3OCOpQhYo239lk,33928
84
+ sglang/srt/disaggregation/mooncake/transfer_engine.py,sha256=jsSn7PzPcC4OPHJU6BuUJBaiaatgiqZ5Ra25J_ATTmw,2789
82
85
  sglang/srt/disaggregation/nixl/__init__.py,sha256=n9HjrRk36WUcZNeetGWOh2pSriLp7GNTq7YYX9K3EtY,85
83
- sglang/srt/disaggregation/nixl/conn.py,sha256=ekYUmS2c9TnkFrzS1DYGXZG-Yrb5WbMIL6gnQHAxG8M,30104
86
+ sglang/srt/disaggregation/nixl/conn.py,sha256=y67X1IutrzdqPYPzH9RUJ9vrTcIkOD1xk_PZWzJGIjM,29768
84
87
  sglang/srt/distributed/__init__.py,sha256=jFOcyt-wFAPMBUAf9zkZalNQlt-4rqmT6pCKBz1E4qo,149
85
88
  sglang/srt/distributed/communication_op.py,sha256=IBnFUdMftK_VSTMMMitGveonorFUUVNL4guqO31cMSc,1130
86
89
  sglang/srt/distributed/parallel_state.py,sha256=cCQq94H8A-rO2wZf_bCf1lkwcTVOBrHubM9K1PrzVSY,51560
87
- sglang/srt/distributed/utils.py,sha256=U-BSaXYjWwnfG8g-tUfBhjKt5Ug097nyHtu3g3aea_Y,8473
90
+ sglang/srt/distributed/utils.py,sha256=aaCxATncLGnVgB0WlGpBdee0behKW8Dy_dakqcuKSaQ,8497
88
91
  sglang/srt/distributed/device_communicators/cuda_wrapper.py,sha256=3jvPG-Ow5UBLiXhfx8T8snR7crSZbPpARAggsDPWq7k,7038
89
92
  sglang/srt/distributed/device_communicators/custom_all_reduce.py,sha256=qje-PQ3v8yaV-oYVLPws1mgIlXVsGKFCOvXHmSe8ZXg,19624
90
93
  sglang/srt/distributed/device_communicators/custom_all_reduce_utils.py,sha256=fLoptT_U0lVAqkhEg-ge53CdFSIKQpDRiqHYKwJVEZg,10974
@@ -94,17 +97,29 @@ sglang/srt/distributed/device_communicators/pynccl.py,sha256=obXyCaZznZHSt486XCn
94
97
  sglang/srt/distributed/device_communicators/pynccl_wrapper.py,sha256=LblisImY9d6EMz-oPS9J16WHo2Q_SRL1DtlJKK63Hfg,15349
95
98
  sglang/srt/distributed/device_communicators/shm_broadcast.py,sha256=d8mykYmXM1lfbPm8GNtqCF0Un_pdXYjbNmsgoVFyyow,20874
96
99
  sglang/srt/distributed/device_communicators/xpu_communicator.py,sha256=ajW6132BvA6jkeipEIgN27TFycI0U06Ih2Z8WNjlA4s,1593
97
- sglang/srt/entrypoints/EngineBase.py,sha256=xoyvp6XAeDLY2_Q2Ng33H-fRhrXHv2ldJJKd-HuDhqE,1870
98
- sglang/srt/entrypoints/engine.py,sha256=0L0jis9GLehFgkYP9cBBw7-Plg7e_quCF5OiX82O8io,24704
99
- sglang/srt/entrypoints/http_server.py,sha256=xH-iXPx9wg2VqHW9dFxDAyIwcdBMAsUboK7MH4SR-5E,31003
100
- sglang/srt/entrypoints/http_server_engine.py,sha256=ihA6y3GXRs28Y9U3SgdQcJQjnw_SVIby7QrVgiafX04,4846
100
+ sglang/srt/entrypoints/EngineBase.py,sha256=6e7XecqeGAv29aiqCJyGsWYV8LwBNZN-lSxnUj9E_lw,1976
101
+ sglang/srt/entrypoints/engine.py,sha256=UEpN507ZGyOn1Mpi5PNk02vk0D8gieYF16EivfBC-FE,25360
102
+ sglang/srt/entrypoints/http_server.py,sha256=noIHojetylEVOQIoykHHondGlUyJUB4TQ7ZZvTK0TX8,31174
103
+ sglang/srt/entrypoints/http_server_engine.py,sha256=0QJFmrKAVnBmFbObHrmvUDcxDAsvnv6H29cQq286CKc,4939
101
104
  sglang/srt/entrypoints/verl_engine.py,sha256=RYizNetTHzcB8dErX1EW4NsyRNGkFPljYaAf7pVRPdM,7002
105
+ sglang/srt/function_call/base_format_detector.py,sha256=76maa_oIMxLpnLGjcwXwVW6eFchVv4jIEFSCt0jDhxU,9842
106
+ sglang/srt/function_call/core_types.py,sha256=wLUsW8mUA-i-ISz5QUDL7Ejq72W-K1HIhFa9Wm-_oA8,786
107
+ sglang/srt/function_call/deepseekv3_detector.py,sha256=oDP5LNNcAHohGQjxFJoOJjx-karkOB7Y0VrYjUOAp0E,6636
108
+ sglang/srt/function_call/ebnf_composer.py,sha256=HuRg_sswglmgSF7GRZahKIku9ANH4MtAVRrBvoK5uuM,9788
109
+ sglang/srt/function_call/function_call_parser.py,sha256=X49mDuMD_9i8WqxzCFCwCbg0CLPmG_PAbDBT9se-mFo,6662
110
+ sglang/srt/function_call/llama32_detector.py,sha256=rWxtQ__guJOim_-E-RLOiykNuQGKB6wv-q2HpKugdeY,2660
111
+ sglang/srt/function_call/mistral_detector.py,sha256=jBK06utqq8u2OI7o3UiTINlBzk3KH6GxI0ouEtxFcP0,3342
112
+ sglang/srt/function_call/pythonic_detector.py,sha256=VD9eMGMZs3KkG3MMOlVDCusus8R7iDPKs6FvkMuMcdo,5953
113
+ sglang/srt/function_call/qwen25_detector.py,sha256=v1uLOzfH7N-WtXcanYpMuS2ZpiMfEUJSteql9mVDbfM,2380
114
+ sglang/srt/function_call/utils.py,sha256=iu4GWtIfcHv3vXZXkiPVsV1L7Hg-6BofBW2MTr8EEQM,891
102
115
  sglang/srt/layers/activation.py,sha256=oSkdo8B8najXFcVay3Y__CEvgXh87lAIhG0CMp2Ugqs,5954
103
- sglang/srt/layers/dp_attention.py,sha256=MwqjY3uOg4dKjFxTyNlWnnHaA0oLL3oUkapfh0qs1IE,9438
116
+ sglang/srt/layers/communicator.py,sha256=pMateRTOfpub6zFWZnpdgGtBIwclZM7AX4Dwzbp0h9Y,16301
117
+ sglang/srt/layers/dp_attention.py,sha256=W8aPfuYXAXHGVccJVTk11871ixoDy67f3yqyd3MvFm0,9150
104
118
  sglang/srt/layers/elementwise.py,sha256=XCrR2i-9dP-H6jQo2zUuquwZrsl_wEQqj5Wxk6WUf7o,13987
105
119
  sglang/srt/layers/layernorm.py,sha256=kU47PX_V46RblaxxMNxWxGjWSa99o0w2s68908rGp6Q,5957
106
120
  sglang/srt/layers/linear.py,sha256=nC9MxJrFap1BEyqgFlBySH4IeQruIbcBp32cOhUl5Fw,52149
107
121
  sglang/srt/layers/logits_processor.py,sha256=eeG2zXZguvz2r1OVKVd5HFSPseL5fzRenh0cYuKO-GQ,25557
122
+ sglang/srt/layers/multimodal.py,sha256=Hsqrz4dyNH4GgkpzOxtuzPIDnxmtsj5ox0qcC4S2iio,2078
108
123
  sglang/srt/layers/parameter.py,sha256=zqWyEzpWzP4NNTjq3G9khq6XofgpcmJqQLg6Vd4WyWE,15084
109
124
  sglang/srt/layers/pooler.py,sha256=nR9F4x0GP2KYkJihhcL-TX30gfLY3mVhOLRfeBDeKL4,1942
110
125
  sglang/srt/layers/radix_attention.py,sha256=F71GgDes_fEt_cHxR9HM2QhNG5u7uF4zDAuLqwLYEV4,3481
@@ -113,34 +128,36 @@ sglang/srt/layers/sampler.py,sha256=JmzceFPgl3vjaf9VQA3OPEW52tRZ_njrOxpGdZ35LP0,
113
128
  sglang/srt/layers/torchao_utils.py,sha256=Ws24FdRBSkTpyeyA6bQrdDm-W5wfDxKvSIPUSahyMfA,4063
114
129
  sglang/srt/layers/utils.py,sha256=tkTz86DFZ4NRMEUc4QkYNskUskdxXoEqkWqaMGbhP7E,1045
115
130
  sglang/srt/layers/vocab_parallel_embedding.py,sha256=GPKCQiR2yH5Z2XSE9g3vWObdegcwPnMHXv7qEZovLH4,22755
131
+ sglang/srt/layers/attention/aiter_backend.py,sha256=xMTZ1J0OOMgvMaULrLHDMLUJaVUGAFm-OhAACVlGaYU,17893
116
132
  sglang/srt/layers/attention/base_attn_backend.py,sha256=lGujcYJ_CxHJy0Q9L6Phn3ds-nBGMy0OGj3R54R65iQ,3334
117
133
  sglang/srt/layers/attention/cutlass_mla_backend.py,sha256=kCNn5Ub0jCsFjhVhuE-9qK53gu5a9oMStMeT2lcc6CU,9904
118
134
  sglang/srt/layers/attention/double_sparsity_backend.py,sha256=2ZRL_gYz14idoVqQzeQ6N77nXer0f_8_TUYw40XUUz0,9161
119
- sglang/srt/layers/attention/flashattention_backend.py,sha256=o9ggOpIAhmLzxRfVg8mjLM_x6vesOb5f6MayVZe0UJU,87868
135
+ sglang/srt/layers/attention/flashattention_backend.py,sha256=MuaEkGVuUfH50IeEqvwrVVl_2MSotnsSQ_UVxypkVm0,89610
120
136
  sglang/srt/layers/attention/flashinfer_backend.py,sha256=53TXhmBpU5rs04-4u-yXclwJ5UYg7WJfyLDZJ8nSDOU,47651
121
- sglang/srt/layers/attention/flashinfer_mla_backend.py,sha256=4BJy18GHYiNVjcSkvmzxgoSk8nugsLrZuars_m-4oYw,32406
122
- sglang/srt/layers/attention/flashmla_backend.py,sha256=wR0bkLz3mj5EfuHEi9fwEP2vtq6xFhsrIijpFb009o4,10340
137
+ sglang/srt/layers/attention/flashinfer_mla_backend.py,sha256=DPVgahpGzd69HmtSyjPHusEub6RPYCZq8jzcuadAfHk,32468
138
+ sglang/srt/layers/attention/flashmla_backend.py,sha256=rOFJFTPOP0PMkD0z1J6MduJsYCRHpoHikgPtviL-iRU,20962
123
139
  sglang/srt/layers/attention/merge_state.py,sha256=OnWmNV6LYTUj0y8SCy_IK7A9q6v9bZwR4_XiLOIvbrk,1423
124
140
  sglang/srt/layers/attention/torch_native_backend.py,sha256=K5hUqBgakk2COSQqsaxWs0yEVOHS-7BlOygZTOeI8kE,9444
125
- sglang/srt/layers/attention/triton_backend.py,sha256=oEEiUwHbm4rNw5ExbQ2c3n0TwAgkk77yuLFenj9bHOo,26902
126
- sglang/srt/layers/attention/utils.py,sha256=3NyDQ2T2IHwFb5mAJzbpyxRYmdkB8htM3_9_U5GqQDY,2889
127
- sglang/srt/layers/attention/vision.py,sha256=TOTRWzd5d_9fCR8DOvy_oY-vJ1zl2cVYni5hlZGDens,15355
141
+ sglang/srt/layers/attention/triton_backend.py,sha256=GH7EnR3caPrQQRyhSq15K1CRYC1wQ4kiDPHyS5gakqs,27093
142
+ sglang/srt/layers/attention/utils.py,sha256=KiRSIHaGBhErUhPWCSD3Uiaqb0pSEF0NJFwTTQXoMks,2887
143
+ sglang/srt/layers/attention/vision.py,sha256=rnfGrQPOQjSu3JV-rtdheQcR7jsvAF9P0-t5C9Nzudg,15358
128
144
  sglang/srt/layers/attention/triton_ops/decode_attention.py,sha256=DPu_aCPgwPqKWZPEQmp_xA7MPbpV2ip-MEICCB470Ao,19120
129
145
  sglang/srt/layers/attention/triton_ops/double_sparsity_attention.py,sha256=FbgrPO5GvEGEvojV7Ss0jX7384e9vuzX2goDCQuP1Zk,31124
130
146
  sglang/srt/layers/attention/triton_ops/extend_attention.py,sha256=m12jEnQkNJguATqvZ57HtMC2hhU4wqdB8xAYdh25BxE,13922
131
147
  sglang/srt/layers/attention/triton_ops/merge_state.py,sha256=v9nD01a5eTnkwZxMwERtrrRfC5rs6GxkYOpErkAPcYI,2877
132
148
  sglang/srt/layers/attention/triton_ops/prefill_attention.py,sha256=waZsmpKIp8rTgFSoM4QMabJuLaB3yW6ltOzAKJksBoE,6260
133
149
  sglang/srt/layers/attention/triton_ops/rocm_mla_decode_rope.py,sha256=664WnAJ91EiCUZOcnVDfbTQf4uGJ4ZDZB1CbxpEUFZc,13866
150
+ sglang/srt/layers/moe/cutlass_moe.py,sha256=rDDfx1Pzr0fILJQajid2DHuXQI6K8SToEbxM95nsW9Y,8565
134
151
  sglang/srt/layers/moe/fused_moe_native.py,sha256=U0qh3udHuJJll3udydqABoXPFz0au9aEj8Lv7OAHYvQ,4655
135
152
  sglang/srt/layers/moe/router.py,sha256=5Aeqoix_AS4uymb665OJE904wVSBkQeFdZP4e7KKPvg,10530
136
- sglang/srt/layers/moe/topk.py,sha256=ir3CXINtE2xeLJDh9S3PlxikRC0e4AIxb-lEQqttnBk,11127
153
+ sglang/srt/layers/moe/topk.py,sha256=4LROSaYWkYY7PP5uMPInu8LzT42LkwyAA5lB6c7dntU,14210
137
154
  sglang/srt/layers/moe/ep_moe/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
138
- sglang/srt/layers/moe/ep_moe/kernels.py,sha256=tj2yIWdgn3zaz9uuhsm6qx4syaX_t-zpYPLKotCX89k,33547
139
- sglang/srt/layers/moe/ep_moe/layer.py,sha256=TPBcD9_To_sQhayur9nbQNRn8AYTCO3gXtytKHfUkGM,40349
140
- sglang/srt/layers/moe/ep_moe/token_dispatcher.py,sha256=y-t3qG0GS9r8GLTe6_-5BV43Sp5BPHIoveDlYFGIt7s,22051
155
+ sglang/srt/layers/moe/ep_moe/kernels.py,sha256=-CXEAlgsWJEToxn2qmOPkm4m0opI7qhMCWACid1C0Xo,34206
156
+ sglang/srt/layers/moe/ep_moe/layer.py,sha256=Kg0PGNzVW_Ah_nLaNh7anooZ_uowV3Cj81l2f6fsk80,42259
157
+ sglang/srt/layers/moe/ep_moe/token_dispatcher.py,sha256=zpbTtxcMZcRjx0ILd3EQ0H3zSEm9NbatZbAa6NdYOVY,24761
141
158
  sglang/srt/layers/moe/fused_moe_triton/__init__.py,sha256=h9yMFAL_bagUf-qBED8gSWdCOb7d8IdA-pE-L_nIg8E,842
142
159
  sglang/srt/layers/moe/fused_moe_triton/fused_moe.py,sha256=mNFBkSB9n1axyLAs9dsIwdAj7L5w9ZFEEDsxOL6XPPE,55996
143
- sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=BMOV76fabrZcoyDmRpRbH11Jc0ogWH2k2QAQwvZIpgI,25084
160
+ sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=BoBiYHtUNOIvvXvqtWjHmx9i10SNbULi7l11YO9gHcs,25706
144
161
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json",sha256=iNGsE2ZeVnQEnN4A8UJ9Jv0d3hbRF2MJ9oBgjup5Szk,2737
145
162
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB.json",sha256=JJN0hryyLr5Zv3dSS7C8cPFhAwTT6XxUVnBGMZvV6JA,2752
146
163
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=1,N=1792,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json",sha256=ouRyZ5PEMPP2njPftCNhs-1g1y6wueWLmhI7G1SjV1k,4131
@@ -294,20 +311,21 @@ sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=BMOV76fabrZcoyDmRpRbH11Jc
294
311
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=8,N=8192,device_name=AMD_Radeon_Graphics,dtype=fp8_w8a8.json",sha256=-RzUWSIAAsg6iA-8SPMa68hPpBVoUyMJs3dLP7edRu0,4323
295
312
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=8,N=8192,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json",sha256=sY2nWMPh9lsIkhPCjkHO245wpnfFbrHmzdcZDVFPVww,3265
296
313
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=8,N=8192,device_name=NVIDIA_H200,dtype=fp8_w8a8.json",sha256=Uz5X80VcNBOaxshwVNUEittHk2zqB4HQCfTJ4TPG5aM,3274
297
- sglang/srt/layers/quantization/__init__.py,sha256=0qQgvF5wR9VlYO9xv8GERPgtKWZ9OMilaxcSUeGTyN8,12424
314
+ sglang/srt/layers/quantization/__init__.py,sha256=fzlKUHBIQU8TsbzjAoFikdPKc4VXyv32ANF0EkO7XmA,12512
298
315
  sglang/srt/layers/quantization/awq.py,sha256=KemDG55U3B6YZVjMV71awVAIj0islFvtxcUHmOBeGy0,6739
299
316
  sglang/srt/layers/quantization/base_config.py,sha256=jWk_egQrVNMYmQgbTI9vkcgzScLFjB5_sywFlAfE5J0,4776
300
317
  sglang/srt/layers/quantization/blockwise_int8.py,sha256=BgPrsTakDDFirALkW9q9VmFk0wFZv9cotkTU69Gnxeo,15122
301
- sglang/srt/layers/quantization/deep_gemm.py,sha256=a8T2IdWV11m4tnXfSwEmNzb_LwdaXcuaseFRsR07TtM,13124
302
- sglang/srt/layers/quantization/fp8.py,sha256=QguTeY-PMgU5Vu3QdeqmS3DgFD1R9avwgBZABG92dcg,40709
318
+ sglang/srt/layers/quantization/deep_gemm.py,sha256=J9Brr0E0BEWFUrpTms_s7glPSXHCkaVS7YJKemWII8c,13214
319
+ sglang/srt/layers/quantization/fp8.py,sha256=9FC9HxqoekZF0YkIOZtngoVRvSYc0xKS7cqZ4L5jbq4,44220
303
320
  sglang/srt/layers/quantization/fp8_kernel.py,sha256=OKpebbn09CpRzxFgB-RB_I4ZnWGLJ9nR0YTFu6-ZMdw,32570
304
- sglang/srt/layers/quantization/fp8_utils.py,sha256=VHU7glWyKjAMvR-zXAvZIuqMk6V3fj-rOx9K3xR-LEE,20075
305
- sglang/srt/layers/quantization/gptq.py,sha256=gyGMOPXHzozK7pPWSjKgLdFX9h7MCEww7n8FqEVEVac,15364
306
- sglang/srt/layers/quantization/int8_kernel.py,sha256=W9sXTIs46LJQPHLCt6UjoAVkIZhUn5eWq8pbyQBHpSo,12163
321
+ sglang/srt/layers/quantization/fp8_utils.py,sha256=wtgunvlmuYg_6wEA1_rd5BHRhGlWDmIRq6mIdpb5FIo,20234
322
+ sglang/srt/layers/quantization/gptq.py,sha256=d1frUjvXmZfQKkcMQY5t0BA4sXWHE9Jze24qxniptJE,26719
323
+ sglang/srt/layers/quantization/int8_kernel.py,sha256=GfRC9FOn9exNvK4QHbUeBj3Hhv32VcyGphapFPt5b84,12625
307
324
  sglang/srt/layers/quantization/int8_utils.py,sha256=YK9CS-lb_n91kNCTKK5o5apYF31V2giDg5G5VKrpcUA,2356
308
325
  sglang/srt/layers/quantization/kv_cache.py,sha256=_9pF5rwvB7ta6Gdc5YKVVGbNzYwqmhIx4TrX1-xnodQ,3261
309
326
  sglang/srt/layers/quantization/modelopt_quant.py,sha256=TpPgtbV7O5r1JY4Wm0np2pReQO6XERIdEDQcV41oTn0,16596
310
327
  sglang/srt/layers/quantization/moe_wna16.py,sha256=KtFr4lIslMA12yx4JjXXPOsa5OHjxXWA6scYCRQnFMQ,19483
328
+ sglang/srt/layers/quantization/qoq.py,sha256=adhsCixRUTh1m8sfpRWNhh5oX3I1WJli3Elg8uexP6A,8222
311
329
  sglang/srt/layers/quantization/utils.py,sha256=AXvGD8KRZVVrkRR1Y64fGkz4lkUP-CAjAQdp0LDNXrE,5266
312
330
  sglang/srt/layers/quantization/w8a8_fp8.py,sha256=UFwlch8qEm2J4muM4hMATj06-rf-__lSbBqVr00j1tc,11459
313
331
  sglang/srt/layers/quantization/w8a8_int8.py,sha256=MkvmcxQj3X5AZbx8pgnHYAikc_Xd_jOhJXaxx7255ho,8984
@@ -474,7 +492,7 @@ sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a
474
492
  sglang/srt/lora/layers.py,sha256=xdP2Gwlw9PCPZBhujGqO6aBn0eGxpVeIBFUp1LIGCto,13119
475
493
  sglang/srt/lora/lora.py,sha256=uNvbjZ_Wr1SLI9-ElRJA_JKwkibSGroP5Bfpsr9MI-Y,7527
476
494
  sglang/srt/lora/lora_config.py,sha256=qDgMTx_69jyJUl29O5FxLzYa0BMhqYVXWXfyyVOvGm0,1684
477
- sglang/srt/lora/lora_manager.py,sha256=1vkfpx5EfkGji08xUFEBTNfeDjpjfieQDRScIbEmO3w,11528
495
+ sglang/srt/lora/lora_manager.py,sha256=rn4dy99SREWL2GB4wH_e7POgnFrSkmOY-jCKmmX-974,11443
478
496
  sglang/srt/lora/mem_pool.py,sha256=dIx_8yZiJkFMyddfKL9G0zzgDxdkCQjG2qrbdHxqPtA,9633
479
497
  sglang/srt/lora/utils.py,sha256=S53SOjYqeEc9toqGaThod9MNWEJs0OJew6KY558cMF0,5250
480
498
  sglang/srt/lora/backend/base_backend.py,sha256=EIz8I-GIrdmK4fISw3ENhbJVVITaxKfyLxHXGPU4fPs,5044
@@ -488,66 +506,72 @@ sglang/srt/lora/triton_ops/sgemm_lora_b.py,sha256=EoF9HymgQ1V9DwyOJOvbw1hCbEjprV
488
506
  sglang/srt/managers/cache_controller.py,sha256=RDKuRuRdrMWhsy4QOXvtTG_u_NQUQFly7a6BnoEYiMY,18434
489
507
  sglang/srt/managers/configure_logging.py,sha256=fOJaXAQ1n9m-8KPJndpsKvS885i69SMafoEADLIVfIM,1633
490
508
  sglang/srt/managers/data_parallel_controller.py,sha256=nB4CD_g8VShTZHCQ9sfst73lQeSvOChFzeY-6RRAhL8,11648
509
+ sglang/srt/managers/deepseek_eplb.py,sha256=bExIzjdX8IcBOWYdgne5n0VV9Vht6AfDPeBjQY1rttA,10699
491
510
  sglang/srt/managers/detokenizer_manager.py,sha256=SpLxTsSPKBZfD-ZMhJ5zpPPGuUb8PmcYgFSL9CsurU4,10696
492
- sglang/srt/managers/expert_distribution.py,sha256=r3o5RGI0gnV7xb60AApqKYa0oiSB37oB7hQBX7P3xZM,3225
493
- sglang/srt/managers/io_struct.py,sha256=A6Odr-nyO3CJ0925m_2zCnvra6oQAFPU2o7F9TqSD70,31835
494
- sglang/srt/managers/mm_utils.py,sha256=qTxNjMWdQwPpWBjk86eOS-UEgkfwNq5WwYiREK3wRso,18090
511
+ sglang/srt/managers/eplb_manager.py,sha256=Th-CcIJjXdwAjja7WmXsc-41gjHyqUoHkeopSi17Jvw,2004
512
+ sglang/srt/managers/expert_distribution.py,sha256=lBqqULoM6WRr1pzN-2dDGMm3dMPMI3s1O98YlEiP1qk,24921
513
+ sglang/srt/managers/expert_location.py,sha256=IpmiHfU_2Zi7_pscMQsDJRzp9hwqEr9hDOs1Wh2zKzU,14656
514
+ sglang/srt/managers/expert_location_dispatch.py,sha256=GmQ2chTMCPJdkYydyent0hGXoQVGcDAmA0ZQt5Yq3LA,3461
515
+ sglang/srt/managers/io_struct.py,sha256=LEdefg_TOXeEglzXcui7f6Phyk_Yfb3IRdM8sYiX72E,32343
516
+ sglang/srt/managers/mm_utils.py,sha256=5sagb_LjLP6UOv5aXJiCTZHq5tJK95N01A3mOAMo9-4,24720
495
517
  sglang/srt/managers/multimodal_processor.py,sha256=XlRYvNhF6XOssreRX9DZPhLSpps_VE62gSKw3EGdNPo,2088
496
- sglang/srt/managers/schedule_batch.py,sha256=OhrWYd_ywWiNNMOp_fcDOIwYt9_gX7oZnR9imEXbkb4,67564
497
- sglang/srt/managers/schedule_policy.py,sha256=mCgwmhCTpzQJawiNizIxjY4nszkxokMmMz9DlDGGUa8,19666
498
- sglang/srt/managers/scheduler.py,sha256=2TzJU0DZ_nmLnYJjQGn_JZJdfG-cDQnuMZUrINiOwsU,91483
518
+ sglang/srt/managers/schedule_batch.py,sha256=GwbTqrq1anmayVeGl5UklRk6X45g5JlyeEAGhlnzpQU,68679
519
+ sglang/srt/managers/schedule_policy.py,sha256=6uRRgxbTJ0pztoAg8oRh2u1g6hNejDyMevD2-68zEYA,19723
520
+ sglang/srt/managers/scheduler.py,sha256=fScqhC7bQAy1BDtk4i5yeDDCCJMpXKhOF6RXDnoM_vY,93732
499
521
  sglang/srt/managers/scheduler_output_processor_mixin.py,sha256=aaj0z1PD3fGIOPoTtWwqoKsii0yQCR7txVFXMPECveQ,29879
500
- sglang/srt/managers/session_controller.py,sha256=o-ifit0n4_xHLNmyD0Ams8FxGRgxFybX-Vz1hwgr3UQ,5755
501
- sglang/srt/managers/tokenizer_manager.py,sha256=DMGNicPMCudO81ryP4zPC9GbO6cAkouGNUHtSQ4f_pQ,56162
522
+ sglang/srt/managers/session_controller.py,sha256=Lh1kruMcKqR7WVWYJRZbYgowtsssVlP7_paIVXLLIcE,5756
523
+ sglang/srt/managers/tokenizer_manager.py,sha256=MUTU2wZT3sFmB05Iej3Rs2EO896by6g1Gs-hBAeLfq4,59559
502
524
  sglang/srt/managers/tp_worker.py,sha256=cnI2JRxDqM7RXaaXAnLHNyYH4Jt7SB6HLAD5fRoWoNA,10025
503
525
  sglang/srt/managers/tp_worker_overlap_thread.py,sha256=W-FP7dkR9_voS0emMj4N5ML3Iao9gNZc-on6iUflbrw,9835
504
526
  sglang/srt/managers/utils.py,sha256=5i75uLlQOF_5CaT02CrWtwozMTtwTg2_nLP8Dtr-JZQ,1536
505
- sglang/srt/managers/multimodal_processors/base_processor.py,sha256=DMeqUdxyOZ5IKo-Z2NjEteJS-Oz6gG9jyU27c8QwA5A,10367
527
+ sglang/srt/managers/multimodal_processors/base_processor.py,sha256=D8TkKouzX4NSwziRNIoOzvf1mPIHoouDyHpHBRmBl6Y,14190
506
528
  sglang/srt/managers/multimodal_processors/clip.py,sha256=lRc2mcuDbAhZVf-0EfkO81pqDiol9zLvTpDqtPIBQ2k,1525
507
- sglang/srt/managers/multimodal_processors/deepseek_vl_v2.py,sha256=hpjpGFzlRBQ8Xv08i37X_VUhnDp_Qm2xD1_F17vK8fI,3253
508
- sglang/srt/managers/multimodal_processors/gemma3.py,sha256=G52ck_3UQGeyrtvjLqI8B0Tm8iNsyB_ahiMTAvx083U,2191
509
- sglang/srt/managers/multimodal_processors/internvl.py,sha256=mydI4yWRMiIo6y8ZL_wxqU2IPpfVf2eR4SA-yOmK3H0,9172
510
- sglang/srt/managers/multimodal_processors/janus_pro.py,sha256=UJoKQWsoU9kittKDwjWbG2KC12wSA-4A3DpTPhA6VoI,1854
511
- sglang/srt/managers/multimodal_processors/kimi_vl.py,sha256=vC9OeS7gVTHzazbluiQ1I0QRKqszlqK75ghUA1rmUNc,2490
512
- sglang/srt/managers/multimodal_processors/llava.py,sha256=APzkprLvqrQkFA6LoDemUa73FtjQL4lwGSnsx5R4vuk,8004
513
- sglang/srt/managers/multimodal_processors/minicpm.py,sha256=uEnlsImjHBOMVNGlfBGpn1zCDLNeMY58HvJ7ZthL2N4,5698
529
+ sglang/srt/managers/multimodal_processors/deepseek_vl_v2.py,sha256=CMfhhdq7u6GzT8ZENo7ByClvQEx-HKaTGVgdYM1vMNw,3460
530
+ sglang/srt/managers/multimodal_processors/gemma3.py,sha256=YUnVl7WA2inYV0QdBwb6mVIxqBRQorK2ivlB3nlX8PQ,3251
531
+ sglang/srt/managers/multimodal_processors/internvl.py,sha256=PYyumQeL8sxfzAlgYLErMX2GW3PT_IF3GJWDMjesSSg,9395
532
+ sglang/srt/managers/multimodal_processors/janus_pro.py,sha256=nSZYKLoCZtv7sQIM21KCt4jpnzVfcsF84m9CFPWwR7s,2058
533
+ sglang/srt/managers/multimodal_processors/kimi_vl.py,sha256=SNe8dXjZezksfd5YJWLhJsXofSYGsBKtd_kPYj51iBo,2641
534
+ sglang/srt/managers/multimodal_processors/llava.py,sha256=90D2A09EHgdWwapVSeLg5J4YsioeT2AvGmJkepZA-5I,8100
535
+ sglang/srt/managers/multimodal_processors/minicpm.py,sha256=2zHMSvMFvCkzk0v_SIaj1c_CJI7bYZ9we1HCukNb-lo,5544
514
536
  sglang/srt/managers/multimodal_processors/mlama.py,sha256=MLiGS606LzVtdoXvjWGANx-K_7nE9J_fMVmkXN7Gz8k,1661
515
- sglang/srt/managers/multimodal_processors/mllama4.py,sha256=50Yox7TaGrrB7iPjN1dQ_UzuY41x7VLmMcRXBhTgUvE,5592
516
- sglang/srt/managers/multimodal_processors/pixtral.py,sha256=YG4-ufrooQnlGZ4gCnl-Scwor322oCHHbO6-SdztwpI,4064
517
- sglang/srt/managers/multimodal_processors/qwen_vl.py,sha256=l94DOaY9vhlD-QjWVWNHUmLu48UKTb-QN9vXqrQxBgA,6907
518
- sglang/srt/mem_cache/base_prefix_cache.py,sha256=NY62Zo0A0tLJ7ObRLOQqQcXCxoJUDZsK8f5U4dNQjKc,973
519
- sglang/srt/mem_cache/chunk_cache.py,sha256=Lyv3eUEaYnCJCLoZQhCx5WfiiUCrrS4xti3e5VROl1A,1894
537
+ sglang/srt/managers/multimodal_processors/mllama4.py,sha256=IAu09ZPMAHxZKsfGiKjZU_Fruj4AmKA0poqXC0zufWQ,5813
538
+ sglang/srt/managers/multimodal_processors/pixtral.py,sha256=uQJYbxhafNCmg0xP52FdElnkUatAyintER1XNuKz3b8,4195
539
+ sglang/srt/managers/multimodal_processors/qwen_vl.py,sha256=hj_XWTjIALAcUuTVqln9GYWDpwFBJbzrDgq2tPYvTPQ,8709
540
+ sglang/srt/mem_cache/base_prefix_cache.py,sha256=WOUIY6ATzltzXQ7QXS9biSY2o_kzbpDIuTD4C6TLCQQ,1019
541
+ sglang/srt/mem_cache/chunk_cache.py,sha256=YFRsxPdLPrO550zww77mn29JF_I22ZBNyL_HA3aazQQ,2017
520
542
  sglang/srt/mem_cache/flush_cache.py,sha256=GYcxmNXh4hsMpFfNOuCTpKilW7guZwTtAg_usVeM3J0,979
521
- sglang/srt/mem_cache/hiradix_cache.py,sha256=BJR-R2u5YyYIhGIxTY-3rf8Vx60XjCRU8Yhmkn2fzzM,16597
522
- sglang/srt/mem_cache/memory_pool.py,sha256=M1rKyPZ0TBLenO1nQgsjAwheBfMzcR3-B4hPNAEgCEQ,36358
543
+ sglang/srt/mem_cache/hiradix_cache.py,sha256=v2P-sl0gpucJZNDEhO0BdinWL270czE7uFZglOtuS30,16617
544
+ sglang/srt/mem_cache/memory_pool.py,sha256=GymHdB7PQlGlXLgA9OfDbp6002cz1tXagwBIQkYpgK4,36293
545
+ sglang/srt/mem_cache/multimodal_cache.py,sha256=Q-lYcI-3HoLu0WJhE2F_An8g9mkZ8LwMrYnQ4383Rf0,1266
523
546
  sglang/srt/mem_cache/paged_allocator.py,sha256=BrJS0vN1k-vTSgb_M8u_1KoZFRgzgR1WRyImCTq3T0U,9770
524
- sglang/srt/mem_cache/radix_cache.py,sha256=Lm-pco6CJ4orb9IfDpbHm5MnyK8Ya0OF1x9p88dv548,14906
525
- sglang/srt/metrics/collector.py,sha256=o9s4j-QC6JK_S352QVkAUkz35my57gFPWyhh3WUIfiY,19569
547
+ sglang/srt/mem_cache/radix_cache.py,sha256=foS7mmPCCUWDP12aQCZGw7XAJqYfzZTowkoCTOa7jjY,16656
548
+ sglang/srt/metrics/collector.py,sha256=YbFOQojvlzT6i6DqvH87vzVYZfZzhHHl0SLwG76kqfg,19585
526
549
  sglang/srt/metrics/func_timer.py,sha256=VFyNRrbnKVCwnQsrlLin1lITJfjQpf9m8sGPqL5LIsQ,3438
527
- sglang/srt/model_executor/cuda_graph_runner.py,sha256=toZ6OvNcxWQMoPcpifWgeoeJP-fGdwySVzdLkec8Oso,26310
528
- sglang/srt/model_executor/forward_batch_info.py,sha256=b7XH72qIpslgEpy7hyMqCXtC_fWNm_yuqVtQRk8hWPw,27731
529
- sglang/srt/model_executor/model_runner.py,sha256=J0B6nSs8oiuizHM653c0SY5PJ9BbqUmne8igPs1bUdg,49200
550
+ sglang/srt/model_executor/cuda_graph_runner.py,sha256=QzYrlTkqxvqlPEoc9x0QhdxqtzK3pyjjuagt57NN4CM,26530
551
+ sglang/srt/model_executor/expert_location_updater.py,sha256=Wf_o-JPsUH81ZLCZvMkyxqaZngtU6PoVgVX2EMZEBFM,15791
552
+ sglang/srt/model_executor/forward_batch_info.py,sha256=3V5FKLj_dLL5pxy0FtcDZr2nUHGnyW8gRkx1GF7r7dM,27952
553
+ sglang/srt/model_executor/model_runner.py,sha256=bVrjXDzCAb3_H2dj2KbSvgO8wwdYrHKJ3ZGhcnu8eyo,52429
530
554
  sglang/srt/model_loader/__init__.py,sha256=zGZkOBz1zx-pkaIy47BasL3fjDlAcxAXUTjInOhXHAE,919
531
- sglang/srt/model_loader/loader.py,sha256=-TISKGKpehU86vVyGm0xo2GALVVzQSUibi3jEisTBiw,55494
555
+ sglang/srt/model_loader/loader.py,sha256=C2R_e-KbxrWK9v_bVC6U7eRG8SyJ2KxKyYmBx8BxbJ0,55650
532
556
  sglang/srt/model_loader/utils.py,sha256=0NaMR67fESFopaklmsleiL27XH1QUrjZW246MUu1EJ0,1369
533
557
  sglang/srt/model_loader/weight_utils.py,sha256=yKnau-wH9muczoCpDTCVIqXFqz-QJmEEySplX3bMJWk,32153
534
558
  sglang/srt/models/baichuan.py,sha256=HbvlErnkCSK4pRQYCSDxMcrn-1DQyfiNoeDcnRrJas8,15807
535
559
  sglang/srt/models/bert.py,sha256=kHlErDgNX_mIhfWWCnAcH_ncvYg22Y61gI34gW8GuUY,12738
536
560
  sglang/srt/models/chatglm.py,sha256=cajLN9caBl09e0TwOFkiTTKDqwlbmHo_yS-NCjdeQW8,13957
537
- sglang/srt/models/clip.py,sha256=58m-y5lkHIGY0ypYGtgD6gImQ7yZJutYGVl-ygqbNBI,19765
561
+ sglang/srt/models/clip.py,sha256=mkdSNhc2SgRHyeq9tCLEjUGdnA8yS2EMMbMKSpn5dMs,19863
538
562
  sglang/srt/models/commandr.py,sha256=5Y_b3K0QY7D37nFGkyiGgY38RleRui_GJUYcHSuHUZo,15315
539
563
  sglang/srt/models/dbrx.py,sha256=4pn_fdoATg01VEqNnIAxNEsKV5XU7gwHyd289eydq1s,15598
540
564
  sglang/srt/models/deepseek.py,sha256=ZnN02HdgXCB23Vno5V9UMUoOxH5HC82vNTwsVulUJ-o,17206
541
565
  sglang/srt/models/deepseek_janus_pro.py,sha256=OeeI7vZbE4HGpxa8CwT6-Lbfs7J7WMQ3oBNpVJQpv3w,70450
542
566
  sglang/srt/models/deepseek_nextn.py,sha256=Yy5dItwimszQsAN7EjgND2cNQ9bypJ1TtFfhqcBQJnk,5673
543
- sglang/srt/models/deepseek_v2.py,sha256=ueqi4m3S4rj8VL49MdXmxXrNHp2rAsYCfclcjLOafHg,75767
567
+ sglang/srt/models/deepseek_v2.py,sha256=iaFIKpi-_xfcv9Q18WZu7r9kCRZqYyTqApuO1SAvTXw,73855
544
568
  sglang/srt/models/deepseek_vl2.py,sha256=j8BdxZsMjm6lPdbDipEIKhVIVywCP1Vl1Kl46BZ5_0Y,13147
545
- sglang/srt/models/exaone.py,sha256=rX7J0xFt9TSt6tMIhnYMkb5KDnqTJIV4BtjPLFwQ8_8,13425
569
+ sglang/srt/models/exaone.py,sha256=TpO-rtCpEZ8Ua7hGFnS8l2oAYhY0Pij50grc9WQ2mvc,13576
546
570
  sglang/srt/models/gemma.py,sha256=4cdrPISg1VKnsuI-QPTpYvet4BrX8BMKvCIN82iLskw,12641
547
571
  sglang/srt/models/gemma2.py,sha256=kqtwdo93GWKm2iBN29RoIRH2ggRm-K_80LM5btgfBLo,16395
548
572
  sglang/srt/models/gemma2_reward.py,sha256=V8U3_ADUHWPdOwvEe1jhGW-oJmBgL8t1TY3-67Ksv2A,2618
549
573
  sglang/srt/models/gemma3_causal.py,sha256=LfwHhF0nRD7OnmeHXXfQ7rofnFXjJI74gZiptak18RY,24924
550
- sglang/srt/models/gemma3_mm.py,sha256=5rthHzaFNJb82IYUREwxQt4N4fDXW4lIxiptnKpVing,15246
574
+ sglang/srt/models/gemma3_mm.py,sha256=EOW5Q0iOFvJWgpA1QdpwzVicVvv7RulERXWNtC-I_pQ,17004
551
575
  sglang/srt/models/gpt2.py,sha256=kclhxEs8oJk1KCyhmAqo7rZqecVGGHYkc-a1WZi3aIk,9841
552
576
  sglang/srt/models/gpt_bigcode.py,sha256=1D6bi8Zu760gCRZkvdLHFcg8kCkY35ARwQYaMDtYhl4,10307
553
577
  sglang/srt/models/granite.py,sha256=5WOJyNYAlt5RNHSexNfPNihhSxIMd7wPzju1cTixKig,20852
@@ -558,22 +582,24 @@ sglang/srt/models/internvl.py,sha256=kEzkL5tAq3skvK5D7TqhiElSIXrA6cNOd8irYV4aKhA
558
582
  sglang/srt/models/kimi_vl.py,sha256=YoM6CmrF4ZS0SsXKiR-_SfylKhd87ciJjno6_x5LG4o,12874
559
583
  sglang/srt/models/kimi_vl_moonvit.py,sha256=M5L7AJOJ2Zh2pqLZAq8aRqhbTSlipr8XOoD3ix6o2sU,23908
560
584
  sglang/srt/models/llama.py,sha256=-NC9EL9R8iJqaRrkMLewvTP3sgC_f07AHmGBVEdKmQ8,27149
561
- sglang/srt/models/llama4.py,sha256=EZdosYTrzEX0oYnWqocTzB4n7U9_V8fIgJqGxrJn268,19385
585
+ sglang/srt/models/llama4.py,sha256=NwG0mBZQR4B6KVR-Xzp89UQYvVnFMOgkZKVWvtT7Jt4,19454
562
586
  sglang/srt/models/llama_classification.py,sha256=4QWTFaUZIFKYZvEzs8bx8VkOZNIwdYCLrnwrdAw4QK0,3108
563
587
  sglang/srt/models/llama_eagle.py,sha256=Ubh_jmtfiOnriwvHgQT0ZGID7JvYvdSi_QGHOIkEgPE,5028
564
588
  sglang/srt/models/llama_eagle3.py,sha256=KCvUrWn17t7T28G60HwMyy99iB9AbdbPnS2el9n3r6o,6804
565
589
  sglang/srt/models/llama_embedding.py,sha256=zq-_lNu35VBFc7eemiam0zdkGIE8fzrgk5OWYfirZnA,3254
566
590
  sglang/srt/models/llama_reward.py,sha256=LF2nqMV5XOrljGjAwJg43mBv3z6Q040I2EYlgZeCp8k,4681
567
- sglang/srt/models/llava.py,sha256=b9WcshvSqz1cqbuOq1tVTKH5J9D5PN5bBYrWzVKIQzo,37116
591
+ sglang/srt/models/llava.py,sha256=m0-qcEWEUyN7kIiCYJAZTi58MwL4ioqCAD99PSTpsuY,37496
568
592
  sglang/srt/models/llavavid.py,sha256=q0lHlRnoYHKJZsWnkIQdd6dYAQ26t7XsmrqA0zDGmZc,12829
593
+ sglang/srt/models/mimo.py,sha256=Mp-iFp4YHuiuq-H8enUF5K5QbMnVcvEa6mURH6vM3yM,6140
594
+ sglang/srt/models/mimo_mtp.py,sha256=y0wTNObGz0lyVt0zu7apdVlTRLEQmc_xsd8SvgSo_vo,7806
569
595
  sglang/srt/models/minicpm.py,sha256=m5HFsSJj0Po09LY9R6qj6K4gceqWDMOePz3NDGgMGT4,14691
570
596
  sglang/srt/models/minicpm3.py,sha256=6-gfHSfXwyB5zw7AIj-c5TzjpEKR6CM0H67MrD8LVUE,19347
571
- sglang/srt/models/minicpmo.py,sha256=BAiFR78L0j5WDZtOrUf6JgUe9DZs9huIsfQ_4RzUbdA,76319
597
+ sglang/srt/models/minicpmo.py,sha256=umWgRpYqJchXyZOcz7LeBWIo6JatN4Wyr9bufcVmpbk,76060
572
598
  sglang/srt/models/minicpmv.py,sha256=hSDWEcmutqOJv-xs0X_4TaNCDAWFUk71eRHLm9sPC0U,40564
573
- sglang/srt/models/mistral.py,sha256=EYifJUUzN2Z2-iL37eJiNZF_DB0H4pa0mKlgYRIxM70,838
599
+ sglang/srt/models/mistral.py,sha256=z7q5NBVbQcboQTIwhULtsLpFvNferaIv49EzOXVgh7g,3487
574
600
  sglang/srt/models/mixtral.py,sha256=n-Pz7fyWE4m6Uh7sjzAYKNr5Wy4QUj5Yekl0qiCwQI8,17055
575
601
  sglang/srt/models/mixtral_quant.py,sha256=-kQw9r8KcLdO8SNN9RKXzrGq9Q2Al9l9cWHi1VrZSRM,15260
576
- sglang/srt/models/mllama.py,sha256=sOuP3Od3h9_uh_oxDN5rj4CzhZjg82PyElfBHuTxzUQ,39768
602
+ sglang/srt/models/mllama.py,sha256=pkS0UWiqKJHRsFtSZzpSI9O6B5_j1OtI5pf_nyDPp3U,39707
577
603
  sglang/srt/models/mllama4.py,sha256=ejuhIVX0MDojdB5EPR-V-Qd_E9st8KYjnjyeArFbdFs,9084
578
604
  sglang/srt/models/olmo.py,sha256=7-q_fA6XXdG7kPUjpUzYkzMUWJobuSjhqjYw9xSUs_c,12671
579
605
  sglang/srt/models/olmo2.py,sha256=azmljhJF4ivcQfUtfsAUxq3ducE4tRKTL6iwe0IKYMg,14327
@@ -581,26 +607,25 @@ sglang/srt/models/olmoe.py,sha256=TMzt-yB891bvA4X50xL0NjNnFYSx9imlA7N1EG8KNK0,15
581
607
  sglang/srt/models/phi3_small.py,sha256=eJb8aS_3KLObrq3PNkoIyVHaQ6SZTAJe42rbpC54QKg,16012
582
608
  sglang/srt/models/pixtral.py,sha256=Iu7OTvM_nnApk1VjpUb1ucPBU2F1Kov5w6ddYn7gGqE,16983
583
609
  sglang/srt/models/qwen.py,sha256=xYkVmMZS2uMqWhfndc8EYm0olpKFnggfuMp_6aobVi4,10758
584
- sglang/srt/models/qwen2.py,sha256=ab912Yyk0aXOzI-wrxqN-sNF3bTVkNxB8P2uNcOCv9U,16394
585
- sglang/srt/models/qwen2_5_vl.py,sha256=LQee0Yuz6XzKiIFZQBUgRuDN2aX_CqvoxHx7w5a35ww,22603
610
+ sglang/srt/models/qwen2.py,sha256=OBhNcpd2eSTceHFOjJFRBefv9WgZl0FkW5ErRNaKaME,18563
611
+ sglang/srt/models/qwen2_5_vl.py,sha256=i35Gs0XJ8mnyDbXp_D1CmcQJoGS2Wly6BadeGI47Sjk,23031
586
612
  sglang/srt/models/qwen2_classification.py,sha256=dGrMm4ebd30_lBhHOhaV57ig2iOTx3nqB4GEzsrRIM8,2747
587
613
  sglang/srt/models/qwen2_eagle.py,sha256=Iz0HWL2FgSD3FqoFhfYmbIZeEYkPTJ96lYbkncmHJX4,4644
588
- sglang/srt/models/qwen2_moe.py,sha256=iG0d2WwUosOFR9w2YGM9CfvZ1NG-rhse3OUTwSs8a6Q,18567
614
+ sglang/srt/models/qwen2_moe.py,sha256=6jsxIExxs6gd4rezTcP_yFtMlW4bwOWVGskVYQWfNxM,28822
589
615
  sglang/srt/models/qwen2_rm.py,sha256=-mQXDEv11p-I1HXgYLTtY6ROem6UYorO958WsDrzsgs,2837
590
- sglang/srt/models/qwen2_vl.py,sha256=X18_Smisiz6zQHUK4h7-ho8poRKWjUZisjB5LuUwYGk,20946
591
- sglang/srt/models/qwen3.py,sha256=reaowGkotYAGHS5zTCWrvnyxtu92QKus19n-2amtMa4,12358
592
- sglang/srt/models/qwen3_moe.py,sha256=A9Z3OhJqld1sJUDsHymgGxib4lMCMTKxF8iIzHDGdNo,15877
616
+ sglang/srt/models/qwen2_vl.py,sha256=Y-03fgF_8K0Ozd-GMgeCzfHHQS60aPDLfadZdRdy8g8,21311
617
+ sglang/srt/models/qwen3.py,sha256=lL39Ap6eY-7YFUrvLrd1cRcQ3zoUgYaI7D8Y9lb45Ls,13516
618
+ sglang/srt/models/qwen3_moe.py,sha256=6V3MCPhBc_gul2Qqu9d1cqoEt5YHXmo4jp48AxJN-i8,29457
593
619
  sglang/srt/models/registry.py,sha256=inKh9iwOp3LFYm3nqujg-OtABClOP-ifc1stA9cZegA,3434
594
620
  sglang/srt/models/roberta.py,sha256=77H_-9jtjqpHlpQhBuZXs7RUG-dSjauDkpHhFe61DpE,6320
621
+ sglang/srt/models/siglip.py,sha256=DIVJRwdtpLD2QT1kVPIHw7Bn9BE40xJbkHujDNzkjgA,9892
595
622
  sglang/srt/models/stablelm.py,sha256=0x_31uIr3WcWwecdPAI3ek9KkyKBJS7VwknTk2y0gjY,12281
596
623
  sglang/srt/models/torch_native_llama.py,sha256=oTxxof5Wx2b2egIwWx56LeHjtPGQleQ2zM5jXHMiuOU,19293
597
- sglang/srt/models/xiaomi_mimo.py,sha256=Mp-iFp4YHuiuq-H8enUF5K5QbMnVcvEa6mURH6vM3yM,6140
598
624
  sglang/srt/models/xverse.py,sha256=DsNVI9JpzN4jj0Ry6aTrj7r-xq5YLOoDX2kH4YLJA-I,14035
599
625
  sglang/srt/models/xverse_moe.py,sha256=7KCM2-j12towDMNvXkuuYiBOmNauH6NG4Ip40x0khqA,16782
600
626
  sglang/srt/models/yivl.py,sha256=oToK7-u5IGO7xwpJIQ7VtudlK6-zPqJX4bt6_wv0SH8,4850
601
- sglang/srt/openai_api/adapter.py,sha256=rTVMbR6jbY-lbMZL_VvWF-3E6FQrD2nb0HMg2OrBP88,77748
602
- sglang/srt/openai_api/protocol.py,sha256=CsMwbu09RzmdZ5d6nrZ5di-5_kN1g8452kKBlX9sF6c,14353
603
- sglang/srt/platforms/interface.py,sha256=hym3iooBB4C8if5hDZezgVN6h4NIOu7sg2ZUBIV6XmM,11246
627
+ sglang/srt/openai_api/adapter.py,sha256=J8AHUwfCzai4d_fHGg92SA0evdn8IPTwH01u6XrEOj8,78334
628
+ sglang/srt/openai_api/protocol.py,sha256=6HnE8MZ5m2V78mJZ9Im9NyaD4FqC1WrJT8Ewx1iFySI,14459
604
629
  sglang/srt/sampling/custom_logit_processor.py,sha256=AwODYVJdRkcQ8PGtJrhzKsqAgn8XZLQbAmR9fGiQzmc,1608
605
630
  sglang/srt/sampling/sampling_batch_info.py,sha256=VjOQpiXsY2vlTPtSb0T4piXIEtE54QefDpTVSDJ7bXE,11988
606
631
  sglang/srt/sampling/sampling_params.py,sha256=tfUwWgxu6JWXsOClX_MFGTfetgRE63CQZsIpOhnWcoE,6013
@@ -611,8 +636,8 @@ sglang/srt/sampling/penaltylib/orchestrator.py,sha256=XM-Lm6u7gYPtMZrTIc0FR4QxNZ
611
636
  sglang/srt/sampling/penaltylib/presence_penalty.py,sha256=NRh10AJrrQlGJ6S-enGdRefrTrWpyqrSm-aNnyqQNQQ,2119
612
637
  sglang/srt/speculative/build_eagle_tree.py,sha256=lt4sXUehPi26MT2-2Z0VivtF6AP7kirSaEO_u-YJ4J4,11670
613
638
  sglang/srt/speculative/eagle_draft_cuda_graph_runner.py,sha256=zQl6o6_T08UWIzkZbMghwVy_O2pLOyAYreM9VmyHRmY,9298
614
- sglang/srt/speculative/eagle_utils.py,sha256=DKYmQrO1Mg4i_8e-7YpbVtDifMWxMkAG3rATRh9gQOQ,28694
615
- sglang/srt/speculative/eagle_worker.py,sha256=M3vSOd2MHzECAcWogFuGjdYt-AGuHFqfODQDl_Bo6qE,27012
639
+ sglang/srt/speculative/eagle_utils.py,sha256=uENgCjXzPK--nynUBHKaSb5alRay6QvJ4hOn0BUxckE,33237
640
+ sglang/srt/speculative/eagle_worker.py,sha256=2k6ygbkJ1FK1I3vJNpvISQn8Ac3lW3i3xFRr1ZugIyY,28843
616
641
  sglang/srt/speculative/spec_info.py,sha256=rhaKG0TzyF9XZYHEWp1jccwTBohSNsUDvxHFtAoOl18,709
617
642
  sglang/test/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
618
643
  sglang/test/few_shot_gsm8k.py,sha256=qnEejCyPHGEMBEiNc7T4-t9lvoo2DNN72RXw-ei_TnY,4300
@@ -630,17 +655,18 @@ sglang/test/test_activation.py,sha256=GeTIJHxlLQfW3kM-X1FGa8Sa3dSGKHEXl5wEy-hfGi
630
655
  sglang/test/test_block_fp8.py,sha256=bsV6Y_tCUF2ROEmuPDegNmHzGF-T4AgOvH7eYmAmKtA,21604
631
656
  sglang/test/test_block_fp8_ep.py,sha256=N1rvqbPErBaFFpeAw8TLYXGNZOoG7cfIBP2p5XbSyMo,10806
632
657
  sglang/test/test_custom_ops.py,sha256=2bSo9P5_rJZYFq8Y8IKRimDfFyZZGJluhL7Ngny0Pf4,5571
658
+ sglang/test/test_cutlass_moe.py,sha256=XPgC2wrXs04CEMVUKN362WBRIdWNZhFe_LYvCFlTBkY,9893
633
659
  sglang/test/test_deepep_utils.py,sha256=749ysTBGNzh6rYUCJhhZBtZpeD15eWTeNHYCytcvZtc,7448
634
660
  sglang/test/test_dynamic_grad_mode.py,sha256=L76yUCuk_ymNpXD2CmO8r2GiGjIvD_gtTsuFDs2NolI,1638
635
661
  sglang/test/test_layernorm.py,sha256=2GMWqqNDuGvSMSsEBF5eDCzwVSYA9E6hGhRo6s4ecKg,3764
636
662
  sglang/test/test_programs.py,sha256=DJIbTChloPwaDiEWHQoSTuKv3BGx0-K8Y5e1mDDTACM,18910
637
- sglang/test/test_utils.py,sha256=XijnLXyC7t1Kfg_yz3Y426DgQx8PYsE8iOesdHLAPY8,35032
663
+ sglang/test/test_utils.py,sha256=7kMpQ28wvIb5_tJiH1J31FEOQ0aG-xJgPJI59c6iTYE,33859
638
664
  sglang/test/attention/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
639
665
  sglang/test/attention/test_flashattn_backend.py,sha256=_rTG849FwQdVTyGKkqhczaOqngBmRWXFmkl5NnuK1GM,13914
640
666
  sglang/test/attention/test_flashattn_mla_backend.py,sha256=g4O50WblTpM7_Gq2b76k0i25_z01BOUBQ4i6PmyxpO4,10774
641
667
  sglang/test/attention/test_prefix_chunk_info.py,sha256=er0i3KGHMkw-4UZB1GCFd4oYwRcXfU5wpO1ORqpNGGA,7626
642
- sglang-0.4.6.post4.dist-info/licenses/LICENSE,sha256=FJXh51fvTQklojUFY89XVLsjxRcBqOxPs8XNy-2uZ0c,11346
643
- sglang-0.4.6.post4.dist-info/METADATA,sha256=LYS-QShEa42mO05m4fh0JjTDKD9a4rKtxYaB2vNK_jk,26006
644
- sglang-0.4.6.post4.dist-info/WHEEL,sha256=DnLRTWE75wApRYVsjgc6wsVswC54sMSJhAEd4xhDpBk,91
645
- sglang-0.4.6.post4.dist-info/top_level.txt,sha256=yxhh3pYQkcnA7v3Bg889C2jZhvtJdEincysO7PEB09M,7
646
- sglang-0.4.6.post4.dist-info/RECORD,,
668
+ sglang-0.4.6.post5.dist-info/licenses/LICENSE,sha256=FJXh51fvTQklojUFY89XVLsjxRcBqOxPs8XNy-2uZ0c,11346
669
+ sglang-0.4.6.post5.dist-info/METADATA,sha256=EAgGsHSr-8SE4rQOA2HRCN0L9H3TTbKAg_XIA8lBUW0,26727
670
+ sglang-0.4.6.post5.dist-info/WHEEL,sha256=zaaOINJESkSfm_4HQVc5ssNzHCPXhJm0kEUakpsEHaU,91
671
+ sglang-0.4.6.post5.dist-info/top_level.txt,sha256=yxhh3pYQkcnA7v3Bg889C2jZhvtJdEincysO7PEB09M,7
672
+ sglang-0.4.6.post5.dist-info/RECORD,,
@@ -1,5 +1,5 @@
1
1
  Wheel-Version: 1.0
2
- Generator: setuptools (80.4.0)
2
+ Generator: setuptools (80.8.0)
3
3
  Root-Is-Purelib: true
4
4
  Tag: py3-none-any
5
5