sglang 0.4.6.post1__py3-none-any.whl → 0.4.6.post2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (61) hide show
  1. sglang/bench_one_batch.py +2 -0
  2. sglang/check_env.py +3 -3
  3. sglang/srt/configs/__init__.py +4 -0
  4. sglang/srt/configs/kimi_vl.py +38 -0
  5. sglang/srt/configs/kimi_vl_moonvit.py +32 -0
  6. sglang/srt/configs/model_config.py +15 -0
  7. sglang/srt/conversation.py +122 -1
  8. sglang/srt/entrypoints/engine.py +44 -22
  9. sglang/srt/function_call_parser.py +97 -0
  10. sglang/srt/hf_transformers_utils.py +2 -0
  11. sglang/srt/layers/attention/cutlass_mla_backend.py +1 -1
  12. sglang/srt/layers/attention/flashinfer_backend.py +107 -82
  13. sglang/srt/layers/attention/flashinfer_mla_backend.py +27 -16
  14. sglang/srt/layers/attention/flashmla_backend.py +3 -0
  15. sglang/srt/layers/dp_attention.py +5 -2
  16. sglang/srt/layers/moe/ep_moe/token_dispatcher.py +1 -3
  17. sglang/srt/layers/moe/fused_moe_triton/configs/E=128,N=192,device_name=NVIDIA_A800-SXM4-80GB.json +146 -0
  18. sglang/srt/layers/moe/fused_moe_triton/configs/E=128,N=384,device_name=NVIDIA_H100_80GB_HBM3.json +146 -0
  19. sglang/srt/layers/moe/fused_moe_triton/configs/E=128,N=768,device_name=NVIDIA_A800-SXM4-80GB.json +146 -0
  20. sglang/srt/layers/moe/fused_moe_triton/configs/E=128,N=768,device_name=NVIDIA_H100_80GB_HBM3.json +146 -0
  21. sglang/srt/layers/moe/fused_moe_triton/fused_moe.py +8 -6
  22. sglang/srt/layers/quantization/__init__.py +2 -2
  23. sglang/srt/layers/quantization/deep_gemm.py +1 -1
  24. sglang/srt/layers/utils.py +35 -0
  25. sglang/srt/lora/layers.py +35 -9
  26. sglang/srt/lora/lora_manager.py +84 -35
  27. sglang/srt/managers/data_parallel_controller.py +52 -34
  28. sglang/srt/managers/multimodal_processors/kimi_vl.py +73 -0
  29. sglang/srt/managers/schedule_batch.py +25 -15
  30. sglang/srt/managers/scheduler.py +263 -59
  31. sglang/srt/managers/scheduler_output_processor_mixin.py +1 -1
  32. sglang/srt/managers/tp_worker.py +51 -16
  33. sglang/srt/managers/tp_worker_overlap_thread.py +9 -3
  34. sglang/srt/mem_cache/memory_pool.py +70 -36
  35. sglang/srt/model_executor/cuda_graph_runner.py +82 -19
  36. sglang/srt/model_executor/forward_batch_info.py +31 -1
  37. sglang/srt/model_executor/model_runner.py +115 -57
  38. sglang/srt/models/deepseek_nextn.py +1 -257
  39. sglang/srt/models/deepseek_v2.py +78 -18
  40. sglang/srt/models/kimi_vl.py +308 -0
  41. sglang/srt/models/kimi_vl_moonvit.py +639 -0
  42. sglang/srt/models/llama.py +92 -30
  43. sglang/srt/models/llama4.py +2 -1
  44. sglang/srt/models/llama_eagle.py +4 -1
  45. sglang/srt/models/llama_eagle3.py +4 -1
  46. sglang/srt/models/qwen2_moe.py +8 -3
  47. sglang/srt/models/qwen2_vl.py +0 -12
  48. sglang/srt/models/qwen3_moe.py +8 -3
  49. sglang/srt/openai_api/adapter.py +34 -22
  50. sglang/srt/openai_api/protocol.py +11 -1
  51. sglang/srt/server_args.py +67 -22
  52. sglang/srt/speculative/eagle_worker.py +3 -2
  53. sglang/srt/utils.py +88 -9
  54. sglang/test/runners.py +4 -0
  55. sglang/test/test_utils.py +29 -0
  56. sglang/version.py +1 -1
  57. {sglang-0.4.6.post1.dist-info → sglang-0.4.6.post2.dist-info}/METADATA +5 -4
  58. {sglang-0.4.6.post1.dist-info → sglang-0.4.6.post2.dist-info}/RECORD +61 -51
  59. {sglang-0.4.6.post1.dist-info → sglang-0.4.6.post2.dist-info}/WHEEL +1 -1
  60. {sglang-0.4.6.post1.dist-info → sglang-0.4.6.post2.dist-info}/licenses/LICENSE +0 -0
  61. {sglang-0.4.6.post1.dist-info → sglang-0.4.6.post2.dist-info}/top_level.txt +0 -0
@@ -1,16 +1,16 @@
1
1
  sglang/__init__.py,sha256=T-fZEjKP66Q1q3PB56oREs5U3zf6bL0fNcdIbW8jMhE,1652
2
2
  sglang/api.py,sha256=vHiKBg8wwIdmrpnGclop5BzJ-1Q88emrlrfLwNCHg98,7010
3
3
  sglang/bench_offline_throughput.py,sha256=OQb-AjL4UNymmir02ht43uzgaNsnO_I11nXSowKMqBI,13841
4
- sglang/bench_one_batch.py,sha256=gUIYcFWM_oYSXnM4CHYJcyuX0l1aMG-afK7-iFjAJZI,19584
4
+ sglang/bench_one_batch.py,sha256=_xdxxdUqJtEGfURmBf0WFrQv38Q6vPlfG7QO2b4Fe6g,19622
5
5
  sglang/bench_one_batch_server.py,sha256=8VYNhaQbWGP8TkNVuy_sPjD5FiuVZHamtGRWKwa-Z-Q,5962
6
6
  sglang/bench_serving.py,sha256=8rbek9PLYEHdt8fdll-z_P9e6GpmlLohHiyqY99JXIs,57567
7
- sglang/check_env.py,sha256=76itNLUw9KlqbiY1BI4u4YaMZaqyCNcrCLUIb6aHflM,8396
7
+ sglang/check_env.py,sha256=qDMIG2rCNBH1yKnxQmF-Bp10oiFMUKMgfZLHZYOmdSY,8412
8
8
  sglang/compile_deep_gemm.py,sha256=Umy3oYFeCn40qHUdwlPVuFXmA24fFYB-fuWApgZnEfw,6211
9
9
  sglang/global_config.py,sha256=xzLdk8W53fneFblNh8iIjGF9C3-7mnzR1-LleD9Btxg,1495
10
10
  sglang/launch_server.py,sha256=mDXfwha8LHpWQJekcCosR98QhCQsbmilsBlI5jAIgg0,420
11
11
  sglang/llama3_eval.py,sha256=gWSboDchIGybIce88bJlrCG0yiLZ513mw4gcutJlzGM,10017
12
12
  sglang/utils.py,sha256=GIcgiRHkZ-gyPxXOdn1qFF41jkg4-YdDxbPc4mzO-qk,16159
13
- sglang/version.py,sha256=mb7cZWFtBTYPgotnX_1oAZadFITLHrAXwTSs2Eb1dvU,28
13
+ sglang/version.py,sha256=EOm4637qsQ4gxuzOdaxFFBpWIBeQl7iFLSjMjGurEHg,28
14
14
  sglang/lang/chat_template.py,sha256=MwNL5dNTe8g_l2ljZubnrazEgT2xEv-9O2D0Ezwxy4I,19658
15
15
  sglang/lang/choices.py,sha256=-W1DVw9N9ZliVpvmWrzIXG4cswAah8eMQrHWzkS3D8o,6234
16
16
  sglang/lang/compiler.py,sha256=MAuzoOOpb98njJ7Io2SDmFkhTroDYiq0te0ZpfHkMY4,7597
@@ -27,27 +27,29 @@ sglang/lang/backend/vertexai.py,sha256=gz0uNYyBb88jbPYz6ZIJ774fefrcbuVdoK33bphUZ
27
27
  sglang/srt/_custom_ops.py,sha256=L7NuEaRD_Q6Q54n0NZnLXgWZURbnn8Tkg4NQedE6zgA,3616
28
28
  sglang/srt/aio_rwlock.py,sha256=6LYtOdeTUY3hkfa1dmYkgsaF2ttrwIF3hUWz2AZ2fqw,2970
29
29
  sglang/srt/code_completion_parser.py,sha256=iYRFBxXBAysHcBnf9IHmmyjVkrqKu_9h6Z0_EEjjTp4,5404
30
- sglang/srt/conversation.py,sha256=jgm15yl2SPjSlVjLPwWYklUsUUElq-7W6-KqqGc30vs,30262
30
+ sglang/srt/conversation.py,sha256=otEs_H81NcYsy1PKx8l5Q0BUOIXjHscBlRVEDApWQos,34020
31
31
  sglang/srt/custom_op.py,sha256=J1PUcGaeJJjfAjp06BQsLpUkKyR1zsh9MvDiDlqqJsg,1129
32
- sglang/srt/function_call_parser.py,sha256=gkCzjf7F2xYUmRunrOKzuB_biTdTKxdA1Vil-v2NlCs,29546
33
- sglang/srt/hf_transformers_utils.py,sha256=N2f-gA8yUq-UP_TJT276gNbDNzmddWsmWnq3px6TIj8,9342
32
+ sglang/srt/function_call_parser.py,sha256=evwCPbLFjgNiRf-1CcxVFYbF08UVsh0ZGvq_R35TPlw,33379
33
+ sglang/srt/hf_transformers_utils.py,sha256=JEDiaMYzq89sXWIu_CD2kmnNF1OA-gUJOkyh6kWolr0,9403
34
34
  sglang/srt/mm_utils.py,sha256=1ScBunw_x4W8ebM_AcJ62-1T2mfT8NlMJqdAhkF1lb0,12367
35
35
  sglang/srt/model_parallel.py,sha256=eLXZhvJ4wG6dh0FontNCIdVZvHYdWgaeY-5cu7TD9tE,6078
36
36
  sglang/srt/patch_torch.py,sha256=OUPCGQSQz3MVZB1zZ_Eq8lXiw0uIKJ_HWjqQolI8FsM,3088
37
37
  sglang/srt/reasoning_parser.py,sha256=8AMk3XI8mfvz4AUuRHf_pNYpM_Mr64uT9EZ3o90cqQ8,6341
38
- sglang/srt/server_args.py,sha256=jRHEskSyfmHbCnyqRzp3deI5HizDenDiyLjF65ZUqvg,55149
38
+ sglang/srt/server_args.py,sha256=I4Gxme7w3Fpzj6tsbGu8LmLaMLpxnhqqFXSGVjh6Pi8,56945
39
39
  sglang/srt/torch_memory_saver_adapter.py,sha256=HYlgYJ2sgmjs2RSjU2KbCaXijRg3mTDZ0ZcCB5Bt6Ps,2211
40
- sglang/srt/utils.py,sha256=u_YB-FXi3AY6mhRmk8wdPcKKAo1sZY0bMUgnjq8BtJI,63033
40
+ sglang/srt/utils.py,sha256=AtpND4l1ho_h5N6BIVBRgPAIKjG4DomqRQa_Z08ugvs,65335
41
41
  sglang/srt/warmup.py,sha256=FmJiYfjRr3X_eAe7ojQaPoN17LvHpjDmRWRnO-k86AQ,1469
42
- sglang/srt/configs/__init__.py,sha256=vulncVn70WqIT6s0HaB8p_Q6FjOiaLwNZWpoJS9FIuQ,399
42
+ sglang/srt/configs/__init__.py,sha256=8EcVRP95epZ49DxBa6LgKWt7eO3Qe7Hrr3V1c6HkMnY,553
43
43
  sglang/srt/configs/chatglm.py,sha256=j-b0YkdYUmQm2y1kNmMJtKeACxWKmBbvNNkDWbs6kbI,2907
44
44
  sglang/srt/configs/dbrx.py,sha256=tdhIkXAQl1yr0MxqFmsDG1E0e2puRTTKm6UTyANBLac,11005
45
45
  sglang/srt/configs/deepseekvl2.py,sha256=21jZravchHcwyTQ5ROu1NzwI_eu-ngt3v8SRMm4XE0k,23327
46
46
  sglang/srt/configs/device_config.py,sha256=kfmpPOECqYxcRoY-ko0QZRhyiBWUGP2CMF51DMUN5nU,435
47
47
  sglang/srt/configs/exaone.py,sha256=Duxd4yQoKy8GWEzZD_kCY_OzmN_67CTJL_Kgn0eXk3g,10731
48
48
  sglang/srt/configs/janus_pro.py,sha256=-QtJ4ZGZiAJb0AkOEcuCHzIKLw23nF8nRk3rdCcoUO0,19016
49
+ sglang/srt/configs/kimi_vl.py,sha256=4W7VQI3pr888ZsFA2SqCQo4mI0seXTOrGQ-x3oTvWew,1358
50
+ sglang/srt/configs/kimi_vl_moonvit.py,sha256=hx2Rt4JSFbvy2HUTeLjBpge87m8M6ITAhqsgdNf_Jd4,1163
49
51
  sglang/srt/configs/load_config.py,sha256=qs-AxuplouBx2tsv9KGBOLZPbwzuVA4vbktbGP_cRp8,3309
50
- sglang/srt/configs/model_config.py,sha256=GtVEAqxcitVldxLroaHYwoILjfa--a2KmbcBMyyeF08,22421
52
+ sglang/srt/configs/model_config.py,sha256=xyVgImD3bvaDuDuGnWsB-Z81McWzs83Sju3M7J54f8A,23134
51
53
  sglang/srt/configs/utils.py,sha256=3nHUfisMs_Ltuhv8OZTNCJp63YJKJVF43h1QZB1zqx8,670
52
54
  sglang/srt/connector/__init__.py,sha256=czLX5JOxuMhH-T9eSJzoc1qv1B4z9chyffDRL5I6wo4,1247
53
55
  sglang/srt/connector/base_connector.py,sha256=i6i1TIzsz4NbSEkrdMPq-urb2sN2aLAx8dazga4gB9U,2833
@@ -90,12 +92,12 @@ sglang/srt/distributed/device_communicators/pynccl_wrapper.py,sha256=LblisImY9d6
90
92
  sglang/srt/distributed/device_communicators/shm_broadcast.py,sha256=bbruDIM1GgKIdB6gi71_I0mpB179I-qyvwKuSj1Kaic,20816
91
93
  sglang/srt/distributed/device_communicators/xpu_communicator.py,sha256=ajW6132BvA6jkeipEIgN27TFycI0U06Ih2Z8WNjlA4s,1593
92
94
  sglang/srt/entrypoints/EngineBase.py,sha256=xoyvp6XAeDLY2_Q2Ng33H-fRhrXHv2ldJJKd-HuDhqE,1870
93
- sglang/srt/entrypoints/engine.py,sha256=e5BPBIewPTQpYlk1c2eC4C_xyQgJ3mgNEm2Sg3GfV2s,22518
95
+ sglang/srt/entrypoints/engine.py,sha256=4S0ubmNIo8adkapEUOram1MXjkmyiBWXVoHCjXyHAIw,23430
94
96
  sglang/srt/entrypoints/http_server.py,sha256=vvyvCosUp5aTFlD8k4IyZDzj2yXQIsndhPkTl4u1nGc,29573
95
97
  sglang/srt/entrypoints/http_server_engine.py,sha256=ihA6y3GXRs28Y9U3SgdQcJQjnw_SVIby7QrVgiafX04,4846
96
98
  sglang/srt/entrypoints/verl_engine.py,sha256=XLYdwTwhH0jTjw8xczgZXWfBXMRb_ur2bg4TN0dTwfI,6975
97
99
  sglang/srt/layers/activation.py,sha256=oSkdo8B8najXFcVay3Y__CEvgXh87lAIhG0CMp2Ugqs,5954
98
- sglang/srt/layers/dp_attention.py,sha256=WJgXg_KyBzDHkwyfUFBowpDRFd0q5Q9LgEhqT-qT_ys,7549
100
+ sglang/srt/layers/dp_attention.py,sha256=I5cJnBT996mzjpNRrzcZXGt9j8nrkgD4A4T-BHiHkGM,7649
99
101
  sglang/srt/layers/elementwise.py,sha256=XCrR2i-9dP-H6jQo2zUuquwZrsl_wEQqj5Wxk6WUf7o,13987
100
102
  sglang/srt/layers/layernorm.py,sha256=2XEaRK9e6syWO3YLcqWqlR7hZ5R-CFDqbCII-zntQLM,5957
101
103
  sglang/srt/layers/linear.py,sha256=nC9MxJrFap1BEyqgFlBySH4IeQruIbcBp32cOhUl5Fw,52149
@@ -106,14 +108,15 @@ sglang/srt/layers/radix_attention.py,sha256=F71GgDes_fEt_cHxR9HM2QhNG5u7uF4zDAuL
106
108
  sglang/srt/layers/rotary_embedding.py,sha256=eVBwYvGpFhL1KyyPutQuZotmvSpChcxzyhpmcbQ6cKQ,48267
107
109
  sglang/srt/layers/sampler.py,sha256=PNgMXm2vsNsE6Rt89R5GLDC3lDxdIujoWli8F3vldng,11384
108
110
  sglang/srt/layers/torchao_utils.py,sha256=Ws24FdRBSkTpyeyA6bQrdDm-W5wfDxKvSIPUSahyMfA,4063
111
+ sglang/srt/layers/utils.py,sha256=tkTz86DFZ4NRMEUc4QkYNskUskdxXoEqkWqaMGbhP7E,1045
109
112
  sglang/srt/layers/vocab_parallel_embedding.py,sha256=QUxd4sELx6p3dHvEKmccPZ-phdd_9EjNdwjH3SJ9zxI,22238
110
113
  sglang/srt/layers/attention/base_attn_backend.py,sha256=lGujcYJ_CxHJy0Q9L6Phn3ds-nBGMy0OGj3R54R65iQ,3334
111
- sglang/srt/layers/attention/cutlass_mla_backend.py,sha256=kqtTVCIgDhcW5y9iWP8xcwGPuev-V5ipAUG-Ae3ot7g,9883
114
+ sglang/srt/layers/attention/cutlass_mla_backend.py,sha256=kCNn5Ub0jCsFjhVhuE-9qK53gu5a9oMStMeT2lcc6CU,9904
112
115
  sglang/srt/layers/attention/double_sparsity_backend.py,sha256=2ZRL_gYz14idoVqQzeQ6N77nXer0f_8_TUYw40XUUz0,9161
113
116
  sglang/srt/layers/attention/flashattention_backend.py,sha256=ysJt9pJ8pg_kVxvVUTvUL22-O7ABHCenLGGcqCotD6A,83206
114
- sglang/srt/layers/attention/flashinfer_backend.py,sha256=YtMTgMhxxNrAbSoWTPJczgY4SR3WjnAPXPoJ2d5PUZY,46394
115
- sglang/srt/layers/attention/flashinfer_mla_backend.py,sha256=pnVhvVEK87iFW8gUb1G7X7c1tqro8R2DSEOFCnlV8Bo,30301
116
- sglang/srt/layers/attention/flashmla_backend.py,sha256=IyE4w7GcNOxjjy3mQeuAMjPtBNvI-6JkoxvBlFxFvec,10270
117
+ sglang/srt/layers/attention/flashinfer_backend.py,sha256=4TavTj9AH4aVccsnDbulYnJ0hKcHgWm9gpNtcbsf2kI,47099
118
+ sglang/srt/layers/attention/flashinfer_mla_backend.py,sha256=LBMAeC1OFEQ6hjN1GHpaURrM-yWKC_lxTqqERvvehJ8,30616
119
+ sglang/srt/layers/attention/flashmla_backend.py,sha256=wR0bkLz3mj5EfuHEi9fwEP2vtq6xFhsrIijpFb009o4,10340
117
120
  sglang/srt/layers/attention/torch_native_backend.py,sha256=K5hUqBgakk2COSQqsaxWs0yEVOHS-7BlOygZTOeI8kE,9444
118
121
  sglang/srt/layers/attention/triton_backend.py,sha256=oEEiUwHbm4rNw5ExbQ2c3n0TwAgkk77yuLFenj9bHOo,26902
119
122
  sglang/srt/layers/attention/utils.py,sha256=rxB4sbNIHDTges78bDbnpd_hUgtyb3e16wUwgI4WmoU,2751
@@ -129,9 +132,9 @@ sglang/srt/layers/moe/topk.py,sha256=K-VU64nWBV07bu1Okn-uYbhz9gylq-KFNRYn2SFzu28
129
132
  sglang/srt/layers/moe/ep_moe/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
130
133
  sglang/srt/layers/moe/ep_moe/kernels.py,sha256=ijqRzS-tb0LGnDU5hW-g0JH104ppADrWaUIDGxb9Feo,22919
131
134
  sglang/srt/layers/moe/ep_moe/layer.py,sha256=SZ0shPwgDp7xj-TCv9bfg5O7f2AXjF6xmBP5xkZ0Ips,36440
132
- sglang/srt/layers/moe/ep_moe/token_dispatcher.py,sha256=zQV7Qr-Zrcr3D3efVvZepRQM02bj5djHPsijPssavk8,20430
135
+ sglang/srt/layers/moe/ep_moe/token_dispatcher.py,sha256=zqZCOsBk-fNRQHxmgt8XSgUG6AJjdKFRgJZ4YtuItJ4,20383
133
136
  sglang/srt/layers/moe/fused_moe_triton/__init__.py,sha256=h9yMFAL_bagUf-qBED8gSWdCOb7d8IdA-pE-L_nIg8E,842
134
- sglang/srt/layers/moe/fused_moe_triton/fused_moe.py,sha256=13ygSeBoRkiqsERSHOIbIxLplVsSl-SUT6JxYPB-ViM,55968
137
+ sglang/srt/layers/moe/fused_moe_triton/fused_moe.py,sha256=HJerp49tivE-IBZpy9JQs0UMx4goPGGO6gU6RINe2rk,55930
135
138
  sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=BMOV76fabrZcoyDmRpRbH11Jc0ogWH2k2QAQwvZIpgI,25084
136
139
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json",sha256=iNGsE2ZeVnQEnN4A8UJ9Jv0d3hbRF2MJ9oBgjup5Szk,2737
137
140
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB.json",sha256=JJN0hryyLr5Zv3dSS7C8cPFhAwTT6XxUVnBGMZvV6JA,2752
@@ -144,14 +147,18 @@ sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=BMOV76fabrZcoyDmRpRbH11Jc
144
147
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=1,N=3584,device_name=NVIDIA_A100-SXM4-80GB.json",sha256=yf33YmWlVSjjyg0Q4OMAWvc9gjRxvttMrQBUEOfPl4I,4153
145
148
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=1,N=7168,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json",sha256=ZWMClYN1moVRUP2f0hYac38di_pUgZggyl9d2D5rnoc,4136
146
149
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=1,N=7168,device_name=NVIDIA_A100-SXM4-80GB.json",sha256=C65Q2Mv1LxFQ_qDnv11IZ9nwl7sGZo72nWDflMttu4g,4147
150
+ "sglang/srt/layers/moe/fused_moe_triton/configs/E=128,N=192,device_name=NVIDIA_A800-SXM4-80GB.json",sha256=T-_T-oW4qpjTIBaGVxukJksRE7Yg8m9HNHgJ2XmR3aI,3242
147
151
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=128,N=192,device_name=NVIDIA_H100_80GB_HBM3.json",sha256=I3k416HbXU_rYb8scD8gAI4fuBlElHl06PM347Qa11w,3253
148
152
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=128,N=192,device_name=NVIDIA_H20.json",sha256=RgV8C4F1LO09h01YsgF_eqX6GNoBtC7ulPfJRUUbg_g,3241
149
153
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=128,N=192,device_name=NVIDIA_H200.json",sha256=nsNEuDNks0tVLfQfIm7xxFwEeptTfQcoa9fJy0NS8xQ,3247
154
+ "sglang/srt/layers/moe/fused_moe_triton/configs/E=128,N=384,device_name=NVIDIA_H100_80GB_HBM3.json",sha256=R4gBc3sMY5QwOtcGwGKdk2Ak4UsUbBd3jDUeKKk0O1U,3257
150
155
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=128,N=384,device_name=NVIDIA_H20,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=qbqjisJ4oKmcYzumHPRk5UyOzsdi8J6xas82UWHMeAI,3263
151
156
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=128,N=384,device_name=NVIDIA_H20.json",sha256=vS2DRIDOqWyiBvbG6H746ownfkD1F8Aj2YZ0ET9xll8,3232
152
157
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=128,N=384,device_name=NVIDIA_H200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=1n5XyZZ5sKAi-Z1duWOhLUfr6gkvnOpvxfbqIT6iU_4,3265
153
158
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=128,N=384,device_name=NVIDIA_H200.json",sha256=xqhl748it8GV2KXX0XixitE_ywnsKksqK8AGL7tAgT8,3254
154
159
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=128,N=512,device_name=NVIDIA_H100_80GB_HBM3.json",sha256=FsWbV4Q6AzAtgegVuENBDz2ZcSJsqNiwUIVfQbpP7hQ,3244
160
+ "sglang/srt/layers/moe/fused_moe_triton/configs/E=128,N=768,device_name=NVIDIA_A800-SXM4-80GB.json",sha256=T5rXJOZYNEs_3hE8g3ch802DnySbNiIqdn0s0RlJr8U,3249
161
+ "sglang/srt/layers/moe/fused_moe_triton/configs/E=128,N=768,device_name=NVIDIA_H100_80GB_HBM3.json",sha256=9L5C8VcSsiUr5XryXB1AO3DknlAQowp6DU6S7OSzEA0,3248
155
162
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=128,N=768,device_name=NVIDIA_H20,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=IuvyC8TNhCVAmUZfLSoETsyCKsmejKXrs_0zuwFLPAU,3265
156
163
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=128,N=768,device_name=NVIDIA_H20.json",sha256=10Ntu2aVD5vGLonx-jW0qNw-tgZWdZmzMGx7utDVeng,3237
157
164
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=128,N=768,device_name=NVIDIA_H200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=pdQ1RvXvdWDn8Y8-8MAX3vn-T-wbtkZvHV9GZZvNjnc,3266
@@ -280,11 +287,11 @@ sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=BMOV76fabrZcoyDmRpRbH11Jc
280
287
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=8,N=8192,device_name=AMD_Radeon_Graphics,dtype=fp8_w8a8.json",sha256=-RzUWSIAAsg6iA-8SPMa68hPpBVoUyMJs3dLP7edRu0,4323
281
288
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=8,N=8192,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json",sha256=sY2nWMPh9lsIkhPCjkHO245wpnfFbrHmzdcZDVFPVww,3265
282
289
  "sglang/srt/layers/moe/fused_moe_triton/configs/E=8,N=8192,device_name=NVIDIA_H200,dtype=fp8_w8a8.json",sha256=Uz5X80VcNBOaxshwVNUEittHk2zqB4HQCfTJ4TPG5aM,3274
283
- sglang/srt/layers/quantization/__init__.py,sha256=UOQcyCvKFkX0u_OPPex7X5X98iUR3lXgBnLbffu0n9g,12424
290
+ sglang/srt/layers/quantization/__init__.py,sha256=WVaItwaovrn-tZiAK0Wvs5RkV_yXi88K4z3xHB44Wf8,12424
284
291
  sglang/srt/layers/quantization/awq.py,sha256=KemDG55U3B6YZVjMV71awVAIj0islFvtxcUHmOBeGy0,6739
285
292
  sglang/srt/layers/quantization/base_config.py,sha256=jWk_egQrVNMYmQgbTI9vkcgzScLFjB5_sywFlAfE5J0,4776
286
293
  sglang/srt/layers/quantization/blockwise_int8.py,sha256=cu9-JiCZDfMfvB97Kv_-eEG87VX5bRFIllFkzpO_xIg,15122
287
- sglang/srt/layers/quantization/deep_gemm.py,sha256=UFzsd0iiqVTBo0Ow_6ylVVFK8B9EUWTNQQYGvsNfm2s,13129
294
+ sglang/srt/layers/quantization/deep_gemm.py,sha256=VmSSrhswu_vL0ecmQaBZsBTPYSX5OfjxVBgCGYXLUug,13141
288
295
  sglang/srt/layers/quantization/fp8.py,sha256=da-6ji_HBISKwIgMMX-JGlDKMLi-qL9j2XLer5cFAsU,40945
289
296
  sglang/srt/layers/quantization/fp8_kernel.py,sha256=C2_hOLRO27-Yvjy-Nm2niehD2gWSMuP6TnNX07ESqh4,32018
290
297
  sglang/srt/layers/quantization/fp8_utils.py,sha256=vqH-bMb2DD0A7Y7hZjN-TGTg5h6aJ-cLW9H2adyZzqk,18651
@@ -457,10 +464,10 @@ sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a
457
464
  "sglang/srt/layers/quantization/configs/N=7168,K=256,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=PD4AJYCkHfy2ivv9baMouFXzBTy0eKMumbAfxfm91HI,3256
458
465
  "sglang/srt/layers/quantization/configs/N=7168,K=256,device_name=NVIDIA_H20,dtype=int8_w8a8,block_shape=[128, 128].json",sha256=FImA-TJ_tQDjqwoNWxS--sRDoKDXf9gamlME3tkxH58,3252
459
466
  "sglang/srt/layers/quantization/configs/N=7168,K=256,device_name=NVIDIA_H200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=FFBjSWlpKXMxfAUUYUqXbOK_Hd7qBeBsfbcaa9uB4qY,3249
460
- sglang/srt/lora/layers.py,sha256=cu1kqDCuH05ck8HVtwmVuMVBzcPJZeDY3mk486teB4E,11848
467
+ sglang/srt/lora/layers.py,sha256=xdP2Gwlw9PCPZBhujGqO6aBn0eGxpVeIBFUp1LIGCto,13119
461
468
  sglang/srt/lora/lora.py,sha256=uNvbjZ_Wr1SLI9-ElRJA_JKwkibSGroP5Bfpsr9MI-Y,7527
462
469
  sglang/srt/lora/lora_config.py,sha256=qDgMTx_69jyJUl29O5FxLzYa0BMhqYVXWXfyyVOvGm0,1684
463
- sglang/srt/lora/lora_manager.py,sha256=nyqkm7RLoQE6myfqcH9r0zwME4aEZ3pFkVjY36QTlvA,9200
470
+ sglang/srt/lora/lora_manager.py,sha256=u8jwO1IeAb7zE47YU-2fXwx7RmxXaYCc39uJxvYHoHY,11797
464
471
  sglang/srt/lora/mem_pool.py,sha256=xUFoHUDJgX9lt2YugD9HUY5tIMnJiazYMZ6LYqSGv-E,9633
465
472
  sglang/srt/lora/utils.py,sha256=GjEBgsGhDhX4NqVqeaciznQ8RotKZmb2c-nw4YMLHxA,5251
466
473
  sglang/srt/lora/backend/base_backend.py,sha256=EIz8I-GIrdmK4fISw3ENhbJVVITaxKfyLxHXGPU4fPs,5044
@@ -473,26 +480,27 @@ sglang/srt/lora/triton_ops/sgemm_lora_a.py,sha256=ZmWEqHJaorRNNj-c_ZXPi_pX8X_yIA
473
480
  sglang/srt/lora/triton_ops/sgemm_lora_b.py,sha256=Q58UzWUb3QFqY_ZxWA3poN373N0Hwkks5AQRKIuvFC8,4517
474
481
  sglang/srt/managers/cache_controller.py,sha256=d4RGqbut1FlzJnpqr7WY_TYmRjYPS07OoOVbztjs5xI,18959
475
482
  sglang/srt/managers/configure_logging.py,sha256=fOJaXAQ1n9m-8KPJndpsKvS885i69SMafoEADLIVfIM,1633
476
- sglang/srt/managers/data_parallel_controller.py,sha256=Oo-0sbF0W1fcpw88-iKH_7pttYjWl8IHCePcuF3rU5c,10894
483
+ sglang/srt/managers/data_parallel_controller.py,sha256=UgMruoTjQDWDCZK7ATmmgNrrY011pDqrFGl4vJdBpKU,11677
477
484
  sglang/srt/managers/detokenizer_manager.py,sha256=3S3aRvKSi75RQSxEEQkeyxKDNNunWiw9wlwsbT1VXSo,10099
478
485
  sglang/srt/managers/expert_distribution.py,sha256=r3o5RGI0gnV7xb60AApqKYa0oiSB37oB7hQBX7P3xZM,3225
479
486
  sglang/srt/managers/io_struct.py,sha256=9mdBGOkblguT1x6Ds9wL3j0MWAQiUQVdVRL4a7IUnA4,31631
480
487
  sglang/srt/managers/mm_utils.py,sha256=JTu5B7jZWTtZi8LCpVa6ITvSToxcuf5PDbb3FJC9M6o,18089
481
488
  sglang/srt/managers/multimodal_processor.py,sha256=XlRYvNhF6XOssreRX9DZPhLSpps_VE62gSKw3EGdNPo,2088
482
- sglang/srt/managers/schedule_batch.py,sha256=zUQGVjLbi9TK5tfyzHNMSAnPeNeFi9GFI2AC8Fr2pbo,63824
489
+ sglang/srt/managers/schedule_batch.py,sha256=E_Q3v4F7oioPqQFu891NlY_UK-9O6dJ7GnitjnKa1LU,64272
483
490
  sglang/srt/managers/schedule_policy.py,sha256=E1qVq2G3jptKdX9nlqfayeRBUll9xB6bK8nBf3EW32E,19469
484
- sglang/srt/managers/scheduler.py,sha256=7o03npmnu775d1DRDAkTJjl8OuJlE_xuM3BQji6BYLI,80808
485
- sglang/srt/managers/scheduler_output_processor_mixin.py,sha256=GxdkTR24_P_2C3ib0dc7Xqklrz8SiHtUTlM0c7AlKlk,26754
491
+ sglang/srt/managers/scheduler.py,sha256=OuSUf31bxFSx4tUbNggAX3DyIfD4iuJoLwJbyp5Py64,89816
492
+ sglang/srt/managers/scheduler_output_processor_mixin.py,sha256=15Eicph3bPVuBMPsMPOLReNc2Kmi6m1WXlq0UbYtj9g,26773
486
493
  sglang/srt/managers/session_controller.py,sha256=o-ifit0n4_xHLNmyD0Ams8FxGRgxFybX-Vz1hwgr3UQ,5755
487
494
  sglang/srt/managers/tokenizer_manager.py,sha256=4l4PAvfQrJqlYADQbl7cgpLhBBY52pzI5AzRYIzAjLs,50693
488
- sglang/srt/managers/tp_worker.py,sha256=LhbhCovDvab6Cx4faR88s4q_3D-Di9s5sKCndsDxF9E,8966
489
- sglang/srt/managers/tp_worker_overlap_thread.py,sha256=lkG_yN6_UEv5mhmZ7cKP7_A5sIVMQw1GPwkqM91EWSE,9304
495
+ sglang/srt/managers/tp_worker.py,sha256=zo9OLsBABpBUyBgTKPPcDhtrLkRB_edyN9ANzGz_Pzc,10228
496
+ sglang/srt/managers/tp_worker_overlap_thread.py,sha256=PyBiUdHeh1Z_o_R34lNB28SBjqTP4nArNCQhX0O6K2M,9440
490
497
  sglang/srt/managers/utils.py,sha256=5i75uLlQOF_5CaT02CrWtwozMTtwTg2_nLP8Dtr-JZQ,1536
491
498
  sglang/srt/managers/multimodal_processors/base_processor.py,sha256=ata9H6Ry4QfqBoA_g0auG0sMnKfGrlZn74lM77ihtiA,10172
492
499
  sglang/srt/managers/multimodal_processors/clip.py,sha256=lRc2mcuDbAhZVf-0EfkO81pqDiol9zLvTpDqtPIBQ2k,1525
493
500
  sglang/srt/managers/multimodal_processors/deepseek_vl_v2.py,sha256=hpjpGFzlRBQ8Xv08i37X_VUhnDp_Qm2xD1_F17vK8fI,3253
494
501
  sglang/srt/managers/multimodal_processors/gemma3.py,sha256=G52ck_3UQGeyrtvjLqI8B0Tm8iNsyB_ahiMTAvx083U,2191
495
502
  sglang/srt/managers/multimodal_processors/janus_pro.py,sha256=UJoKQWsoU9kittKDwjWbG2KC12wSA-4A3DpTPhA6VoI,1854
503
+ sglang/srt/managers/multimodal_processors/kimi_vl.py,sha256=vC9OeS7gVTHzazbluiQ1I0QRKqszlqK75ghUA1rmUNc,2490
496
504
  sglang/srt/managers/multimodal_processors/llava.py,sha256=8mac3vUUpVd12o43k1TyMaLEySZB915ks8Q5epeZmbg,6209
497
505
  sglang/srt/managers/multimodal_processors/minicpm.py,sha256=uEnlsImjHBOMVNGlfBGpn1zCDLNeMY58HvJ7ZthL2N4,5698
498
506
  sglang/srt/managers/multimodal_processors/mlama.py,sha256=MLiGS606LzVtdoXvjWGANx-K_7nE9J_fMVmkXN7Gz8k,1661
@@ -502,14 +510,14 @@ sglang/srt/mem_cache/base_prefix_cache.py,sha256=NY62Zo0A0tLJ7ObRLOQqQcXCxoJUDZs
502
510
  sglang/srt/mem_cache/chunk_cache.py,sha256=it5SfL1FwMbrdeOH-I-Eu_i-I9hFB1xL-z_brIUoCkk,1835
503
511
  sglang/srt/mem_cache/flush_cache.py,sha256=GYcxmNXh4hsMpFfNOuCTpKilW7guZwTtAg_usVeM3J0,979
504
512
  sglang/srt/mem_cache/hiradix_cache.py,sha256=BJR-R2u5YyYIhGIxTY-3rf8Vx60XjCRU8Yhmkn2fzzM,16597
505
- sglang/srt/mem_cache/memory_pool.py,sha256=J2eAAefAl0TIejH7h-hwz_ak_T-fSh_e45tUNrhX0BE,34599
513
+ sglang/srt/mem_cache/memory_pool.py,sha256=ZJYAceAtEv326tYERXsHeBy7_0HGnk_jpfEKJTJwPMU,36260
506
514
  sglang/srt/mem_cache/paged_allocator.py,sha256=BrJS0vN1k-vTSgb_M8u_1KoZFRgzgR1WRyImCTq3T0U,9770
507
515
  sglang/srt/mem_cache/radix_cache.py,sha256=Lm-pco6CJ4orb9IfDpbHm5MnyK8Ya0OF1x9p88dv548,14906
508
516
  sglang/srt/metrics/collector.py,sha256=zHg4twFQJvuK1mSme3-EYQa9PJryfp_u7a4RxQ5RcO0,8874
509
517
  sglang/srt/metrics/func_timer.py,sha256=VFyNRrbnKVCwnQsrlLin1lITJfjQpf9m8sGPqL5LIsQ,3438
510
- sglang/srt/model_executor/cuda_graph_runner.py,sha256=iFryO9dglpnFCoNWxZqKdUhQycT8In29C0kIba3G1Dw,23687
511
- sglang/srt/model_executor/forward_batch_info.py,sha256=T9B5vWaJwlKUH0fQTPe3XdbkTYEUI6iKxBxUHs-cAMM,26632
512
- sglang/srt/model_executor/model_runner.py,sha256=O4vKZ4c-u69ZeKPBjAfiunvtnQHskZVmbUUK4fKFb5E,46417
518
+ sglang/srt/model_executor/cuda_graph_runner.py,sha256=ISDLqpJZ0_WjX2IqWt6yASy4yLMUchVc9-6J_bK-UBY,26208
519
+ sglang/srt/model_executor/forward_batch_info.py,sha256=Kz30RuEjuOAN9_8hlvvknF4qeohyas7NrS90FCRtIMg,27730
520
+ sglang/srt/model_executor/model_runner.py,sha256=FYNlATMIQ-zC_NDqpWu3hBu7A-rxhgaPqF029U7txvo,48596
513
521
  sglang/srt/model_loader/__init__.py,sha256=zGZkOBz1zx-pkaIy47BasL3fjDlAcxAXUTjInOhXHAE,919
514
522
  sglang/srt/model_loader/loader.py,sha256=YYmtvkQw0B1qgPw0_gN-K4yy7CEYbTSR__0Dl1Fnm6k,55342
515
523
  sglang/srt/model_loader/utils.py,sha256=0NaMR67fESFopaklmsleiL27XH1QUrjZW246MUu1EJ0,1369
@@ -522,8 +530,8 @@ sglang/srt/models/commandr.py,sha256=5Y_b3K0QY7D37nFGkyiGgY38RleRui_GJUYcHSuHUZo
522
530
  sglang/srt/models/dbrx.py,sha256=4pn_fdoATg01VEqNnIAxNEsKV5XU7gwHyd289eydq1s,15598
523
531
  sglang/srt/models/deepseek.py,sha256=ZnN02HdgXCB23Vno5V9UMUoOxH5HC82vNTwsVulUJ-o,17206
524
532
  sglang/srt/models/deepseek_janus_pro.py,sha256=8wAzvcGdyo--3faMN4QtagT1eAZMhMFduvpCXqUS48Q,70456
525
- sglang/srt/models/deepseek_nextn.py,sha256=XW0PJAvUVx5i1F6liNMooopj833qyQ4Y4ujn3iJDDak,17825
526
- sglang/srt/models/deepseek_v2.py,sha256=6fEihiaHcl9tjawa1GnCKGIappuLnDfmmVChhPswSIU,71820
533
+ sglang/srt/models/deepseek_nextn.py,sha256=ptShwRSOLQbFRU1lJ_uHL1byA8z9d-YKAH4eEiLXPeM,6249
534
+ sglang/srt/models/deepseek_v2.py,sha256=1RJvBzWWTOYJ1U7s65xK1V15QFvJv7mfkNTIYgape-w,73943
527
535
  sglang/srt/models/deepseek_vl2.py,sha256=j8BdxZsMjm6lPdbDipEIKhVIVywCP1Vl1Kl46BZ5_0Y,13147
528
536
  sglang/srt/models/exaone.py,sha256=rX7J0xFt9TSt6tMIhnYMkb5KDnqTJIV4BtjPLFwQ8_8,13425
529
537
  sglang/srt/models/gemma.py,sha256=4cdrPISg1VKnsuI-QPTpYvet4BrX8BMKvCIN82iLskw,12641
@@ -537,11 +545,13 @@ sglang/srt/models/granite.py,sha256=5WOJyNYAlt5RNHSexNfPNihhSxIMd7wPzju1cTixKig,
537
545
  sglang/srt/models/grok.py,sha256=vESZeGS4adI_JAerXIkCcTm15-CNiGeS7VHc36C6w1A,28033
538
546
  sglang/srt/models/internlm2.py,sha256=RDAT9drjdgVEFmCMq99RTn3weMQFhl1NHhkhyDX8f7M,13056
539
547
  sglang/srt/models/internlm2_reward.py,sha256=ndfGmyqYZbVZ7C7rJ-v9oK3wa-EpoBGybS8MlyKZi2E,2522
540
- sglang/srt/models/llama.py,sha256=Y4ROe8ohP84G4vin_Sr_vjG0XRoM5gGgnrojxOXn_uc,24942
541
- sglang/srt/models/llama4.py,sha256=idwV_rEJ_tPMD1iLQzvaJqmux-Osoa3bc0g04VYgu1w,17867
548
+ sglang/srt/models/kimi_vl.py,sha256=YoM6CmrF4ZS0SsXKiR-_SfylKhd87ciJjno6_x5LG4o,12874
549
+ sglang/srt/models/kimi_vl_moonvit.py,sha256=M5L7AJOJ2Zh2pqLZAq8aRqhbTSlipr8XOoD3ix6o2sU,23908
550
+ sglang/srt/models/llama.py,sha256=45bs_qVp53RmnU-zXaHrj2vvhxvmBsWgEemnBtvI8_k,26978
551
+ sglang/srt/models/llama4.py,sha256=xopptG6PXpnGKCMX-o4QAfiWpDpyLUicTPsQKm1rorI,17942
542
552
  sglang/srt/models/llama_classification.py,sha256=4QWTFaUZIFKYZvEzs8bx8VkOZNIwdYCLrnwrdAw4QK0,3108
543
- sglang/srt/models/llama_eagle.py,sha256=OB2lKsjn7BcfCZljklnhk83me8j0PuQmYLou7baNcq4,4866
544
- sglang/srt/models/llama_eagle3.py,sha256=v3bftBVDIGjnzngQYnu19cy0J_3w7yruHqLP5nsAQDM,6642
553
+ sglang/srt/models/llama_eagle.py,sha256=Ubh_jmtfiOnriwvHgQT0ZGID7JvYvdSi_QGHOIkEgPE,5028
554
+ sglang/srt/models/llama_eagle3.py,sha256=KCvUrWn17t7T28G60HwMyy99iB9AbdbPnS2el9n3r6o,6804
545
555
  sglang/srt/models/llama_embedding.py,sha256=zq-_lNu35VBFc7eemiam0zdkGIE8fzrgk5OWYfirZnA,3254
546
556
  sglang/srt/models/llama_reward.py,sha256=LF2nqMV5XOrljGjAwJg43mBv3z6Q040I2EYlgZeCp8k,4681
547
557
  sglang/srt/models/llava.py,sha256=KMwNNrlMuMaKEOZMDRBKBQbe6uctpKTLc0zOceyGC34,27242
@@ -564,11 +574,11 @@ sglang/srt/models/qwen2.py,sha256=ab912Yyk0aXOzI-wrxqN-sNF3bTVkNxB8P2uNcOCv9U,16
564
574
  sglang/srt/models/qwen2_5_vl.py,sha256=mqgmDHleJN3GmuZG1pUSpIZYKO1omTsa8P5MXYULAGM,22462
565
575
  sglang/srt/models/qwen2_classification.py,sha256=dGrMm4ebd30_lBhHOhaV57ig2iOTx3nqB4GEzsrRIM8,2747
566
576
  sglang/srt/models/qwen2_eagle.py,sha256=Iz0HWL2FgSD3FqoFhfYmbIZeEYkPTJ96lYbkncmHJX4,4644
567
- sglang/srt/models/qwen2_moe.py,sha256=bmS2pyHD5zQo5plTCzAo_mjnahVtJ1jaRSURX1PlQC4,18313
577
+ sglang/srt/models/qwen2_moe.py,sha256=iG0d2WwUosOFR9w2YGM9CfvZ1NG-rhse3OUTwSs8a6Q,18567
568
578
  sglang/srt/models/qwen2_rm.py,sha256=-mQXDEv11p-I1HXgYLTtY6ROem6UYorO958WsDrzsgs,2837
569
- sglang/srt/models/qwen2_vl.py,sha256=tgES87Rmdl7hqMLAnxYqpWerxK28n5UY7Ma5309TPqs,21408
579
+ sglang/srt/models/qwen2_vl.py,sha256=EaDBXbzeIToYUUzs0yyByXE66-G1BCfATXJgkaHa-PE,20975
570
580
  sglang/srt/models/qwen3.py,sha256=reaowGkotYAGHS5zTCWrvnyxtu92QKus19n-2amtMa4,12358
571
- sglang/srt/models/qwen3_moe.py,sha256=Tee7oW6Xvo2pV_Q93y-HKykBFiPjo_-YfeIsIelB3hA,15623
581
+ sglang/srt/models/qwen3_moe.py,sha256=A9Z3OhJqld1sJUDsHymgGxib4lMCMTKxF8iIzHDGdNo,15877
572
582
  sglang/srt/models/registry.py,sha256=inKh9iwOp3LFYm3nqujg-OtABClOP-ifc1stA9cZegA,3434
573
583
  sglang/srt/models/roberta.py,sha256=Zgd35och3pW6TYrNeEoeOZ8qPfbFwB3ngThpVWSPBcY,6320
574
584
  sglang/srt/models/stablelm.py,sha256=0x_31uIr3WcWwecdPAI3ek9KkyKBJS7VwknTk2y0gjY,12281
@@ -576,8 +586,8 @@ sglang/srt/models/torch_native_llama.py,sha256=5tfFSMAXB3ScToqTALtCXa8Oo-qPCJh-K
576
586
  sglang/srt/models/xverse.py,sha256=DsNVI9JpzN4jj0Ry6aTrj7r-xq5YLOoDX2kH4YLJA-I,14035
577
587
  sglang/srt/models/xverse_moe.py,sha256=7KCM2-j12towDMNvXkuuYiBOmNauH6NG4Ip40x0khqA,16782
578
588
  sglang/srt/models/yivl.py,sha256=oToK7-u5IGO7xwpJIQ7VtudlK6-zPqJX4bt6_wv0SH8,4850
579
- sglang/srt/openai_api/adapter.py,sha256=7WMplmT0SWJXo5F8s1s3Q9_6WV_cTscMS1Bodbl9Xes,76746
580
- sglang/srt/openai_api/protocol.py,sha256=8Iu4t9JlH99QggKl55PYQWTW81u5mpOj0aA-bs44A_c,13621
589
+ sglang/srt/openai_api/adapter.py,sha256=mMaaN2hVhRARIzfXFfmqORYLO8bXUi-GCOJLZq0lYFg,77283
590
+ sglang/srt/openai_api/protocol.py,sha256=eTSp9x4uFABDxTYRnnftgoVSF5PWlkixnFTfQRyG0dM,14142
581
591
  sglang/srt/platforms/interface.py,sha256=hym3iooBB4C8if5hDZezgVN6h4NIOu7sg2ZUBIV6XmM,11246
582
592
  sglang/srt/sampling/custom_logit_processor.py,sha256=tDvoLgLqn-sy1qcY6vSrpbnHCeqbdk0uhMOO-uy4p4E,1099
583
593
  sglang/srt/sampling/sampling_batch_info.py,sha256=4LCowU2bk0TOSfIGpEy90N1SpTsiOKK8Rx1ZYcklUFQ,11988
@@ -590,13 +600,13 @@ sglang/srt/sampling/penaltylib/presence_penalty.py,sha256=NRh10AJrrQlGJ6S-enGdRe
590
600
  sglang/srt/speculative/build_eagle_tree.py,sha256=lt4sXUehPi26MT2-2Z0VivtF6AP7kirSaEO_u-YJ4J4,11670
591
601
  sglang/srt/speculative/eagle_draft_cuda_graph_runner.py,sha256=NviXdUvowQkV1kLs3eXLlxJx6UZzyQMZH03zCXpsIg4,9291
592
602
  sglang/srt/speculative/eagle_utils.py,sha256=iJYhklXHfDgEKbVB39HkVEea-XTEC60Z_LjIVjkrZQs,28701
593
- sglang/srt/speculative/eagle_worker.py,sha256=D4G8hnwtc8xQt1okG4TY9wYSXbKTqGVDAD22AUXW6pA,26824
603
+ sglang/srt/speculative/eagle_worker.py,sha256=MwsBbKyV-dCwzYlIpVcb-urk-GSdoe_kY8KHe5Gkw7A,26860
594
604
  sglang/srt/speculative/spec_info.py,sha256=rhaKG0TzyF9XZYHEWp1jccwTBohSNsUDvxHFtAoOl18,709
595
605
  sglang/test/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
596
606
  sglang/test/few_shot_gsm8k.py,sha256=7VLbWl4nCQs1wjtW4q-46jf9jUCycSs5Iw8v7sUSzBw,4284
597
607
  sglang/test/few_shot_gsm8k_engine.py,sha256=QQbrwOX6-cJDD3RZC_e7zPnt6aSo8JdF8X_lRHSjdDM,3886
598
608
  sglang/test/run_eval.py,sha256=9yO0hXZOcn4abEOs96T-XPguDEklK16Ltco0pGF3zCg,4020
599
- sglang/test/runners.py,sha256=vSOl38rVDR3l2ezVCs672vE-LcOA2rJHjlkhLgEjcz8,30260
609
+ sglang/test/runners.py,sha256=WWAu07NXSJV1y4W-iEi_iOCy1P5Ow9rL0ex-U969Nws,30417
600
610
  sglang/test/send_one.py,sha256=_l72sRfuXRUldyD3PD63hg_WxNvvhW5unNnbe4XuAwk,4380
601
611
  sglang/test/simple_eval_common.py,sha256=joqrGysuLnJFtzDRIgFkMsRyKUSyjVPFWp0_PHAL3Ik,12378
602
612
  sglang/test/simple_eval_gpqa.py,sha256=8Xt9Bw05c7SZTYrCZgB68OZUqUbLo69ywiyx0bTvSUk,3220
@@ -611,13 +621,13 @@ sglang/test/test_custom_ops.py,sha256=2bSo9P5_rJZYFq8Y8IKRimDfFyZZGJluhL7Ngny0Pf
611
621
  sglang/test/test_dynamic_grad_mode.py,sha256=L76yUCuk_ymNpXD2CmO8r2GiGjIvD_gtTsuFDs2NolI,1638
612
622
  sglang/test/test_layernorm.py,sha256=2GMWqqNDuGvSMSsEBF5eDCzwVSYA9E6hGhRo6s4ecKg,3764
613
623
  sglang/test/test_programs.py,sha256=VZ3vXtUDBnXz0M7gFdDH8hXg9Wa0j_qI8CVqjEgRN_E,18877
614
- sglang/test/test_utils.py,sha256=1U4Jtx_oz_UtS3SSJdqGuh3ujnj2g8pZjN5MYsbsBwI,32164
624
+ sglang/test/test_utils.py,sha256=WqLvYA2N18USdHWY2kKmrIixLtiOb3r4HJ2uT1kRu1o,32905
615
625
  sglang/test/attention/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
616
626
  sglang/test/attention/test_flashattn_backend.py,sha256=_rTG849FwQdVTyGKkqhczaOqngBmRWXFmkl5NnuK1GM,13914
617
627
  sglang/test/attention/test_flashattn_mla_backend.py,sha256=g4O50WblTpM7_Gq2b76k0i25_z01BOUBQ4i6PmyxpO4,10774
618
628
  sglang/test/attention/test_prefix_chunk_info.py,sha256=er0i3KGHMkw-4UZB1GCFd4oYwRcXfU5wpO1ORqpNGGA,7626
619
- sglang-0.4.6.post1.dist-info/licenses/LICENSE,sha256=FJXh51fvTQklojUFY89XVLsjxRcBqOxPs8XNy-2uZ0c,11346
620
- sglang-0.4.6.post1.dist-info/METADATA,sha256=UTh1TF2jiAdQunwLv7_bmww5_18c4uD7FCaeO-Z3gAs,25361
621
- sglang-0.4.6.post1.dist-info/WHEEL,sha256=ck4Vq1_RXyvS4Jt6SI0Vz6fyVs4GWg7AINwpsaGEgPE,91
622
- sglang-0.4.6.post1.dist-info/top_level.txt,sha256=yxhh3pYQkcnA7v3Bg889C2jZhvtJdEincysO7PEB09M,7
623
- sglang-0.4.6.post1.dist-info/RECORD,,
629
+ sglang-0.4.6.post2.dist-info/licenses/LICENSE,sha256=FJXh51fvTQklojUFY89XVLsjxRcBqOxPs8XNy-2uZ0c,11346
630
+ sglang-0.4.6.post2.dist-info/METADATA,sha256=XZjs979dHuGsAVGlpT-ZQd9msQWxI4mN1WTtmG6CPvo,25419
631
+ sglang-0.4.6.post2.dist-info/WHEEL,sha256=wXxTzcEDnjrTwFYjLPcsW_7_XihufBwmpiBeiXNBGEA,91
632
+ sglang-0.4.6.post2.dist-info/top_level.txt,sha256=yxhh3pYQkcnA7v3Bg889C2jZhvtJdEincysO7PEB09M,7
633
+ sglang-0.4.6.post2.dist-info/RECORD,,
@@ -1,5 +1,5 @@
1
1
  Wheel-Version: 1.0
2
- Generator: setuptools (80.0.0)
2
+ Generator: setuptools (80.1.0)
3
3
  Root-Is-Purelib: true
4
4
  Tag: py3-none-any
5
5