sglang 0.5.3rc2__py3-none-any.whl → 0.5.4.post1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (419) hide show
  1. sglang/bench_one_batch.py +47 -28
  2. sglang/bench_one_batch_server.py +41 -25
  3. sglang/bench_serving.py +378 -160
  4. sglang/check_env.py +1 -1
  5. sglang/compile_deep_gemm.py +6 -2
  6. sglang/global_config.py +1 -25
  7. sglang/lang/api.py +6 -0
  8. sglang/lang/interpreter.py +1 -0
  9. sglang/lang/ir.py +13 -0
  10. sglang/launch_server.py +10 -15
  11. sglang/profiler.py +18 -1
  12. sglang/srt/_custom_ops.py +1 -1
  13. sglang/srt/batch_invariant_ops/batch_invariant_ops.py +105 -10
  14. sglang/srt/checkpoint_engine/checkpoint_engine_worker.py +142 -0
  15. sglang/srt/compilation/backend.py +437 -0
  16. sglang/srt/compilation/compilation_config.py +20 -0
  17. sglang/srt/compilation/compilation_counter.py +47 -0
  18. sglang/srt/compilation/compile.py +210 -0
  19. sglang/srt/compilation/compiler_interface.py +503 -0
  20. sglang/srt/compilation/cuda_piecewise_backend.py +228 -0
  21. sglang/srt/compilation/fix_functionalization.py +134 -0
  22. sglang/srt/compilation/fx_utils.py +83 -0
  23. sglang/srt/compilation/inductor_pass.py +140 -0
  24. sglang/srt/compilation/pass_manager.py +66 -0
  25. sglang/srt/compilation/piecewise_context_manager.py +40 -0
  26. sglang/srt/compilation/weak_ref_tensor_jit.py +16 -0
  27. sglang/srt/configs/__init__.py +4 -0
  28. sglang/srt/configs/deepseek_ocr.py +262 -0
  29. sglang/srt/configs/deepseekvl2.py +194 -96
  30. sglang/srt/configs/dots_vlm.py +2 -7
  31. sglang/srt/configs/falcon_h1.py +13 -64
  32. sglang/srt/configs/load_config.py +25 -2
  33. sglang/srt/configs/mamba_utils.py +117 -0
  34. sglang/srt/configs/model_config.py +136 -25
  35. sglang/srt/configs/modelopt_config.py +30 -0
  36. sglang/srt/configs/nemotron_h.py +286 -0
  37. sglang/srt/configs/olmo3.py +105 -0
  38. sglang/srt/configs/points_v15_chat.py +29 -0
  39. sglang/srt/configs/qwen3_next.py +11 -47
  40. sglang/srt/configs/qwen3_omni.py +613 -0
  41. sglang/srt/configs/qwen3_vl.py +0 -10
  42. sglang/srt/connector/remote_instance.py +1 -1
  43. sglang/srt/constrained/base_grammar_backend.py +5 -1
  44. sglang/srt/constrained/llguidance_backend.py +5 -0
  45. sglang/srt/constrained/outlines_backend.py +1 -1
  46. sglang/srt/constrained/reasoner_grammar_backend.py +9 -6
  47. sglang/srt/constrained/utils.py +12 -0
  48. sglang/srt/constrained/xgrammar_backend.py +20 -11
  49. sglang/srt/disaggregation/ascend/transfer_engine.py +1 -1
  50. sglang/srt/disaggregation/base/conn.py +17 -4
  51. sglang/srt/disaggregation/common/conn.py +4 -2
  52. sglang/srt/disaggregation/decode.py +123 -31
  53. sglang/srt/disaggregation/decode_kvcache_offload_manager.py +1 -1
  54. sglang/srt/disaggregation/fake/conn.py +11 -3
  55. sglang/srt/disaggregation/mooncake/conn.py +157 -19
  56. sglang/srt/disaggregation/nixl/conn.py +69 -24
  57. sglang/srt/disaggregation/prefill.py +96 -270
  58. sglang/srt/distributed/device_communicators/all_reduce_utils.py +4 -4
  59. sglang/srt/distributed/device_communicators/custom_all_reduce.py +6 -6
  60. sglang/srt/distributed/device_communicators/pymscclpp.py +2 -2
  61. sglang/srt/distributed/device_communicators/pynccl.py +24 -12
  62. sglang/srt/distributed/device_communicators/pynccl_allocator.py +2 -2
  63. sglang/srt/distributed/device_communicators/symm_mem.py +1 -1
  64. sglang/srt/distributed/naive_distributed.py +5 -4
  65. sglang/srt/distributed/parallel_state.py +63 -19
  66. sglang/srt/elastic_ep/elastic_ep.py +74 -0
  67. sglang/srt/entrypoints/context.py +3 -2
  68. sglang/srt/entrypoints/engine.py +83 -80
  69. sglang/srt/entrypoints/grpc_server.py +430 -234
  70. sglang/srt/entrypoints/harmony_utils.py +2 -2
  71. sglang/srt/entrypoints/http_server.py +195 -102
  72. sglang/srt/entrypoints/http_server_engine.py +1 -7
  73. sglang/srt/entrypoints/openai/protocol.py +225 -37
  74. sglang/srt/entrypoints/openai/serving_base.py +49 -2
  75. sglang/srt/entrypoints/openai/serving_chat.py +29 -74
  76. sglang/srt/entrypoints/openai/serving_classify.py +204 -0
  77. sglang/srt/entrypoints/openai/serving_completions.py +15 -1
  78. sglang/srt/entrypoints/openai/serving_responses.py +5 -2
  79. sglang/srt/entrypoints/openai/serving_tokenize.py +144 -0
  80. sglang/srt/environ.py +58 -6
  81. sglang/srt/eplb/eplb_algorithms/__init__.py +18 -1
  82. sglang/srt/eplb/eplb_algorithms/deepseek.py +0 -2
  83. sglang/srt/eplb/eplb_algorithms/elasticity_aware.py +87 -0
  84. sglang/srt/eplb/expert_distribution.py +33 -4
  85. sglang/srt/eplb/expert_location_dispatch.py +2 -2
  86. sglang/srt/eplb/expert_location_updater.py +2 -2
  87. sglang/srt/function_call/base_format_detector.py +17 -18
  88. sglang/srt/function_call/function_call_parser.py +20 -14
  89. sglang/srt/function_call/glm4_moe_detector.py +1 -5
  90. sglang/srt/function_call/gpt_oss_detector.py +1 -1
  91. sglang/srt/function_call/json_array_parser.py +0 -2
  92. sglang/srt/function_call/minimax_m2.py +367 -0
  93. sglang/srt/function_call/utils.py +2 -2
  94. sglang/srt/grpc/compile_proto.py +3 -3
  95. sglang/srt/{entrypoints → grpc}/grpc_request_manager.py +112 -52
  96. sglang/srt/grpc/health_servicer.py +189 -0
  97. sglang/srt/grpc/scheduler_launcher.py +181 -0
  98. sglang/srt/grpc/sglang_scheduler_pb2.py +78 -70
  99. sglang/srt/grpc/sglang_scheduler_pb2.pyi +66 -10
  100. sglang/srt/grpc/sglang_scheduler_pb2_grpc.py +89 -1
  101. sglang/srt/layers/activation.py +10 -1
  102. sglang/srt/layers/attention/aiter_backend.py +3 -3
  103. sglang/srt/layers/attention/ascend_backend.py +17 -1
  104. sglang/srt/layers/attention/attention_registry.py +43 -23
  105. sglang/srt/layers/attention/base_attn_backend.py +20 -1
  106. sglang/srt/layers/attention/double_sparsity_backend.py +2 -2
  107. sglang/srt/layers/attention/fla/chunk.py +0 -1
  108. sglang/srt/layers/attention/fla/chunk_o.py +1 -1
  109. sglang/srt/layers/attention/fla/index.py +0 -2
  110. sglang/srt/layers/attention/fla/layernorm_gated.py +50 -32
  111. sglang/srt/layers/attention/fla/utils.py +0 -3
  112. sglang/srt/layers/attention/fla/wy_fast.py +0 -2
  113. sglang/srt/layers/attention/flashattention_backend.py +24 -10
  114. sglang/srt/layers/attention/flashinfer_backend.py +258 -22
  115. sglang/srt/layers/attention/flashinfer_mla_backend.py +38 -28
  116. sglang/srt/layers/attention/flashmla_backend.py +2 -2
  117. sglang/srt/layers/attention/hybrid_attn_backend.py +1 -1
  118. sglang/srt/layers/attention/hybrid_linear_attn_backend.py +165 -62
  119. sglang/srt/layers/attention/intel_amx_backend.py +1 -1
  120. sglang/srt/layers/attention/mamba/causal_conv1d.py +1 -1
  121. sglang/srt/layers/attention/mamba/causal_conv1d_triton.py +9 -5
  122. sglang/srt/layers/attention/mamba/mamba.py +189 -241
  123. sglang/srt/layers/attention/mamba/mamba2_metadata.py +211 -0
  124. sglang/srt/layers/attention/mamba/mixer2_rms_norm_gated.py +120 -0
  125. sglang/srt/layers/attention/mamba/ops/ssd_bmm.py +0 -50
  126. sglang/srt/layers/attention/mamba/ops/ssd_chunk_scan.py +0 -60
  127. sglang/srt/layers/attention/mamba/ops/ssd_chunk_state.py +0 -111
  128. sglang/srt/layers/attention/mamba/ops/ssd_combined.py +0 -1
  129. sglang/srt/layers/attention/mamba/ops/ssd_state_passing.py +0 -11
  130. sglang/srt/layers/attention/npu_ops/mla_preprocess.py +1 -1
  131. sglang/srt/layers/attention/nsa/nsa_indexer.py +40 -83
  132. sglang/srt/layers/attention/nsa/triton_kernel.py +136 -0
  133. sglang/srt/layers/attention/nsa/utils.py +0 -1
  134. sglang/srt/layers/attention/nsa_backend.py +404 -90
  135. sglang/srt/layers/attention/triton_backend.py +208 -34
  136. sglang/srt/layers/attention/triton_ops/double_sparsity_attention.py +2 -2
  137. sglang/srt/layers/attention/triton_ops/extend_attention.py +539 -44
  138. sglang/srt/layers/attention/trtllm_mha_backend.py +2 -2
  139. sglang/srt/layers/attention/trtllm_mla_backend.py +362 -43
  140. sglang/srt/layers/attention/utils.py +89 -7
  141. sglang/srt/layers/attention/vision.py +3 -3
  142. sglang/srt/layers/attention/xpu_backend.py +1028 -0
  143. sglang/srt/layers/communicator.py +12 -7
  144. sglang/srt/layers/{quantization/deep_gemm_wrapper → deep_gemm_wrapper}/compile_utils.py +5 -9
  145. sglang/srt/layers/{quantization/deep_gemm_wrapper → deep_gemm_wrapper}/configurer.py +4 -3
  146. sglang/srt/layers/{quantization/deep_gemm_wrapper → deep_gemm_wrapper}/entrypoint.py +3 -3
  147. sglang/srt/layers/dp_attention.py +17 -0
  148. sglang/srt/layers/layernorm.py +64 -19
  149. sglang/srt/layers/linear.py +9 -1
  150. sglang/srt/layers/logits_processor.py +152 -17
  151. sglang/srt/layers/modelopt_utils.py +11 -0
  152. sglang/srt/layers/moe/cutlass_moe.py +0 -2
  153. sglang/srt/layers/moe/cutlass_w4a8_moe.py +351 -21
  154. sglang/srt/layers/moe/ep_moe/kernels.py +229 -457
  155. sglang/srt/layers/moe/ep_moe/layer.py +154 -625
  156. sglang/srt/layers/moe/flashinfer_cutedsl_moe.py +1 -1
  157. sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=128,N=192,device_name=NVIDIA_H200,dtype=fp8_w8a8.json +146 -0
  158. sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=256,N=256,device_name=NVIDIA_B200.json +146 -0
  159. sglang/srt/layers/moe/fused_moe_triton/fused_moe_triton_config.py +11 -3
  160. sglang/srt/layers/moe/fused_moe_triton/layer.py +79 -73
  161. sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py +25 -46
  162. sglang/srt/layers/moe/moe_runner/deep_gemm.py +569 -0
  163. sglang/srt/layers/moe/moe_runner/runner.py +6 -0
  164. sglang/srt/layers/moe/moe_runner/triton.py +3 -1
  165. sglang/srt/layers/moe/moe_runner/triton_kernels.py +194 -0
  166. sglang/srt/layers/moe/rocm_moe_utils.py +0 -1
  167. sglang/srt/layers/moe/router.py +51 -15
  168. sglang/srt/layers/moe/token_dispatcher/__init__.py +14 -4
  169. sglang/srt/layers/moe/token_dispatcher/base.py +12 -6
  170. sglang/srt/layers/moe/token_dispatcher/deepep.py +127 -110
  171. sglang/srt/layers/moe/token_dispatcher/mooncake.py +386 -0
  172. sglang/srt/layers/moe/token_dispatcher/standard.py +46 -0
  173. sglang/srt/layers/moe/topk.py +7 -6
  174. sglang/srt/layers/moe/utils.py +20 -5
  175. sglang/srt/layers/quantization/__init__.py +5 -58
  176. sglang/srt/layers/quantization/awq.py +183 -9
  177. sglang/srt/layers/quantization/awq_triton.py +29 -0
  178. sglang/srt/layers/quantization/base_config.py +27 -1
  179. sglang/srt/layers/quantization/compressed_tensors/__init__.py +7 -0
  180. sglang/srt/layers/quantization/compressed_tensors/compressed_tensors.py +20 -49
  181. sglang/srt/layers/quantization/compressed_tensors/compressed_tensors_moe.py +421 -70
  182. sglang/srt/layers/quantization/compressed_tensors/schemes/__init__.py +3 -0
  183. sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a16_fp8.py +4 -22
  184. sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_wNa16.py +339 -0
  185. sglang/srt/layers/quantization/fp8.py +152 -81
  186. sglang/srt/layers/quantization/fp8_kernel.py +55 -10
  187. sglang/srt/layers/quantization/fp8_utils.py +42 -14
  188. sglang/srt/layers/quantization/fpgemm_fp8.py +2 -3
  189. sglang/srt/layers/quantization/gguf.py +566 -0
  190. sglang/srt/layers/quantization/gptq.py +0 -1
  191. sglang/srt/layers/quantization/int8_kernel.py +18 -2
  192. sglang/srt/layers/quantization/marlin_utils.py +12 -0
  193. sglang/srt/layers/quantization/modelopt_quant.py +125 -100
  194. sglang/srt/layers/quantization/mxfp4.py +35 -68
  195. sglang/srt/layers/quantization/petit.py +1 -1
  196. sglang/srt/layers/quantization/quark/quark.py +3 -1
  197. sglang/srt/layers/quantization/quark/quark_moe.py +3 -3
  198. sglang/srt/layers/quantization/quark/schemes/quark_w4a4_mxfp4.py +0 -7
  199. sglang/srt/layers/quantization/unquant.py +23 -48
  200. sglang/srt/layers/quantization/utils.py +0 -1
  201. sglang/srt/layers/quantization/w4afp8.py +87 -20
  202. sglang/srt/layers/quantization/w8a8_int8.py +30 -24
  203. sglang/srt/layers/radix_attention.py +62 -9
  204. sglang/srt/layers/rotary_embedding.py +686 -17
  205. sglang/srt/layers/sampler.py +47 -16
  206. sglang/srt/layers/sparse_pooler.py +98 -0
  207. sglang/srt/layers/utils.py +0 -1
  208. sglang/srt/layers/vocab_parallel_embedding.py +4 -1
  209. sglang/srt/lora/backend/triton_backend.py +0 -1
  210. sglang/srt/lora/eviction_policy.py +139 -0
  211. sglang/srt/lora/lora_manager.py +24 -9
  212. sglang/srt/lora/lora_registry.py +1 -1
  213. sglang/srt/lora/mem_pool.py +40 -16
  214. sglang/srt/lora/triton_ops/chunked_sgmv_expand.py +1 -1
  215. sglang/srt/lora/triton_ops/chunked_sgmv_shrink.py +4 -2
  216. sglang/srt/managers/cache_controller.py +48 -17
  217. sglang/srt/managers/data_parallel_controller.py +146 -42
  218. sglang/srt/managers/detokenizer_manager.py +40 -13
  219. sglang/srt/managers/io_struct.py +69 -16
  220. sglang/srt/managers/mm_utils.py +20 -18
  221. sglang/srt/managers/multi_tokenizer_mixin.py +83 -82
  222. sglang/srt/managers/overlap_utils.py +96 -19
  223. sglang/srt/managers/schedule_batch.py +241 -511
  224. sglang/srt/managers/schedule_policy.py +15 -2
  225. sglang/srt/managers/scheduler.py +420 -514
  226. sglang/srt/managers/scheduler_metrics_mixin.py +73 -18
  227. sglang/srt/managers/scheduler_output_processor_mixin.py +317 -111
  228. sglang/srt/managers/scheduler_pp_mixin.py +341 -0
  229. sglang/srt/managers/scheduler_profiler_mixin.py +60 -14
  230. sglang/srt/managers/scheduler_runtime_checker_mixin.py +217 -0
  231. sglang/srt/managers/scheduler_update_weights_mixin.py +33 -14
  232. sglang/srt/managers/tokenizer_communicator_mixin.py +71 -55
  233. sglang/srt/managers/tokenizer_manager.py +375 -95
  234. sglang/srt/managers/tp_worker.py +212 -161
  235. sglang/srt/managers/utils.py +78 -2
  236. sglang/srt/mem_cache/allocator.py +7 -2
  237. sglang/srt/mem_cache/allocator_ascend.py +2 -2
  238. sglang/srt/mem_cache/base_prefix_cache.py +2 -2
  239. sglang/srt/mem_cache/chunk_cache.py +13 -2
  240. sglang/srt/mem_cache/common.py +480 -0
  241. sglang/srt/mem_cache/evict_policy.py +16 -1
  242. sglang/srt/mem_cache/hicache_storage.py +11 -2
  243. sglang/srt/mem_cache/hiradix_cache.py +16 -3
  244. sglang/srt/mem_cache/mamba_radix_cache.py +993 -0
  245. sglang/srt/mem_cache/memory_pool.py +517 -219
  246. sglang/srt/mem_cache/memory_pool_host.py +0 -1
  247. sglang/srt/mem_cache/multimodal_cache.py +0 -1
  248. sglang/srt/mem_cache/radix_cache.py +53 -19
  249. sglang/srt/mem_cache/radix_cache_cpp.py +19 -14
  250. sglang/srt/mem_cache/storage/aibrix_kvcache/aibrix_kvcache_storage.py +8 -2
  251. sglang/srt/mem_cache/storage/aibrix_kvcache/unit_test.py +1 -13
  252. sglang/srt/mem_cache/storage/backend_factory.py +2 -2
  253. sglang/srt/mem_cache/storage/eic/eic_storage.py +5 -6
  254. sglang/srt/mem_cache/storage/hf3fs/hf3fs_client.py +0 -1
  255. sglang/srt/mem_cache/storage/hf3fs/mini_3fs_metadata_server.py +3 -2
  256. sglang/srt/mem_cache/storage/hf3fs/storage_hf3fs.py +9 -3
  257. sglang/srt/mem_cache/storage/lmcache/lmc_radix_cache.py +5 -3
  258. sglang/srt/mem_cache/storage/mooncake_store/mooncake_store.py +101 -17
  259. sglang/srt/mem_cache/storage/nixl/hicache_nixl.py +38 -9
  260. sglang/srt/mem_cache/storage/nixl/nixl_utils.py +1 -1
  261. sglang/srt/mem_cache/storage/nixl/test_hicache_nixl_storage.py +17 -2
  262. sglang/srt/mem_cache/swa_radix_cache.py +92 -26
  263. sglang/srt/metrics/collector.py +31 -0
  264. sglang/srt/metrics/func_timer.py +1 -1
  265. sglang/srt/model_executor/cuda_graph_runner.py +43 -5
  266. sglang/srt/model_executor/forward_batch_info.py +71 -25
  267. sglang/srt/model_executor/model_runner.py +362 -270
  268. sglang/srt/model_executor/npu_graph_runner.py +2 -3
  269. sglang/srt/model_executor/piecewise_cuda_graph_runner.py +549 -0
  270. sglang/srt/model_loader/__init__.py +1 -1
  271. sglang/srt/model_loader/loader.py +424 -27
  272. sglang/srt/model_loader/utils.py +0 -1
  273. sglang/srt/model_loader/weight_utils.py +47 -28
  274. sglang/srt/models/apertus.py +2 -3
  275. sglang/srt/models/arcee.py +2 -2
  276. sglang/srt/models/bailing_moe.py +13 -52
  277. sglang/srt/models/bailing_moe_nextn.py +3 -4
  278. sglang/srt/models/bert.py +1 -1
  279. sglang/srt/models/deepseek_nextn.py +19 -3
  280. sglang/srt/models/deepseek_ocr.py +1516 -0
  281. sglang/srt/models/deepseek_v2.py +418 -140
  282. sglang/srt/models/dots_ocr.py +0 -2
  283. sglang/srt/models/dots_vlm.py +0 -1
  284. sglang/srt/models/dots_vlm_vit.py +1 -1
  285. sglang/srt/models/falcon_h1.py +13 -19
  286. sglang/srt/models/gemma3_mm.py +16 -0
  287. sglang/srt/models/gemma3n_mm.py +1 -2
  288. sglang/srt/models/glm4_moe.py +327 -382
  289. sglang/srt/models/glm4_moe_nextn.py +6 -16
  290. sglang/srt/models/glm4v.py +2 -1
  291. sglang/srt/models/glm4v_moe.py +32 -199
  292. sglang/srt/models/gpt_oss.py +5 -5
  293. sglang/srt/models/grok.py +10 -23
  294. sglang/srt/models/hunyuan.py +2 -7
  295. sglang/srt/models/interns1.py +0 -1
  296. sglang/srt/models/kimi_vl.py +1 -7
  297. sglang/srt/models/kimi_vl_moonvit.py +3 -1
  298. sglang/srt/models/llama.py +2 -2
  299. sglang/srt/models/llama_eagle3.py +1 -1
  300. sglang/srt/models/longcat_flash.py +5 -22
  301. sglang/srt/models/longcat_flash_nextn.py +3 -14
  302. sglang/srt/models/mimo.py +2 -13
  303. sglang/srt/models/mimo_mtp.py +1 -2
  304. sglang/srt/models/minicpmo.py +7 -5
  305. sglang/srt/models/minimax_m2.py +922 -0
  306. sglang/srt/models/mixtral.py +1 -4
  307. sglang/srt/models/mllama.py +1 -1
  308. sglang/srt/models/mllama4.py +13 -3
  309. sglang/srt/models/nemotron_h.py +511 -0
  310. sglang/srt/models/nvila.py +355 -0
  311. sglang/srt/models/nvila_lite.py +184 -0
  312. sglang/srt/models/olmo2.py +31 -4
  313. sglang/srt/models/opt.py +5 -5
  314. sglang/srt/models/phi.py +1 -1
  315. sglang/srt/models/phi4mm.py +1 -1
  316. sglang/srt/models/phimoe.py +0 -1
  317. sglang/srt/models/pixtral.py +0 -3
  318. sglang/srt/models/points_v15_chat.py +186 -0
  319. sglang/srt/models/qwen.py +0 -1
  320. sglang/srt/models/qwen2.py +22 -1
  321. sglang/srt/models/qwen2_5_vl.py +3 -3
  322. sglang/srt/models/qwen2_audio.py +2 -15
  323. sglang/srt/models/qwen2_moe.py +15 -12
  324. sglang/srt/models/qwen2_vl.py +5 -2
  325. sglang/srt/models/qwen3.py +34 -4
  326. sglang/srt/models/qwen3_moe.py +19 -37
  327. sglang/srt/models/qwen3_next.py +7 -12
  328. sglang/srt/models/qwen3_next_mtp.py +3 -4
  329. sglang/srt/models/qwen3_omni_moe.py +661 -0
  330. sglang/srt/models/qwen3_vl.py +37 -33
  331. sglang/srt/models/qwen3_vl_moe.py +57 -185
  332. sglang/srt/models/roberta.py +55 -3
  333. sglang/srt/models/sarashina2_vision.py +0 -1
  334. sglang/srt/models/step3_vl.py +3 -5
  335. sglang/srt/models/utils.py +11 -1
  336. sglang/srt/multimodal/processors/base_processor.py +7 -2
  337. sglang/srt/multimodal/processors/deepseek_ocr.py +37 -0
  338. sglang/srt/multimodal/processors/deepseek_vl_v2.py +0 -3
  339. sglang/srt/multimodal/processors/dots_vlm.py +0 -1
  340. sglang/srt/multimodal/processors/glm4v.py +2 -6
  341. sglang/srt/multimodal/processors/internvl.py +0 -2
  342. sglang/srt/multimodal/processors/janus_pro.py +0 -1
  343. sglang/srt/multimodal/processors/mllama4.py +0 -8
  344. sglang/srt/multimodal/processors/{vila.py → nvila.py} +32 -24
  345. sglang/srt/multimodal/processors/phi4mm.py +0 -1
  346. sglang/srt/multimodal/processors/points_v15_chat.py +52 -0
  347. sglang/srt/multimodal/processors/qwen_vl.py +75 -16
  348. sglang/srt/multimodal/processors/step3_vl.py +1 -1
  349. sglang/srt/parser/conversation.py +41 -0
  350. sglang/srt/parser/reasoning_parser.py +28 -2
  351. sglang/srt/sampling/custom_logit_processor.py +77 -2
  352. sglang/srt/sampling/sampling_batch_info.py +17 -22
  353. sglang/srt/sampling/sampling_params.py +70 -2
  354. sglang/srt/server_args.py +846 -163
  355. sglang/srt/server_args_config_parser.py +1 -1
  356. sglang/srt/single_batch_overlap.py +36 -31
  357. sglang/srt/speculative/base_spec_worker.py +34 -0
  358. sglang/srt/speculative/draft_utils.py +226 -0
  359. sglang/srt/speculative/eagle_draft_cuda_graph_runner.py +24 -7
  360. sglang/srt/speculative/eagle_draft_extend_cuda_graph_runner.py +23 -2
  361. sglang/srt/speculative/eagle_info.py +57 -18
  362. sglang/srt/speculative/eagle_info_v2.py +458 -0
  363. sglang/srt/speculative/eagle_utils.py +138 -0
  364. sglang/srt/speculative/eagle_worker.py +83 -280
  365. sglang/srt/speculative/eagle_worker_v2.py +702 -0
  366. sglang/srt/speculative/{ngram_utils.py → ngram_info.py} +14 -9
  367. sglang/srt/speculative/ngram_worker.py +12 -11
  368. sglang/srt/speculative/spec_info.py +2 -0
  369. sglang/srt/speculative/spec_utils.py +38 -3
  370. sglang/srt/speculative/standalone_worker.py +4 -14
  371. sglang/srt/tokenizer/tiktoken_tokenizer.py +2 -2
  372. sglang/srt/two_batch_overlap.py +28 -14
  373. sglang/srt/utils/__init__.py +1 -1
  374. sglang/srt/{bench_utils.py → utils/bench_utils.py} +4 -2
  375. sglang/srt/utils/common.py +272 -82
  376. sglang/srt/utils/hf_transformers_utils.py +44 -17
  377. sglang/srt/{host_shared_memory.py → utils/host_shared_memory.py} +0 -1
  378. sglang/srt/{offloader.py → utils/offloader.py} +4 -4
  379. sglang/srt/utils/profile_merger.py +199 -0
  380. sglang/test/attention/test_flashattn_backend.py +1 -1
  381. sglang/test/attention/test_flashattn_mla_backend.py +0 -1
  382. sglang/test/attention/test_prefix_chunk_info.py +0 -2
  383. sglang/test/attention/test_trtllm_mla_backend.py +221 -53
  384. sglang/test/few_shot_gsm8k_engine.py +2 -4
  385. sglang/test/kit_matched_stop.py +157 -0
  386. sglang/test/longbench_v2/__init__.py +1 -0
  387. sglang/test/longbench_v2/test_longbench_v2_eval.py +238 -0
  388. sglang/test/longbench_v2/validate_longbench_v2.py +337 -0
  389. sglang/test/longbench_v2/validate_longbench_v2_standalone.py +306 -0
  390. sglang/test/run_eval.py +41 -0
  391. sglang/test/runners.py +2 -0
  392. sglang/test/send_one.py +42 -7
  393. sglang/test/simple_eval_common.py +3 -0
  394. sglang/test/simple_eval_gpqa.py +0 -1
  395. sglang/test/simple_eval_humaneval.py +0 -3
  396. sglang/test/simple_eval_longbench_v2.py +344 -0
  397. sglang/test/test_block_fp8.py +1 -2
  398. sglang/test/test_block_fp8_deep_gemm_blackwell.py +0 -1
  399. sglang/test/test_cutlass_moe.py +1 -2
  400. sglang/test/test_cutlass_w4a8_moe.py +10 -20
  401. sglang/test/test_deterministic.py +463 -107
  402. sglang/test/test_deterministic_utils.py +74 -0
  403. sglang/test/test_disaggregation_utils.py +81 -0
  404. sglang/test/test_marlin_moe.py +0 -1
  405. sglang/test/test_utils.py +85 -20
  406. sglang/version.py +1 -1
  407. {sglang-0.5.3rc2.dist-info → sglang-0.5.4.post1.dist-info}/METADATA +48 -35
  408. {sglang-0.5.3rc2.dist-info → sglang-0.5.4.post1.dist-info}/RECORD +414 -350
  409. sglang/srt/layers/attention/mamba/mamba_utils.py +0 -81
  410. sglang/srt/managers/tp_worker_overlap_thread.py +0 -311
  411. sglang/srt/models/vila.py +0 -306
  412. sglang/srt/speculative/build_eagle_tree.py +0 -427
  413. sglang/test/test_block_fp8_ep.py +0 -358
  414. /sglang/srt/layers/{quantization/deep_gemm_wrapper → deep_gemm_wrapper}/__init__.py +0 -0
  415. /sglang/srt/{aio_rwlock.py → utils/aio_rwlock.py} +0 -0
  416. /sglang/srt/{torch_memory_saver_adapter.py → utils/torch_memory_saver_adapter.py} +0 -0
  417. {sglang-0.5.3rc2.dist-info → sglang-0.5.4.post1.dist-info}/WHEEL +0 -0
  418. {sglang-0.5.3rc2.dist-info → sglang-0.5.4.post1.dist-info}/licenses/LICENSE +0 -0
  419. {sglang-0.5.3rc2.dist-info → sglang-0.5.4.post1.dist-info}/top_level.txt +0 -0
@@ -1,23 +1,23 @@
1
1
  sglang/__init__.py,sha256=CK60u1J439CJZaPihWqlDjFZ8doIC-5YgIYz-E1PIh4,1823
2
2
  sglang/bench_offline_throughput.py,sha256=Bge0KG4Uiv9CHsxDnqKdXJmG_TcxM4blz3CmvLmDRvM,14815
3
- sglang/bench_one_batch.py,sha256=TFYI_wQGFpeJMV5r4C_EABmwZD3EDNuT1ORQX3jUWlY,23109
4
- sglang/bench_one_batch_server.py,sha256=nD7GMOQE1I57BC1E7dTmqx-PMeSUPq8RF8W39s5z86I,26128
5
- sglang/bench_serving.py,sha256=0l-QrhHtIMUVyewiuvxoRx6_MIulMpadkKtbzpQMxyQ,87841
6
- sglang/check_env.py,sha256=qDMIG2rCNBH1yKnxQmF-Bp10oiFMUKMgfZLHZYOmdSY,8412
7
- sglang/compile_deep_gemm.py,sha256=EsgboGA-MK3Rvx9TlUJPLxJ5LBira4bTcHJLKEp1H6k,6488
8
- sglang/global_config.py,sha256=qnMsK6AKzl8dhEbg-Jlbp_OVY9JUV0X9BqQiOl8VkiE,1737
9
- sglang/launch_server.py,sha256=zBCKcUg4d7_-Zpp0NE9C7z8CIFYw94UH0wo7ZIilHMM,1063
10
- sglang/profiler.py,sha256=zjD9-TxnDv3yU1Qmv4vItH5Nuhiu230ssqOA43EyH2g,4420
3
+ sglang/bench_one_batch.py,sha256=cjECJgTmPcnP-b8Fcy7ldFU6FaEqBpz7Z45RTwBwNR8,23763
4
+ sglang/bench_one_batch_server.py,sha256=8zAjLFu0tgfIhhtEaPGdDhi15YCcHcaK19vz6Rmn_Jw,26565
5
+ sglang/bench_serving.py,sha256=tcgQ3SjTEG1CYvawDbhJdQeX3JR10yiINPxcSN47Jio,95619
6
+ sglang/check_env.py,sha256=6wRlWL7UwY1JjYRG307bLLJRoirPk2RVLYrDWV8Et0c,8413
7
+ sglang/compile_deep_gemm.py,sha256=v7WJZLSrJw3Vc_28lTReRDJ1WdiPKLRHizFi2l2chv8,6614
8
+ sglang/global_config.py,sha256=bVpUL_gMSA0FwJl8y8tP5CIa7d083o6Dcak-yRytzGw,767
9
+ sglang/launch_server.py,sha256=SDfZfS1i0RtakLx1zX9uclHpefKHOiXd7MQI0ktYjx4,686
10
+ sglang/profiler.py,sha256=uprc8Lo-WeqrQY9u2Wj503swEp4P_2laLJ6cWGALgME,4854
11
11
  sglang/utils.py,sha256=YreOyt4-fWdDcg01abaMJ0y0ly4gYps26vRlmWhwGC8,17267
12
- sglang/version.py,sha256=PgjGjGwMjSvY5WJg-jqo1zKEBRurR4G1DY2OwoitREE,25
12
+ sglang/version.py,sha256=TvZB2PPVmaQCmVVHStxmVi90Tm1q4CKl6ezbtlp8gnY,28
13
13
  sglang/eval/llama3_eval.py,sha256=mLNRZJIqV4CfqrY8UGnJEcHw2Xsyr1eyYZgFSUFYr1g,9997
14
14
  sglang/eval/loogle_eval.py,sha256=-CC2s2kh5qUoDrHRkQVkC_jNvBgNojXbf456ny5s78s,4557
15
- sglang/lang/api.py,sha256=rcp3GeoyZhmJ0GDLPRkuZNcxd0TBJy_wfUDpcmQoqW8,7210
15
+ sglang/lang/api.py,sha256=kyfJuErqMyle6hnx3Q_oqNSFDe0q4gFob1yd5ZLTatw,7438
16
16
  sglang/lang/chat_template.py,sha256=4_JVa7NDpHP2it6rAQS5UnCSxSMy0rtfdOgSvH_Kbdc,22549
17
17
  sglang/lang/choices.py,sha256=-W1DVw9N9ZliVpvmWrzIXG4cswAah8eMQrHWzkS3D8o,6234
18
18
  sglang/lang/compiler.py,sha256=MAuzoOOpb98njJ7Io2SDmFkhTroDYiq0te0ZpfHkMY4,7597
19
- sglang/lang/interpreter.py,sha256=F-wxyKDUnTygmJpSEYsrQermls2RyWJntOep9_P7V1I,34818
20
- sglang/lang/ir.py,sha256=FnRJ-lndAsR4GR0ONJRPDtlYx8FvL9RIk44vSA16RBk,19656
19
+ sglang/lang/interpreter.py,sha256=wy6dWNzk57Mp7U15I3VeCT_UFBSnLmff2vXRdDbh1hE,34844
20
+ sglang/lang/ir.py,sha256=wcV1dMwn-L6gK-ERu-Gg_2dqCkAuWkFNIGh0kRhFa7M,20184
21
21
  sglang/lang/tracer.py,sha256=ljBo9VZ0zVaGwzNk32qw21acyo60N0UjIjqBbT5a1WI,8175
22
22
  sglang/lang/backend/anthropic.py,sha256=qXWqqFlk0-nC62QCcYIRjLTc4AHrdTKpl7hCeDzROUs,2019
23
23
  sglang/lang/backend/base_backend.py,sha256=tEutGCU5tni1xGlrIjAVvA9aflJBt2duKrIDzqabJWc,1975
@@ -25,270 +25,302 @@ sglang/lang/backend/litellm.py,sha256=ugmL7sfUxkUHVbHtwNzHgdQAEd4UCjNQboFuE3KThc
25
25
  sglang/lang/backend/openai.py,sha256=YFs7pCDK6_DoYmjTa-vgDVdaeE4PYr7E-sIC1q7vAns,16422
26
26
  sglang/lang/backend/runtime_endpoint.py,sha256=UZRKqQ8eE_N11oiv9rViF3THNq21A_uio0N0Bt9MaY8,17487
27
27
  sglang/lang/backend/vertexai.py,sha256=gz0uNYyBb88jbPYz6ZIJ774fefrcbuVdoK33bphUZpI,4827
28
- sglang/srt/_custom_ops.py,sha256=9GPNUyqnybgvUnzdQ8n5_NgluHmQNw0Gptos0iLPfrY,5342
29
- sglang/srt/aio_rwlock.py,sha256=6LYtOdeTUY3hkfa1dmYkgsaF2ttrwIF3hUWz2AZ2fqw,2970
30
- sglang/srt/bench_utils.py,sha256=zNTsTBUta27XxojgvR5p5X9M0v1MFzZ7dcX9TMq4NvQ,4348
28
+ sglang/srt/_custom_ops.py,sha256=P4MLtuF8DzK66R_Sw88AYsiCOn7YNGZ93H7isJq0dUA,5356
31
29
  sglang/srt/constants.py,sha256=0i-tEwG2BSYNDy96MxnGHV5HnBELkYcnsVGsE-R18o0,93
32
30
  sglang/srt/custom_op.py,sha256=m5F7x3LHlnOuesmcNmJtIWsfHGFLBJ807vKc05Gu1D0,3312
33
- sglang/srt/environ.py,sha256=QaYZPUkvV-KyRWzJ6nz-kNO75Khn_pNbx2yX_YBL7-A,8894
34
- sglang/srt/host_shared_memory.py,sha256=00TgVm3PNCl4rTPJZChG5uu4I5hd_Xf587r39tibmIg,2274
35
- sglang/srt/offloader.py,sha256=cYON5jZErAp88Sh5JseaRw0B2Ho2MQz9smgvrTc-2KA,18765
31
+ sglang/srt/environ.py,sha256=wlvu5PP68cZLbH4DquMeZLkb3aVgJkc3aMzquHeyNbg,10892
36
32
  sglang/srt/operations.py,sha256=za_h1_kcR1Te6-i_r0i_zAeumbmIRhLK2pS31sukkrw,6089
37
33
  sglang/srt/operations_strategy.py,sha256=-w6GI2VgSGvORy3pUWRAJo6244ykSW1ZBV1Dx0fZlHA,7138
38
- sglang/srt/server_args.py,sha256=pjtjMs62nnyMIRQMaL161QKDE2DViatyZNrfbYSkYuM,137969
39
- sglang/srt/server_args_config_parser.py,sha256=niM5LYNaVxQg4FKHUJ3YmMZ-ekB3bDlvTwD7KqdLZoE,5220
40
- sglang/srt/single_batch_overlap.py,sha256=m70hHl1ufIvc_9Nl2bYqnIcfoMIJkPyGjWIqJLBsKhI,4844
41
- sglang/srt/torch_memory_saver_adapter.py,sha256=WFwPsOBvnWu6N2yTHmiOjLbDAYosslHwNSfyFHjz-7w,2511
42
- sglang/srt/two_batch_overlap.py,sha256=0cHUV2ZeyCaojDRpqNcRSUIQM3_Y4H4HfssML2gt_6k,34240
34
+ sglang/srt/server_args.py,sha256=igDvB6U6cnibpTgolFV927EwB90ALkqflmsHFslk714,168328
35
+ sglang/srt/server_args_config_parser.py,sha256=NW_tnD_ixnIpEhIuhn1W67pnAOJSGWKKN-jHcssKD-Q,5213
36
+ sglang/srt/single_batch_overlap.py,sha256=73RM4rQDjw1RQxW4GCWthRLQyoP2oPRA2oN7804dI_E,5236
37
+ sglang/srt/two_batch_overlap.py,sha256=xDDMyE1hKQPq-yu_GkVnNXskyc1CVoPYPaB6AvoPXKA,34667
43
38
  sglang/srt/warmup.py,sha256=fQYzNp-I9mZccs2BerI6mOZd1CDQjdiuFCeUkcwiOb4,1834
44
39
  sglang/srt/batch_invariant_ops/__init__.py,sha256=Z9TvOE4BL7cAaBIePEsVglH7RcWBSBIsSHs-XbveQNE,728
45
- sglang/srt/batch_invariant_ops/batch_invariant_ops.py,sha256=5vtvEFezea4tjGFuVMkadgZxynxAZZ8yxGwpkSm7Sl4,16246
46
- sglang/srt/configs/__init__.py,sha256=aMxLOh72NAL0iQl0aPcPP2Ih9oY5vhHUHAcymE0fv-4,1142
40
+ sglang/srt/batch_invariant_ops/batch_invariant_ops.py,sha256=aHC9BuEm_qY_9nQ87dzMCs1c8cTi_t9JGrq4kn6bEwk,19401
41
+ sglang/srt/checkpoint_engine/checkpoint_engine_worker.py,sha256=YlyiZ46LOi5aib0N5IyrPMuGbnVi_Xnnf9r2XdR1OtY,5509
42
+ sglang/srt/compilation/backend.py,sha256=avi40bJLD_XZd9a2r9Kcl3jOT-n7uiGVZTif76EFRWk,14424
43
+ sglang/srt/compilation/compilation_config.py,sha256=9GDBY3SAV5hIJ6hmYurJ3vfYh9-gtZP3nEzp0TrUdeM,617
44
+ sglang/srt/compilation/compilation_counter.py,sha256=qrCqMCaui2eOBpxi3ZBiuvmJ6dkWah_6dYjhvu6_MqE,1623
45
+ sglang/srt/compilation/compile.py,sha256=All4G5VjYBY9MOalW5YDo17eEtho-o_BG5V86lNJ-5c,6965
46
+ sglang/srt/compilation/compiler_interface.py,sha256=k6EDIpdtEB0NCOaDxsgXwaSXH4xTLQsflFdy-sTsyRQ,19508
47
+ sglang/srt/compilation/cuda_piecewise_backend.py,sha256=_MOgUhUGg9kBDIhSJWq-vUwZrluwScy4PbCzD-X9g7g,9237
48
+ sglang/srt/compilation/fix_functionalization.py,sha256=SDQ1Pbvh5PiUg3M82NAfyXPjz21wmBRQgzM_HHKRHss,5156
49
+ sglang/srt/compilation/fx_utils.py,sha256=vv32jqNIYcdvLiz0W4yGcUyh_ko6LJwrES8ZMU2vIis,2873
50
+ sglang/srt/compilation/inductor_pass.py,sha256=zebqIifs0wvLXIUy43ablX87qh4jnn9876ZHzw4c2IQ,4041
51
+ sglang/srt/compilation/pass_manager.py,sha256=n8TIJkWIxegDd5lX6Xja4l4YuBQLZvn2_9yEY8Esp80,2213
52
+ sglang/srt/compilation/piecewise_context_manager.py,sha256=P-WpB3Ny8sMEFUpkQv4ExSoqQPPyEwhXZraDWQjP8ak,1113
53
+ sglang/srt/compilation/weak_ref_tensor_jit.py,sha256=XJLJsj5t84QLhF0Bjx0j2Iow51d8zc6inASOd9watFA,390
54
+ sglang/srt/configs/__init__.py,sha256=a8_ODqcCzMN1q_fNHKMBNHM9aGH8LF92GLGcLeViLWY,1291
47
55
  sglang/srt/configs/chatglm.py,sha256=j-b0YkdYUmQm2y1kNmMJtKeACxWKmBbvNNkDWbs6kbI,2907
48
56
  sglang/srt/configs/dbrx.py,sha256=tdhIkXAQl1yr0MxqFmsDG1E0e2puRTTKm6UTyANBLac,11005
49
- sglang/srt/configs/deepseekvl2.py,sha256=sYMmoy5_LlDXht7MTi4QGYOaiE8iMGUO44bnuOu4i8I,23683
57
+ sglang/srt/configs/deepseek_ocr.py,sha256=3nZL7pWJ-WwN6ZYqRsPy7zbxgZCggW5igVfIvJhGUXY,8102
58
+ sglang/srt/configs/deepseekvl2.py,sha256=QTZnL47wIx0mkd_HCn_Kfzu4oCHEJaYZpvVSjmaDvp8,26518
50
59
  sglang/srt/configs/device_config.py,sha256=1Iaxrk65bJsCWV3E2cDfiap_T_xJIIj9oFVn9y6v0EI,515
51
60
  sglang/srt/configs/dots_ocr.py,sha256=HSKerqzHzrKIzoNZOUXA_KiBLmL-Rs8h4Vw17pjF1Uo,1863
52
- sglang/srt/configs/dots_vlm.py,sha256=PYoSrT-sRoykfNhdXFauqv21Sb54iavjYD3F09xww3U,5176
61
+ sglang/srt/configs/dots_vlm.py,sha256=Q2qaP65sYCKGmg_bvc4g5yb-pasdZNx4xnnlzu6Ed1U,4912
53
62
  sglang/srt/configs/exaone.py,sha256=Duxd4yQoKy8GWEzZD_kCY_OzmN_67CTJL_Kgn0eXk3g,10731
54
- sglang/srt/configs/falcon_h1.py,sha256=qn_n2uLRVN4EK4gn4UoHo_1NhV6kPFdOIb5TBJ0NAYs,16395
63
+ sglang/srt/configs/falcon_h1.py,sha256=LFxN0We8Gfgk-RWVeegzvyh-R4msAYF96ioO97Ta4ig,14939
55
64
  sglang/srt/configs/internvl.py,sha256=rIC-CBWJHy-Mjmk0_H3YcvVmZzeCRbXGo3dQMex-yeg,28141
56
65
  sglang/srt/configs/janus_pro.py,sha256=yI2c_aWBIKiTcK6RZxK6hq8CIxyYRH_NN8uaSNKsrKI,19156
57
66
  sglang/srt/configs/kimi_vl.py,sha256=4W7VQI3pr888ZsFA2SqCQo4mI0seXTOrGQ-x3oTvWew,1358
58
67
  sglang/srt/configs/kimi_vl_moonvit.py,sha256=hx2Rt4JSFbvy2HUTeLjBpge87m8M6ITAhqsgdNf_Jd4,1163
59
- sglang/srt/configs/load_config.py,sha256=_XhZdoP2Kbzih3FBZiiwGhXBf2-bNrn6f8eA63zqS7Y,3840
68
+ sglang/srt/configs/load_config.py,sha256=_x9n6Rkbi3VqYmXJ7PNdce32mvUNP1ewqrkUsJ7qprw,4765
60
69
  sglang/srt/configs/longcat_flash.py,sha256=Qp25xJVLq2K72Z80cXhcJxtqhagAdiPySDoevuT0Sno,3589
61
- sglang/srt/configs/model_config.py,sha256=fICFIXWjFrS7xtQYA-8TNJigD9blBfnEKmsbDsbMenE,35245
62
- sglang/srt/configs/qwen3_next.py,sha256=MVMDzdwlxrdar_6p6n9HjaXAei_giFfXlQNJAWpSLQ4,15794
63
- sglang/srt/configs/qwen3_vl.py,sha256=FMC-SVeM_sxLdjEAfJ_oNog1P5kXm70NMHNXmzSMo_U,29008
70
+ sglang/srt/configs/mamba_utils.py,sha256=AD96wj8FCxRsEovdtGn88xzcKAw5KErbO5xFSk0xwxc,3684
71
+ sglang/srt/configs/model_config.py,sha256=16APos-1uvf8oQsfU1yQz5HBSXI2WWQQU4pBCkeY3PE,39657
72
+ sglang/srt/configs/modelopt_config.py,sha256=pr4Q_J4G1Ff-wy24BYRzWaN0UI34rreGef7Nt6d0X3M,1070
73
+ sglang/srt/configs/nemotron_h.py,sha256=X39hWm2KQoAcZ4HXKDCfbua9aOTlcxcK89c52cmAq-k,13072
74
+ sglang/srt/configs/olmo3.py,sha256=DOyp1cNi_n8ckz9Ohs3zUZqkk6n26UBsNQ3zngHNNNY,3600
75
+ sglang/srt/configs/points_v15_chat.py,sha256=qand7WMc3L96wg-wzA9YqnzMz7ZUM6quAuThjO1rfM8,983
76
+ sglang/srt/configs/qwen3_next.py,sha256=XQje5KTnw2aA187DNkAFRUbIPFnTsKwl64FJCW1gcLA,14884
77
+ sglang/srt/configs/qwen3_omni.py,sha256=m6NxdP-iKVkKuYARukqjNhQ01D5gmNQOsfFKU5qZEqI,22384
78
+ sglang/srt/configs/qwen3_vl.py,sha256=0Coyj3ZYUJIgEfxt_6xx8wgd5Fy1tkMAeEhIaXXaZyk,28854
64
79
  sglang/srt/configs/step3_vl.py,sha256=_Otgnym57DVgB_kZ__8c1_Ys5gSalA_K0ZuVjcG51T0,4845
65
80
  sglang/srt/configs/update_config.py,sha256=GEf-XhL8JPrbX9-Hz8V7S3M6YTg76DVdIhc_4YdMDtc,6291
66
81
  sglang/srt/configs/utils.py,sha256=3nHUfisMs_Ltuhv8OZTNCJp63YJKJVF43h1QZB1zqx8,670
67
82
  sglang/srt/connector/__init__.py,sha256=zPuaRKulJsrDyT3OtN9wUT-4fqQBX-cJr2fZUB0_KPM,1562
68
83
  sglang/srt/connector/base_connector.py,sha256=LCKsTX_yWHclPrzNNB1fLwVCN8rIDKZaZhqHQ54B9MU,2774
69
84
  sglang/srt/connector/redis.py,sha256=K3fJSm2rZsd0R_KkICV3jIWKtrwxXE1tYktWnovLbz4,2514
70
- sglang/srt/connector/remote_instance.py,sha256=X_PIZFvZPsnUZ_54AgnzR0NdUfi6ClwQVlNexZatkXU,2710
85
+ sglang/srt/connector/remote_instance.py,sha256=LpPVftvXN0xRVPthwFm2fgnuvxSlYxwE_47NRGAmkmY,2704
71
86
  sglang/srt/connector/s3.py,sha256=hn5Ow9Y6ItS8RMJDwnTQe5QaiQ7HKMgiwggE9QnUewM,3743
72
87
  sglang/srt/connector/utils.py,sha256=isTvxauz1_8no5MW6p8Bwj2H9mQkweaRO_RSwAPA7R8,983
73
88
  sglang/srt/connector/serde/__init__.py,sha256=zuleyYN-jrDyiPiXjTbQKA27llb4H7HuDTZcBwrLk1U,707
74
89
  sglang/srt/connector/serde/safe_serde.py,sha256=XSjb9mRv1HqeG6Jiw633EOQYlrcI23Q21UluYqPZaWA,760
75
90
  sglang/srt/connector/serde/serde.py,sha256=n59I2MXLa7WCyN_8pEd8L-scJk7lMhmEX-GOUIhF0ZA,1004
76
- sglang/srt/constrained/base_grammar_backend.py,sha256=FKlBqllZ-bs65DYG5l-qsuuqfXOPeuUe5_NvPlpBzUs,8114
77
- sglang/srt/constrained/llguidance_backend.py,sha256=JkA_59nZ4zd8ciGvXsZ-OEsGCyQMoIxBO8QXIUqAUn4,6161
78
- sglang/srt/constrained/outlines_backend.py,sha256=t4gkO9AX8xfYulvhNx0n-p1kUavJnCjE9XjwN1Z4BV4,6883
91
+ sglang/srt/constrained/base_grammar_backend.py,sha256=LVEaY4JrF8zCbn1chwva0zJ9cW00dZ4yVTREmzJx9Zs,8307
92
+ sglang/srt/constrained/llguidance_backend.py,sha256=OxJoMbhi1InKzxMkGQrvetWU5GR9n8C1jc74fHBFQtc,6433
93
+ sglang/srt/constrained/outlines_backend.py,sha256=1pQNeROdrFBiXIIkIYKB0xufIfp6KDxm8G7C_xMooH8,6889
79
94
  sglang/srt/constrained/outlines_jump_forward.py,sha256=dm3PVswx2oE_JfAv-tPd7irMI95VCq4cZT-AF-Ohx3s,6823
80
- sglang/srt/constrained/reasoner_grammar_backend.py,sha256=YFxWuOTTo4e6cGhxnaBwuwli6f8FTUJtszib8dBq_8I,3207
81
- sglang/srt/constrained/xgrammar_backend.py,sha256=Dhn0sROXQtybY-sJfMcleIu_Rmn0sjleGMywCD3Simk,9338
95
+ sglang/srt/constrained/reasoner_grammar_backend.py,sha256=O36HzXEB-YKgo0recrLtW36EiTZIBbpnbHBPeGkWEyI,3334
96
+ sglang/srt/constrained/utils.py,sha256=ZDXuyKjGYHfPo3ZhcgxZe7pk_Qb4_ilBV2WjbDRXKDc,418
97
+ sglang/srt/constrained/xgrammar_backend.py,sha256=x7iwMMojTI3pcMmnyUPI1k4bCRoe1IIw76_IIJTAXBs,9855
82
98
  sglang/srt/constrained/triton_ops/bitmask_ops.py,sha256=WjTen9iuuFWLzkE1mAHQZB9_7aIy5QH8Wjf-lB-Fams,4614
83
99
  sglang/srt/debug_utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
84
100
  sglang/srt/debug_utils/dump_comparator.py,sha256=3rWdv4BQXTDtB3z5ao9VPN5lK31ImKf2zMWX7f0Xe6s,5394
85
101
  sglang/srt/debug_utils/dump_loader.py,sha256=RzWpl7RsDRw98DJMEvf6U9c9fPiobyeWI8opmRaRGGA,2632
86
102
  sglang/srt/debug_utils/dumper.py,sha256=6frfI4WErneQE4RpXgAR5gZJQRdzcQjyO3McW56jgYo,3517
87
103
  sglang/srt/debug_utils/text_comparator.py,sha256=NLJdjUikW--bWnGQWIeFJesyuvZ2Vni2S53fIED-m8s,7370
88
- sglang/srt/disaggregation/decode.py,sha256=_k9uVKzFUxEJIpBQSjoBVaY-GMoc0zTW6FuVhiH05os,36936
89
- sglang/srt/disaggregation/decode_kvcache_offload_manager.py,sha256=BWjhO0CDdpU8VIC_-hL9R8CjqUk5cQ1ivfXLjPSS9jU,7029
104
+ sglang/srt/disaggregation/decode.py,sha256=EJNSz7J2hmO5VuqXu14O6k57w7WizFRK5n1uE8iSzdY,40441
105
+ sglang/srt/disaggregation/decode_kvcache_offload_manager.py,sha256=jD_O-uRaZ5cD8C9qtto6m5ZXyM86loJzkdLgwheMBao,7045
90
106
  sglang/srt/disaggregation/decode_schedule_batch_mixin.py,sha256=BeGxXbFLW_ZbuyOs0idWzlicCh6NA1pTOXgON5SAdaE,6947
91
107
  sglang/srt/disaggregation/kv_events.py,sha256=yFbtwOeblcCmOXTjg00TopxnyjkmCBQIVz46KB8jetY,13555
92
108
  sglang/srt/disaggregation/mini_lb.py,sha256=JY2uCeUM3Zk3FdGWmCQBY3LeiJ5FM1PlrqAW8wJTTHI,395
93
- sglang/srt/disaggregation/prefill.py,sha256=eOEdepYknYHO6vz-MCV-jmuTOe_qq9X_ZD_AX1SwICU,37138
109
+ sglang/srt/disaggregation/prefill.py,sha256=crU3CZ5oITm3W9dSxIsvbPIwzOM9dPDOhPTELZcYepA,28325
94
110
  sglang/srt/disaggregation/utils.py,sha256=oBMqYOMAnyK4T69fFaDIuM1AAGa2vOvoA-CBtGocOkk,12263
95
111
  sglang/srt/disaggregation/ascend/__init__.py,sha256=-lxnica6fZYmYNpKwmE8yESUpQ5Sxf2DiZoBHzboKc8,146
96
112
  sglang/srt/disaggregation/ascend/conn.py,sha256=Z0xTJjSYXal7uGA5e7ci4oxOcWdC9qrV-gMd06ikp2w,4109
97
- sglang/srt/disaggregation/ascend/transfer_engine.py,sha256=JkalkQUFCwdCjJ_k8hxJqmgJ4CfxgiQzHzplP1S6xqE,3577
113
+ sglang/srt/disaggregation/ascend/transfer_engine.py,sha256=MK9G22_YUkvpaH4XVvKe1iz7F-bzhOdtYaVQ2jKiY2s,3567
98
114
  sglang/srt/disaggregation/base/__init__.py,sha256=4VwUv0aWxwmVL1049XK82aLTNxmt0WY5RPy9li-wyVk,160
99
- sglang/srt/disaggregation/base/conn.py,sha256=0CGEv-B24woyDBdEgQwT8Gqz10Uox3gCgWiCxznXkwQ,2912
115
+ sglang/srt/disaggregation/base/conn.py,sha256=SvNYNFIjC0adxt0vs3g80P-vdVCleBPE4VKs0-hUIz4,3271
100
116
  sglang/srt/disaggregation/common/__init__.py,sha256=7yl-EGLMVKRpBUaGF_7lwAsw2J_mqpRZV0238VGxD9o,126
101
- sglang/srt/disaggregation/common/conn.py,sha256=PiYuKGYVeVxoPaQcUK673IGelN9XnK7fyHSb6y6mptY,24415
117
+ sglang/srt/disaggregation/common/conn.py,sha256=mlZJnlsvdS2WxapGtMhV1YpE9M9zLm2NXPMNuI7PSFo,24443
102
118
  sglang/srt/disaggregation/common/utils.py,sha256=SxRhAWisNK8seGhb5BXBJ5u53DF7yeKVPMWPcB5ywbE,1194
103
119
  sglang/srt/disaggregation/fake/__init__.py,sha256=jJGWdXwaQiGIoR6atKqkQfkJmVyQ09l55VUN2WjwaeY,77
104
- sglang/srt/disaggregation/fake/conn.py,sha256=qsN5SEQLMenALxYC3x7GYZprhUQyRje5ldNwjkT6OPw,2283
120
+ sglang/srt/disaggregation/fake/conn.py,sha256=C5gYCsqf-CfffDhqzbp4FL1GQ3xFo_OvKkcC4W6R1OM,2502
105
121
  sglang/srt/disaggregation/mooncake/__init__.py,sha256=0TgqkAdQI1YynbHY6c0QISvVoOSk-0SwCIq5rjPSmgE,156
106
- sglang/srt/disaggregation/mooncake/conn.py,sha256=01TcfkekA3v7ApN11ATx_YsFi6B5U1xd3yPDxRx6F9Y,50697
122
+ sglang/srt/disaggregation/mooncake/conn.py,sha256=ruE4Rb0dPIhAmpQEKkePgnyRDG0xMbySgsrCb7wFIh8,56422
107
123
  sglang/srt/disaggregation/mooncake/transfer_engine.py,sha256=O-XRmQ3QwD6RuiyRgw4ZohSrFkuPdppV_eDBMUXn0jk,5884
108
124
  sglang/srt/disaggregation/nixl/__init__.py,sha256=qODVPIGWUXKXq4zsRIcMYoAoAeg6nBIN9vdQOlVMANE,136
109
- sglang/srt/disaggregation/nixl/conn.py,sha256=_si9ryeRoDHYmomthSyztUOEYl20aa18mS9_Sm961S4,32299
125
+ sglang/srt/disaggregation/nixl/conn.py,sha256=w_kDDEB4fIvDe-Z7ufxmw_cpDR57xXJVQrqWvYe88vo,33788
110
126
  sglang/srt/distributed/__init__.py,sha256=jFOcyt-wFAPMBUAf9zkZalNQlt-4rqmT6pCKBz1E4qo,149
111
127
  sglang/srt/distributed/communication_op.py,sha256=IBnFUdMftK_VSTMMMitGveonorFUUVNL4guqO31cMSc,1130
112
- sglang/srt/distributed/naive_distributed.py,sha256=5Kcfapzz61G3TtScTZrHoWa4bf6Vr27GlMcBAGMz7tQ,3260
113
- sglang/srt/distributed/parallel_state.py,sha256=m0T-Tfqi7DnCUPEGhA8Fr-dNlbeoowvG3Ds60IoDeos,68541
128
+ sglang/srt/distributed/naive_distributed.py,sha256=GX7CHhUb9rIQuaIPX4TYm01S7XQdBXvdqaJoPdxFyAI,3317
129
+ sglang/srt/distributed/parallel_state.py,sha256=2lenq6afSb6xGdvOw2dvpD8ssjm7XTbSF0BjJ_V-mbg,70571
114
130
  sglang/srt/distributed/utils.py,sha256=aaCxATncLGnVgB0WlGpBdee0behKW8Dy_dakqcuKSaQ,8497
115
- sglang/srt/distributed/device_communicators/all_reduce_utils.py,sha256=IxCuujkRVUGckr-PAhe2F_QfHGKhvQHo9ryB9-CQjpA,332
131
+ sglang/srt/distributed/device_communicators/all_reduce_utils.py,sha256=dk-uFaKZgVG-1dZDwMT6GvpFi2xP0DJRJ9BiRjHq0zw,336
116
132
  sglang/srt/distributed/device_communicators/cuda_wrapper.py,sha256=3jvPG-Ow5UBLiXhfx8T8snR7crSZbPpARAggsDPWq7k,7038
117
- sglang/srt/distributed/device_communicators/custom_all_reduce.py,sha256=Q1kkKPKFPV0QMmKLyjOBlOnX8-Pr4UeGBZYkG6j0gc0,16570
133
+ sglang/srt/distributed/device_communicators/custom_all_reduce.py,sha256=RCF9FzJYI9EzlNEDUZB-uL_0VKjTqNn0_MfZED-0RhA,16615
118
134
  sglang/srt/distributed/device_communicators/custom_all_reduce_utils.py,sha256=Fx9D70NO2dplyuqOxTasMwkzONN3wfC4WOny3tWSbPA,14159
119
135
  sglang/srt/distributed/device_communicators/hpu_communicator.py,sha256=gPjEH1-izoby5uDrfUlzNf21luPT0Ow7pJjhCRKnHy8,1728
120
136
  sglang/srt/distributed/device_communicators/npu_communicator.py,sha256=bRXN1Md_4SHQGzQYZa2GrHv2zbIU5vSpkueHiAZL1xQ,1345
121
- sglang/srt/distributed/device_communicators/pymscclpp.py,sha256=8Pgehd02v-BpHixTTB4OB9ZlxA7fyXiPF4Xp9F_heyU,10890
122
- sglang/srt/distributed/device_communicators/pynccl.py,sha256=7aE-pKMyJfawGo7Vzymb6Nlz3ux2G_dPflYPK2kzpaQ,12208
123
- sglang/srt/distributed/device_communicators/pynccl_allocator.py,sha256=zAxWwI73ZNsF_c4PZUnRMzwzSD88v26w8komzZ4Uatc,4771
137
+ sglang/srt/distributed/device_communicators/pymscclpp.py,sha256=8ujiWibMH36TGh0kWnJKcP_AqaVAX0dYhJHtZemRefM,10874
138
+ sglang/srt/distributed/device_communicators/pynccl.py,sha256=TqczleI5orlLfP3UkhccOIQexh_ih1b98kqUxtE42jY,12813
139
+ sglang/srt/distributed/device_communicators/pynccl_allocator.py,sha256=jNvIJiYPiEJYV6Q0kvcdbYZfxjh7wq0yWiRJuWWzYi8,4756
124
140
  sglang/srt/distributed/device_communicators/pynccl_wrapper.py,sha256=BLGEl90GZSl3K-04x7eCTaVmpZBXpcb7uJakAseteFU,18539
125
141
  sglang/srt/distributed/device_communicators/quick_all_reduce.py,sha256=4j1_E4azoxfd8wxtfFmt9rvbQncl8ny6wmTMl6gAkp0,9932
126
142
  sglang/srt/distributed/device_communicators/shm_broadcast.py,sha256=q68niUgh8zF7CgNwqny9vaZU1aHGpLSrxBMiUWZ5Nsk,20969
127
- sglang/srt/distributed/device_communicators/symm_mem.py,sha256=EFN6v2l3Hrxek_1kxDHMMmzLP-bDswhdNW53FrQm2-I,5664
143
+ sglang/srt/distributed/device_communicators/symm_mem.py,sha256=MauP4LGMIKSfoDx-L8o0kaXg7rsAuVDT92ugjlM68xM,5641
128
144
  sglang/srt/distributed/device_communicators/xpu_communicator.py,sha256=ajW6132BvA6jkeipEIgN27TFycI0U06Ih2Z8WNjlA4s,1593
145
+ sglang/srt/elastic_ep/elastic_ep.py,sha256=KaSUAi0JHB82desvcv-TW5_PYCrzQStslOCcl9_g-LM,2311
129
146
  sglang/srt/entrypoints/EngineBase.py,sha256=yKN76witT2jz1zhmLHmPNLGMpK2UiOTaKQ2KPD8l99U,2594
130
- sglang/srt/entrypoints/context.py,sha256=aD-94xkD0komuGO5gtYUoJKCHdc4hAipMxQt04yVRGA,8030
131
- sglang/srt/entrypoints/engine.py,sha256=hDuQJ5XheUZNfScFRBxKHEev_gDTiKH3f6gKtcWfj-U,34950
132
- sglang/srt/entrypoints/grpc_request_manager.py,sha256=0tVlP5eRgQTk1PGWsQtzNrlqd3-HJp67yu3o6jRkan4,32273
133
- sglang/srt/entrypoints/grpc_server.py,sha256=WjToYISgaWQwlmUz6-1PxMd84YPGmTPpbdKvNiukt4A,31208
134
- sglang/srt/entrypoints/harmony_utils.py,sha256=01T-A5GBUm2b306PcxNEg2rfx4cykBcqNYrzcXTWBlc,13590
135
- sglang/srt/entrypoints/http_server.py,sha256=8f9fJhaXGEGwMCsLp5B2Ukk_MDd5dNRYE8NJ5FbLKk0,52423
136
- sglang/srt/entrypoints/http_server_engine.py,sha256=_--j4U04OeJLlnnv1f0XmCd_Ry0z1FlhkrbePX8rYV0,4938
147
+ sglang/srt/entrypoints/context.py,sha256=YQdVLmELQD1tNT6Q1BLl04sATwTJAAomCATZyD19S8g,8035
148
+ sglang/srt/entrypoints/engine.py,sha256=-Cmjdfq9QxXKCXXVSnOfg2LIvpteQlIvr0sMBUn1IZQ,35028
149
+ sglang/srt/entrypoints/grpc_server.py,sha256=3yio35-FDDYwCyt0QwTRDu4Z1ASS20UmqK7Hz6fBbRo,38813
150
+ sglang/srt/entrypoints/harmony_utils.py,sha256=FhpPFnwgy1-qLnu_HZAk5V_RPmQkT81dFVp8A6xINEU,13594
151
+ sglang/srt/entrypoints/http_server.py,sha256=tBGTW1MA_6Dtqb0_z_mWHjmpY9ZLIaGehLHKJITvdJg,55556
152
+ sglang/srt/entrypoints/http_server_engine.py,sha256=rWgdCYLZZP89MA-Y-hfACQqdDu0LC7lLYghi2wk-nU8,4809
137
153
  sglang/srt/entrypoints/tool.py,sha256=aAXEjBqkr5j6_IgRL8fZCKgoDPY2TikM20-LQXU9TaI,2709
138
154
  sglang/srt/entrypoints/openai/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
139
- sglang/srt/entrypoints/openai/protocol.py,sha256=UmPdjkfaFYP2X5NYI0rt8L1w2pdqGYsIcIiCO1bnF7Y,33216
140
- sglang/srt/entrypoints/openai/serving_base.py,sha256=b15N627nn3me2jHzXJBFkWPpX8OJdtD66v8aSsx0i0s,7746
141
- sglang/srt/entrypoints/openai/serving_chat.py,sha256=w1awHs-msdhKEzlMHUA_e_Ptx3qlUcdiUGVLq6ryYfs,49829
142
- sglang/srt/entrypoints/openai/serving_completions.py,sha256=SBoaa9KIIL7NQCWwB1B2A9roTrQW1P9C4fkhuHymo00,18233
155
+ sglang/srt/entrypoints/openai/protocol.py,sha256=NkK_i-Njzxzp_FIVFoOJXonz0kdYLtf_crLBuj69LoI,39612
156
+ sglang/srt/entrypoints/openai/serving_base.py,sha256=-L4lcJCTCJPEmtYHtQXLFgJnvJ3CbUp80uyEI0X_C6w,9665
157
+ sglang/srt/entrypoints/openai/serving_chat.py,sha256=NQs4XRPE7JEV8Mmpe1XSVWKD4VQxr8Fcw1ItLUeO3jA,47908
158
+ sglang/srt/entrypoints/openai/serving_classify.py,sha256=ifEjD-2rq7izbgITMB_nZkrUDN8wj73ZMV634G_HJ4U,7148
159
+ sglang/srt/entrypoints/openai/serving_completions.py,sha256=-kTg3BYaKLmnneKh-1_2QVC0KPg1e2VV1DEKImG9KpM,18831
143
160
  sglang/srt/entrypoints/openai/serving_embedding.py,sha256=H7Nv1vSUuyOUXBeaNvYB4XMFxmcJc8or7MUKyuAw_XA,6435
144
161
  sglang/srt/entrypoints/openai/serving_rerank.py,sha256=G79XdomjzLhH1YCbGR4alSxWO9NNmi7U-YSPsH61cjk,3379
145
- sglang/srt/entrypoints/openai/serving_responses.py,sha256=ro1VwdazJNqm5RRVbMKI7NliPsVMFcrNEsRD23QiADc,54989
162
+ sglang/srt/entrypoints/openai/serving_responses.py,sha256=LDnLzUHpNrIibmUWlqCAtosUg7X3G-AIOvnUJ6etDwg,55122
146
163
  sglang/srt/entrypoints/openai/serving_score.py,sha256=LuwXzWRAMm-xMK8ZjP3JaJ84Gxjr0Oi-e3keCsIgK38,1992
164
+ sglang/srt/entrypoints/openai/serving_tokenize.py,sha256=kgLBC8a_j16T2Gm5nv4DaUjjt9voerrbe-LrB5hJz-0,5525
147
165
  sglang/srt/entrypoints/openai/tool_server.py,sha256=rRNGELPV5RHONp55MYkO4_b0NPsPffJnWg-gMYwDSTc,5659
148
166
  sglang/srt/entrypoints/openai/usage_processor.py,sha256=9LTB5rqdRuMKyZrIXiUBuF_WKaSg9X45YdzERDxbtCY,2746
149
167
  sglang/srt/entrypoints/openai/utils.py,sha256=DT9quW0F1DX1P9NAuMxpERgXcNYKKtm7rd7J1m7EaDQ,2112
150
168
  sglang/srt/eplb/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
151
169
  sglang/srt/eplb/eplb_manager.py,sha256=e8HMGzZb2QFRGdS7JZIFSy8cOIlxOlGRY-ef7Wei0Sw,4364
152
- sglang/srt/eplb/expert_distribution.py,sha256=gd3PktGCSqHLjB5XHhTSA-OtaDVYw-taExCe7NOHM9E,32939
170
+ sglang/srt/eplb/expert_distribution.py,sha256=X28mY6j91VKFbBtMHPwYdFLB8vYtzSjxNF82W3XVGKo,33892
153
171
  sglang/srt/eplb/expert_location.py,sha256=WoOmsZ4u9le44km3nbjJjF6BVBxN3cKRz9nQM0uWH_s,18386
154
- sglang/srt/eplb/expert_location_dispatch.py,sha256=vA0o-7bXf847BQAVCqElWKEpofZLAIsir_d0pew2KNQ,4178
155
- sglang/srt/eplb/expert_location_updater.py,sha256=ScoyCJbtJNQLriQXJNZTV2-5G8-tR3AocZDK3ujMaJk,21172
156
- sglang/srt/eplb/eplb_algorithms/__init__.py,sha256=c6fo4qM8N0p5DyyfGp9fxqc2wkxvzSJBzJFRG1I1leg,1959
157
- sglang/srt/eplb/eplb_algorithms/deepseek.py,sha256=mMZT7zAAArccdRS0xXxifvMb3qn9enSt426uUTKeiq4,8340
172
+ sglang/srt/eplb/expert_location_dispatch.py,sha256=mZUH-jvz7yvxC-5bwMFQalfKbbJiZujMiRK_M9oGOT8,4163
173
+ sglang/srt/eplb/expert_location_updater.py,sha256=7LOmLtY_YWYySI2GgFuTJ__Qde0LEKq70E77Q608OFU,21157
174
+ sglang/srt/eplb/eplb_algorithms/__init__.py,sha256=FBO0vEaWbpURbrSV6Uq753Zm2ukiCTUkDvOd292xU_E,2695
175
+ sglang/srt/eplb/eplb_algorithms/deepseek.py,sha256=LHEW_v5vA6FgH-oFqG4Cu113T-5ZPVdGV791MrM4K20,8293
158
176
  sglang/srt/eplb/eplb_algorithms/deepseek_vec.py,sha256=Vzy5Iarua1VgVHzjBNZaVV_vt1LY1BLtJz7PmzB701k,10654
177
+ sglang/srt/eplb/eplb_algorithms/elasticity_aware.py,sha256=x6ab8G_CCaUnkFDmI6JdzQqaNIXyETW1oCsCx4PPxKY,3230
159
178
  sglang/srt/eplb/eplb_simulator/__init__.py,sha256=HIZaXqsvsOCMMJ81dSs1afSGZ5G6OiOZEtHpltyzzjY,21
160
179
  sglang/srt/eplb/eplb_simulator/reader.py,sha256=OlsWqsuXqVQY7PfvvrP-vsl2Ww2Kg4vD_K9BltM_QHo,1828
161
- sglang/srt/function_call/base_format_detector.py,sha256=DunwyYJxLcwrD-iHDXX9uqJ5S8zMJhUXfzHiBgbXaZ0,15728
180
+ sglang/srt/function_call/base_format_detector.py,sha256=pQjF8ri_i7wc8diX-sGC4FkKi6eOqSUUi39Wu2Q3-AM,15585
162
181
  sglang/srt/function_call/core_types.py,sha256=wLUsW8mUA-i-ISz5QUDL7Ejq72W-K1HIhFa9Wm-_oA8,786
163
182
  sglang/srt/function_call/deepseekv31_detector.py,sha256=hpRjjv219mH0v1PQpMvj_gezrP7PwvLiNbBKOTCSC3U,9731
164
183
  sglang/srt/function_call/deepseekv3_detector.py,sha256=DhO3tUX1nvFlfRkHJ1Vm_7OMXFFTvWBA9u9SZKFAwuQ,9710
165
184
  sglang/srt/function_call/ebnf_composer.py,sha256=OpjfvYowLlMLnxz5fwS7zv5-d43_ZwO9ucGAMsILvm4,15321
166
- sglang/srt/function_call/function_call_parser.py,sha256=NUQCh7dMwRTkudRDFz3Mdr-nDL_zXqABVQYPocGI274,8592
167
- sglang/srt/function_call/glm4_moe_detector.py,sha256=fUqozcc_V2g4Vd0l3BjhZZ0MRKmLinx98-Gm8aOlVgI,6975
168
- sglang/srt/function_call/gpt_oss_detector.py,sha256=f0fjnxNKLb_TrxvNWbmCOB3_KN07NtZacazFpyIcqC8,9262
169
- sglang/srt/function_call/json_array_parser.py,sha256=i985g7MUHj1M8gJ0it3Lw663Bx1uh0biN_It13hnMxU,2227
185
+ sglang/srt/function_call/function_call_parser.py,sha256=JDZzRmXBypTfhGm_hZDmhw6o2XkyWCd4iYyxqvmcsxk,8869
186
+ sglang/srt/function_call/glm4_moe_detector.py,sha256=B4GjjgoDVc4ETyqCowfWQamIhhUDwl6pA9xsAE3sOfo,6943
187
+ sglang/srt/function_call/gpt_oss_detector.py,sha256=ti5Dwci_3J9XzqQetMILY7R-VTCCRbGbHas3DdC5x28,9263
188
+ sglang/srt/function_call/json_array_parser.py,sha256=m37S_3bQtyAI86T3ju80dkKJxuazA1VV0J5ioK1uQbw,2205
170
189
  sglang/srt/function_call/kimik2_detector.py,sha256=VWN4Nf9l9O0uSUR0UppuoAyVObvGw-rVvklFJ1qzbRA,10641
171
190
  sglang/srt/function_call/llama32_detector.py,sha256=trZja7IXc2IWUko5PRj7p4pRU6XCVjtxr-7qJNr0EWo,3647
191
+ sglang/srt/function_call/minimax_m2.py,sha256=1Q5uo-cUUtKykYDeAWx0CxqiDtz2_oC7sprsAJL6Ki4,14689
172
192
  sglang/srt/function_call/mistral_detector.py,sha256=Ts2HrJdu5r2lCCMVKPZfnCds9pt1K5H1EaOQrF_HD60,4686
173
193
  sglang/srt/function_call/pythonic_detector.py,sha256=yAatItKtVDf9uhlB78wPWKP3fbefLJDNGGzFV5ey-YA,8756
174
194
  sglang/srt/function_call/qwen25_detector.py,sha256=nv83_sipZMU6Vie3J4HeNiZVCSRU5ei7601j50779HA,5181
175
195
  sglang/srt/function_call/qwen3_coder_detector.py,sha256=fyiF0WkNwozlKZQy0G903hj-ZAyvEgkFC8l20FVOVX8,14299
176
196
  sglang/srt/function_call/step3_detector.py,sha256=SAibrispu0peDQzqOG2-V93KGHtV6Ud7a38vlnhTunA,17442
177
- sglang/srt/function_call/utils.py,sha256=HeRwtWRrkwipIKM_EBfCgyNxy2It_7kAfPUcBhMERjU,4548
197
+ sglang/srt/function_call/utils.py,sha256=P-iT81YRm1zPV7Y19bkQq5VcV15-XLF1AwoeXWI7Nig,4552
178
198
  sglang/srt/grpc/__init__.py,sha256=dPeDsMRMW8WyHD6jolIpIlvlJsYLAhwewHhCTdu1MAE,21
179
- sglang/srt/grpc/compile_proto.py,sha256=kiaVgK1eEcSMVd5mCed-5cs_78JIawjJ1jQ2U6mdYkg,6997
180
- sglang/srt/grpc/sglang_scheduler_pb2.py,sha256=Q0QVnMvRovwWpFmd3j2-fNLZfuvX_4Hq8iRKM6sz-s4,14182
181
- sglang/srt/grpc/sglang_scheduler_pb2.pyi,sha256=RN5UOWYzxPBFUUcWAaiXPeOB9iclizo7ehFzNrI5P94,23095
182
- sglang/srt/grpc/sglang_scheduler_pb2_grpc.py,sha256=s8WXOFE0a0zGkcfVUxHxa28yA8VOZxua5K31dEXqt_A,9051
183
- sglang/srt/layers/activation.py,sha256=iWEi9wIdAf0xov0KU27JUB5FIl6dqCGQjbIm_9dVSfQ,13368
199
+ sglang/srt/grpc/compile_proto.py,sha256=ZRH11Wodv4BbYo0F-JqA-ymIM-FwkkiAjwM_7msI2uA,7011
200
+ sglang/srt/grpc/grpc_request_manager.py,sha256=ZX4p3ewoUAd9vGG3lNKv9MknFV4BtXJQtP1u8hDJrKk,34849
201
+ sglang/srt/grpc/health_servicer.py,sha256=6h0JFrvVKz5hRBh3pzz_N1Hsj2WgM_Kyd7kfHuJqlDI,7278
202
+ sglang/srt/grpc/scheduler_launcher.py,sha256=GMuNCfF4MYYjJL3O8NqQrg1N9P7T2QyRmpxxXOAYeDw,6563
203
+ sglang/srt/grpc/sglang_scheduler_pb2.py,sha256=ALq0gD19OUC4CdjbOU2YYHGmgTlkJvWX3exX_SOXSv4,16016
204
+ sglang/srt/grpc/sglang_scheduler_pb2.pyi,sha256=ibYeIZPchbx4fcLDeAa-LSnq6MZi-mh4DgzIGg-SUWY,26274
205
+ sglang/srt/grpc/sglang_scheduler_pb2_grpc.py,sha256=8FQtALiqSyWkqL6P_rKerievE9q19V3675AEEomNSe8,12633
206
+ sglang/srt/layers/activation.py,sha256=9NArY7s3okKipcJaVLHuX9Irw71z4c338AbsqeUocXQ,13671
184
207
  sglang/srt/layers/amx_utils.py,sha256=1mENgHK2B8mgaD1oMtgbZ15Jmy_Uu1QueBmo09Ff2iA,2865
185
- sglang/srt/layers/communicator.py,sha256=KzmCXRknuxlRnwdA3G38wRlVHYD_kf76mOZWhaIU5lo,24366
186
- sglang/srt/layers/dp_attention.py,sha256=ly-EMgb_I0neGA0Y4Hq9Z_sp1plIRwoBM3feTqLJob4,16322
208
+ sglang/srt/layers/communicator.py,sha256=ZS1A_wkCaljrOT1nrjQlUhImNFeyZsiONUjOfIa5SjA,24511
209
+ sglang/srt/layers/dp_attention.py,sha256=dBfEtofjY9MlCDF5B-y_zrX-owfZ46mSBYioCzlIoHM,16817
187
210
  sglang/srt/layers/elementwise.py,sha256=tGbN7bbK2s-j3DoJeJfkfyPNmKdVAutAd0J3TbxUPAQ,18849
188
211
  sglang/srt/layers/flashinfer_comm_fusion.py,sha256=hnVVS_VsWukTYhREubWs2KcJ1GjVMEI9ECqxqOMXZv8,6729
189
- sglang/srt/layers/layernorm.py,sha256=WKAv4N6LFDLu9x62XBqGT9xEcrj2W53GtP8ji4zTbTM,11335
190
- sglang/srt/layers/linear.py,sha256=z15L32URxbPUb34_urGDwSWIZNfh1jmyKUF1A9lzI9I,55761
191
- sglang/srt/layers/logits_processor.py,sha256=BYDSuqVCrpo67JFCSvmATfegVwgtJ-2_Bgwp23y-Ds8,28094
212
+ sglang/srt/layers/layernorm.py,sha256=CI1sJ_I3nZMy-cpvcbxIAGk52iFoR6eme9S27cDdPFc,12906
213
+ sglang/srt/layers/linear.py,sha256=1g5vEFHqSd1TPb0VxQiZ5oga45QorYxvj2CZl_NM9wc,56084
214
+ sglang/srt/layers/logits_processor.py,sha256=0xOFWdBdrQYGz7uihAscwjdeiEMgkY9hHrWzia1R_cQ,34792
192
215
  sglang/srt/layers/model_parallel.py,sha256=eLXZhvJ4wG6dh0FontNCIdVZvHYdWgaeY-5cu7TD9tE,6078
216
+ sglang/srt/layers/modelopt_utils.py,sha256=Abhiwmu1VOoSePJWytgFxRw_6qTtN2rqT61DPDboCIw,335
193
217
  sglang/srt/layers/multimodal.py,sha256=vNswe0J0maeBiN8ehlmxfs-YYlrmMllYl6Nc_Y57Neg,5114
194
218
  sglang/srt/layers/parameter.py,sha256=6ce1lx2urWJKz87g2qg_oce_S5BV0IcguSiOGGHbcC8,18378
195
219
  sglang/srt/layers/pooler.py,sha256=uZ6WX1FLMEafZwusyZdm6KuVlIwSjbKrdwk2qzgqNGk,3812
196
- sglang/srt/layers/radix_attention.py,sha256=MpugwaqiY2zPTeg7FVW41OljljCXmYVvHZ2MvneF6PI,3745
220
+ sglang/srt/layers/radix_attention.py,sha256=SqL-15JQWxjoSZyaOxfhGqUE0Vu_55O_ihN5CiPRxfM,5310
197
221
  sglang/srt/layers/rocm_linear_utils.py,sha256=7PPh-5H2IYjiLp_g_szzVBsmiMacZ1RtjVtjdrdFJKI,1374
198
- sglang/srt/layers/rotary_embedding.py,sha256=D6X_HmwtGShR_XKuOBPXtRSmfrUU_VMuJ58HycmRUxY,75058
199
- sglang/srt/layers/sampler.py,sha256=C4iNOK42sfUGKhA9xBZA4xXHDsciC3V_5aPoJr-kpJM,19805
222
+ sglang/srt/layers/rotary_embedding.py,sha256=nAc_bIZN2UFN7O2hgoImNfv4msodVeOFf4ft-gbsS68,101948
223
+ sglang/srt/layers/sampler.py,sha256=CunUv_aB_Dw_SqOimQRdw0W21pG75TMH-lvGRr2fNR0,21177
224
+ sglang/srt/layers/sparse_pooler.py,sha256=9gB8duR48R-FGtA4Q7D1fIDSvbKlD70N38S3Lvg773s,3424
200
225
  sglang/srt/layers/torchao_utils.py,sha256=Ws24FdRBSkTpyeyA6bQrdDm-W5wfDxKvSIPUSahyMfA,4063
201
- sglang/srt/layers/utils.py,sha256=58yO8aKsAvS0jJ3nhOWVR_WAc5oTFiMeAERWNkXGR-I,1945
202
- sglang/srt/layers/vocab_parallel_embedding.py,sha256=x0421kNUgnAb5LnkJR6O67vGZ0ikSD-ThluV3QGsZ_8,22673
203
- sglang/srt/layers/attention/aiter_backend.py,sha256=oovonzjvnijaegNmkyTlWlEhCuhXAMNd85EykvKvvow,43923
204
- sglang/srt/layers/attention/ascend_backend.py,sha256=JwbuW4a-urczuVHEP7oRGOehJOcfUO71LCG3BiQq-zA,27206
205
- sglang/srt/layers/attention/attention_registry.py,sha256=RT9Z1Jg0pM65FO08S9Vs3K_7BxfOYpFsgbl3_FZ-uZ4,6795
206
- sglang/srt/layers/attention/base_attn_backend.py,sha256=AGCPd_VqvvZ0tLExCEs_9RenwhP7nB47nNcbR9VuSJw,3831
226
+ sglang/srt/layers/utils.py,sha256=F_hhE514OZ4cyMklga3mipdUzlrKo3SolIcuqgqqQqQ,1913
227
+ sglang/srt/layers/vocab_parallel_embedding.py,sha256=jPZ6H45qD6ieWV2TqU65YzSaJwRWURoJQ1J-6eOOG-E,22737
228
+ sglang/srt/layers/attention/aiter_backend.py,sha256=bv9yGDu-4oLZlA3A00GDpOWU84cLJ97cW08aVoGEjn8,43935
229
+ sglang/srt/layers/attention/ascend_backend.py,sha256=lb3ZmNZmEqnmf3zng38sA48NBBLn9M9lVXW_UdB6SNw,27892
230
+ sglang/srt/layers/attention/attention_registry.py,sha256=OpiNS5eGkYK05lt0L6zm0NfHZFQKyI-fGtLl3wHqONk,7505
231
+ sglang/srt/layers/attention/base_attn_backend.py,sha256=oYk0ch5ptL2EtlhjyitKvu6H2qCHvrXSjUJVJgPnGd8,4495
207
232
  sglang/srt/layers/attention/cutlass_mla_backend.py,sha256=cb2dMTnDMmMVBG_lqFRciVDiF3PeEAcXYaKDFWszeTw,9849
208
- sglang/srt/layers/attention/double_sparsity_backend.py,sha256=2ZRL_gYz14idoVqQzeQ6N77nXer0f_8_TUYw40XUUz0,9161
233
+ sglang/srt/layers/attention/double_sparsity_backend.py,sha256=wkF1GxFuLsGUWYoPWoqdz0xpePqA_nbo7xd2ha67sng,9135
209
234
  sglang/srt/layers/attention/dual_chunk_flashattention_backend.py,sha256=20vmnq68-Cq62UWIzQU_uwJzq4B8KdJeZUPVoWPiyDs,68620
210
- sglang/srt/layers/attention/flashattention_backend.py,sha256=nuOTQ8Zl2anCrNYDLoDiBhCkd3XE4UAA9ZThcY7zFOU,105158
211
- sglang/srt/layers/attention/flashinfer_backend.py,sha256=3tX5ThHhH4Za0jhONXxxViUxN1sYmuqkdOOD0TGq9Go,52247
212
- sglang/srt/layers/attention/flashinfer_mla_backend.py,sha256=hEoTNUHPM1LJXMPNVY9FGazUnord_Bmr5WsQY0mxRx0,39403
213
- sglang/srt/layers/attention/flashmla_backend.py,sha256=QqQgWIcF90wVqcvsxJR7lHtCtAqkNd9Rdl-tLq7cHHk,20852
214
- sglang/srt/layers/attention/hybrid_attn_backend.py,sha256=Mp1M83ODwHENVvefP2JEjv47ifDt5SA1hoyrJo4OJyU,5128
215
- sglang/srt/layers/attention/hybrid_linear_attn_backend.py,sha256=e8O2h82ZDwgDEXt8QF23IznOY3vq1-LB9vcWum7Y68k,21938
216
- sglang/srt/layers/attention/intel_amx_backend.py,sha256=IU_E7HkPrBLfNG2ArhI1ozHZ_pROujUzdI6g2JuToL0,4154
235
+ sglang/srt/layers/attention/flashattention_backend.py,sha256=jBN4xznXLKxgr_bJ3v3L6TvwgX4QxuH-tAW7Yl3H2mc,105725
236
+ sglang/srt/layers/attention/flashinfer_backend.py,sha256=6yfbhGS1lGhQYqgoLFCVm05fQcniu--D4uQuhCWYCUY,63842
237
+ sglang/srt/layers/attention/flashinfer_mla_backend.py,sha256=lr6SeoyzhgxX25e8Tt6lxCmeJLigNRa5kAmkE2GsARM,39786
238
+ sglang/srt/layers/attention/flashmla_backend.py,sha256=HijFHZZ-pGE75NytFXsS0MIv8d-zWJGRRdfjdF1ViJ8,20860
239
+ sglang/srt/layers/attention/hybrid_attn_backend.py,sha256=_Gol1e_m6vMKhpUw2-OQ37ymC5sIuSTntDylVKSZtpA,5121
240
+ sglang/srt/layers/attention/hybrid_linear_attn_backend.py,sha256=tqwPna30r1zriVhKlit-iVfpfy6hJGxumGKsnlJ20C8,26119
241
+ sglang/srt/layers/attention/intel_amx_backend.py,sha256=8AcbJn0u8ifvhml9iocDzjrtzLEj0oJ7V7bOmkQPefo,4168
217
242
  sglang/srt/layers/attention/merge_state.py,sha256=OnWmNV6LYTUj0y8SCy_IK7A9q6v9bZwR4_XiLOIvbrk,1423
218
- sglang/srt/layers/attention/nsa_backend.py,sha256=yyN3TRmPyxDBaYKsV-c5upK_wEVV3MyjJocw20DCAVo,33190
243
+ sglang/srt/layers/attention/nsa_backend.py,sha256=68NXSaTzqQKL7aVSgmWgDRgPc0OYI3HNU-f9JsEV79E,45516
219
244
  sglang/srt/layers/attention/tbo_backend.py,sha256=MyEQ29I41LCOHXm4_g7J7sXSs5bNKWRlSa2EfqploD4,9185
220
245
  sglang/srt/layers/attention/torch_flex_backend.py,sha256=MnnZLxi41R-d4P0cyklNyefSWOU-AdFEjr8pxJWNgdI,11711
221
246
  sglang/srt/layers/attention/torch_native_backend.py,sha256=NdWD2ArmS1lQN9mZIbS2rcHueBWColNxvhcLaQGAKGQ,9728
222
- sglang/srt/layers/attention/triton_backend.py,sha256=3nIh_oQXVPDZw07m-bkXkAAddW39exOxzNMCDQbc5YA,43564
223
- sglang/srt/layers/attention/trtllm_mha_backend.py,sha256=l6ZbRIZ9Q4rHbsULJ49_MKd32vWdr3IRF5Pi8Dnzv0M,27503
224
- sglang/srt/layers/attention/trtllm_mla_backend.py,sha256=k3e-tD-YjiVs8kOzEXaakCI7g6MDLD99NXMtAscrBZY,29396
225
- sglang/srt/layers/attention/utils.py,sha256=lx_jNw2VwlBe2VnDb1eXRRdN9WArw9rdWHTHqndUEFk,3174
226
- sglang/srt/layers/attention/vision.py,sha256=F_dBh1DpepBt97JOhvQo0sI9tSKBU3w3LOxLT66wBQg,21780
247
+ sglang/srt/layers/attention/triton_backend.py,sha256=30z1z_aJ9jUKGG3rc-2DI6h-3HO3w3hVpcFM18BVSQY,50504
248
+ sglang/srt/layers/attention/trtllm_mha_backend.py,sha256=IQUu3jkCuAY5foqvR6L1IYjjVD4qfmTwG6rfo05ZVkI,27516
249
+ sglang/srt/layers/attention/trtllm_mla_backend.py,sha256=YrC662lqz5nCdGvq_6bdaxWsMYx6AVne8vTjAuQu2n4,41079
250
+ sglang/srt/layers/attention/utils.py,sha256=L1FlCmgWsH-k-ccXcuSiB9Tj4z7b-a7KMWPZKvCXowQ,5478
251
+ sglang/srt/layers/attention/vision.py,sha256=-MX_K0_mX58xkpaS6O93vWIJVqha4iNgYNN5M5Yptnw,21763
227
252
  sglang/srt/layers/attention/vision_utils.py,sha256=6hPPAt8p3SOm7tgHNUesnMLxvQiKbaOM5EK6K-ig5dI,2771
228
253
  sglang/srt/layers/attention/wave_backend.py,sha256=dMsR7GsfDYgVizY8QJ94ASrxiiJ5_MNOuTUDDQzvpPQ,22915
229
- sglang/srt/layers/attention/fla/chunk.py,sha256=N8ToAspPlgR7sVJBImzpmlGV6rWsMA7aTaTa1iddcPg,8929
254
+ sglang/srt/layers/attention/xpu_backend.py,sha256=nYRnYi7ZVyeC1m5WPB8TKpux2mBxCjHOzKZ5QNnCBlo,47650
255
+ sglang/srt/layers/attention/fla/chunk.py,sha256=r8Tddl7p0ae0nH0FU1sU3EpWTtiipdzoijaTMX3_gGI,8913
230
256
  sglang/srt/layers/attention/fla/chunk_delta_h.py,sha256=Gf8RgLesGaR9GM4HTB7kDDCVirwR9XvO7O3I1HWdcuY,10681
231
- sglang/srt/layers/attention/fla/chunk_o.py,sha256=IZllM88Ap1ztEF9nOSfcx7KmRvmwIwiBMqwT9AjjH-U,4980
257
+ sglang/srt/layers/attention/fla/chunk_o.py,sha256=ngvGxIxeHhulkj_FfQgtNY0T-5cwV_4Ochc_6dP6oVo,4973
232
258
  sglang/srt/layers/attention/fla/chunk_scaled_dot_kkt.py,sha256=445twkm9l0Mu9Q_VFBIgUZQzTNLvc82gqIAe8ylip-4,4386
233
259
  sglang/srt/layers/attention/fla/cumsum.py,sha256=beIT2WTSn8Wk_wknoWM3JYQhzmzR1JJwMFzspsXvWng,8374
234
260
  sglang/srt/layers/attention/fla/fused_recurrent.py,sha256=yOSTwqcNSoPWwQD--tcCkVd2OwB5Ox0nLGnLLv8MRr8,20856
235
261
  sglang/srt/layers/attention/fla/fused_sigmoid_gating_recurrent.py,sha256=dlmOu-7DG6YoSNexT3YV8GudrFPn_RiYj-3hClWdy-c,6424
236
- sglang/srt/layers/attention/fla/index.py,sha256=kQGcR1doARV324QuA-faNoyo6u8a_wb-DfiPe_bOdhY,1050
262
+ sglang/srt/layers/attention/fla/index.py,sha256=u4yVogS7a2DrfsYwQ22t60DpO3Y7KF9eAHY1PUrfUt4,989
237
263
  sglang/srt/layers/attention/fla/l2norm.py,sha256=XOs5nGdWROp3FW4fHSObC8sa_x697yDV0jt5UKuLllE,3783
238
- sglang/srt/layers/attention/fla/layernorm_gated.py,sha256=gNAAUyRfnjf5vTx92Gkah5UeumrlgH7oCq0Tg5D_5mQ,9938
264
+ sglang/srt/layers/attention/fla/layernorm_gated.py,sha256=OJEzBNg4JQ6_Vk_ZHWnVPwy8PLbrwuBiw3rt9bLiBRc,10122
239
265
  sglang/srt/layers/attention/fla/op.py,sha256=Qc-zHwZY9-8Aw53AuuzNfpbPBwKgIvVMgtWcfJLl6A4,1695
240
266
  sglang/srt/layers/attention/fla/solve_tril.py,sha256=-Z51hFsLER_Lzn8h21WRUajbVOA1wuu5TSEvaC2AvK8,14405
241
- sglang/srt/layers/attention/fla/utils.py,sha256=yBYjW-blAsq_uZxZ961Dub3cUouIvl4DCKV9UqkQSJw,10474
242
- sglang/srt/layers/attention/fla/wy_fast.py,sha256=zf6_76vq7yYtn9Ir1Le4RVOKLaPNF_4bNST3ePuH0cU,4407
243
- sglang/srt/layers/attention/mamba/causal_conv1d.py,sha256=w1sBOwpJeDKeYK83vPaaep5Vhq2J_qey9JUaQ2vjnjU,4474
244
- sglang/srt/layers/attention/mamba/causal_conv1d_triton.py,sha256=M04m2D13KhSCvsC37vuslNpwbgS4HLaJwWzyWjqev2E,37539
245
- sglang/srt/layers/attention/mamba/mamba.py,sha256=HRGM1fFe_MzVY-6rdkYHndsaSaQB3cOWUCow8bPQYFY,24243
246
- sglang/srt/layers/attention/mamba/mamba_utils.py,sha256=3-iipUQzuHPUDlWYhse2XwtiPYgcblOsiOoozkIoOZs,2820
267
+ sglang/srt/layers/attention/fla/utils.py,sha256=CxcsCXLamjIhbCuj3NUqar1LasPsGGf8WX4acXnF_fE,10451
268
+ sglang/srt/layers/attention/fla/wy_fast.py,sha256=wS1sJq23pa5xK2tUDYRO5FhLLJ5JpHWozBghDl64pYY,4284
269
+ sglang/srt/layers/attention/mamba/causal_conv1d.py,sha256=0Im_XzEA965rT5r09-bm1We1BaPgq2g_yo5nbA7KwvI,4503
270
+ sglang/srt/layers/attention/mamba/causal_conv1d_triton.py,sha256=EqiIga4XzikCKeA9wvLAcK3uTCX-Fop9GQFyzLeNAg4,37660
271
+ sglang/srt/layers/attention/mamba/mamba.py,sha256=qGGEzMVZDDG0dEdUrLxVfWhRa1UI5OLis7dVBMqUpl0,22517
272
+ sglang/srt/layers/attention/mamba/mamba2_metadata.py,sha256=6hkbWuV0do1lFXucgGusqR5ha784g5CB7P7hZaigRNM,8551
273
+ sglang/srt/layers/attention/mamba/mixer2_rms_norm_gated.py,sha256=C60rddCKuf3eD6KVt5vB60LlGD2dYiU9WZGTlEPaoDM,4689
247
274
  sglang/srt/layers/attention/mamba/ops/__init__.py,sha256=r-IpDGRIwTqGJzZoWNGyHqsqqv8oF19pNHEb7_TZR9M,98
248
275
  sglang/srt/layers/attention/mamba/ops/layernorm_gated.py,sha256=hmuL7vQ77aWFENCDsJDB7Nki5DDdMTEiQywbaU4FC04,5229
249
276
  sglang/srt/layers/attention/mamba/ops/mamba_ssm.py,sha256=aCFsiBdBDYt3D5HT0lxt6Rru9-gPYZspBM_WpTGgHh4,13680
250
- sglang/srt/layers/attention/mamba/ops/ssd_bmm.py,sha256=xZEjoVv5zdUeu_36WcS0VO9Qkmob2BwGgJ1RqQmg6w4,8420
251
- sglang/srt/layers/attention/mamba/ops/ssd_chunk_scan.py,sha256=gyph59WoRu7rEuzARSK6731b_gCKx326vZ9X-Is1qbs,20380
252
- sglang/srt/layers/attention/mamba/ops/ssd_chunk_state.py,sha256=yaZ1Hpj3XNSvFA0wSXkEBBZZKgy0441VrHgLBcp8r6w,24392
253
- sglang/srt/layers/attention/mamba/ops/ssd_combined.py,sha256=ivE3zqD31W01W7_RgpRG8Tfh11Co4mjbz2H6fWzGBP8,8909
254
- sglang/srt/layers/attention/mamba/ops/ssd_state_passing.py,sha256=lCt7NzzUbyCcnfDB2ai_agVM_hoZvfrB1d-UbFO8WWs,10377
255
- sglang/srt/layers/attention/npu_ops/mla_preprocess.py,sha256=n6iR86qvKTYY_mC1EMxMiyHQaXZ8pF9o2iNCV68BA0E,14540
277
+ sglang/srt/layers/attention/mamba/ops/ssd_bmm.py,sha256=IGOJ67TLx2WQQwDFm9jw2OU8vTZc0daVUnQF6kcu2x4,6798
278
+ sglang/srt/layers/attention/mamba/ops/ssd_chunk_scan.py,sha256=n70BQM8Dpg7_shX87ay3QvBEUO4fEcmg1OopU88KPiE,18405
279
+ sglang/srt/layers/attention/mamba/ops/ssd_chunk_state.py,sha256=Qdzx_4DIwl1-g_c24lRWKfmLTL29rxn2aRELWfuUct0,20784
280
+ sglang/srt/layers/attention/mamba/ops/ssd_combined.py,sha256=evYcNq31qo1TeaJP8Q3yttBQODici594N4kpdgT7hrQ,8880
281
+ sglang/srt/layers/attention/mamba/ops/ssd_state_passing.py,sha256=pNjxxLYw2BsTwy5-m7RhgqTZ9H8uyQFX2GQVucWU4wE,10032
282
+ sglang/srt/layers/attention/npu_ops/mla_preprocess.py,sha256=3_jiUFd2um4mOwG2FaNHWfwbRbjko0c6EeDfdlUiGO4,14554
256
283
  sglang/srt/layers/attention/nsa/dequant_k_cache.py,sha256=ie1qLy7AAipFYS0EJFrunN8Mq97D9v-noWaJBYMiv0I,4973
257
284
  sglang/srt/layers/attention/nsa/index_buf_accessor.py,sha256=jPYRgFfTdH_g83OUs9q3ncj2Y036ikBvflMjYEjrHGw,11481
258
- sglang/srt/layers/attention/nsa/nsa_indexer.py,sha256=FgK_o31MRswHX8CQiX9jPp04z_P7GgBumC91v_pRJHM,26466
285
+ sglang/srt/layers/attention/nsa/nsa_indexer.py,sha256=qTzO557wWrB7RypNvX1i5_C5vr66X_YPjEgJiV_TP3E,25368
259
286
  sglang/srt/layers/attention/nsa/quant_k_cache.py,sha256=FYl6gp16uGU3ftIHkU5vFAjfdPnoKvWOg4l7TBKkGI4,8675
260
287
  sglang/srt/layers/attention/nsa/tilelang_kernel.py,sha256=Iifd9YYEnDGkRhjK0NH-pbyTiQX0kVpJynyGwZcnH8w,31554
261
288
  sglang/srt/layers/attention/nsa/transform_index.py,sha256=0yurXIDt5EQ9k_P5g_aDXohdzvSiBQcQpCHBcNf0ZBA,4745
262
- sglang/srt/layers/attention/nsa/utils.py,sha256=qiUetSApDNI3Qz4_3-NVh_-mknU8ZHgA9sejb6PQKfY,901
289
+ sglang/srt/layers/attention/nsa/triton_kernel.py,sha256=FyInDj54ux1IctSGlPd82iq-aGY-UfXJvd1KIPO9LTI,3974
290
+ sglang/srt/layers/attention/nsa/utils.py,sha256=_Ni-gYZTx5MXbIV2i5-7MexX6N5vsZNYTY-b0GczXRI,822
263
291
  sglang/srt/layers/attention/triton_ops/decode_attention.py,sha256=JnOtqtPXEgn_T0R4gGCROx1szlAhu_G_ODNKCazz0lE,20554
264
- sglang/srt/layers/attention/triton_ops/double_sparsity_attention.py,sha256=FbgrPO5GvEGEvojV7Ss0jX7384e9vuzX2goDCQuP1Zk,31124
265
- sglang/srt/layers/attention/triton_ops/extend_attention.py,sha256=eYg4xQoH5gBkM7bjzpBIpTdcelvUK3BujJ-8eXRCm70,17108
292
+ sglang/srt/layers/attention/triton_ops/double_sparsity_attention.py,sha256=TGnhUIoTsrFmOAVspsGpG0F_ORB7EMahM4v7nl7tNoQ,31105
293
+ sglang/srt/layers/attention/triton_ops/extend_attention.py,sha256=KzkbTOStDiIb76i5F7yLRZL0ThuZdBzv290KB2FZDow,32920
266
294
  sglang/srt/layers/attention/triton_ops/merge_state.py,sha256=v9nD01a5eTnkwZxMwERtrrRfC5rs6GxkYOpErkAPcYI,2877
267
295
  sglang/srt/layers/attention/triton_ops/prefill_attention.py,sha256=waZsmpKIp8rTgFSoM4QMabJuLaB3yW6ltOzAKJksBoE,6260
268
296
  sglang/srt/layers/attention/triton_ops/rocm_mla_decode_rope.py,sha256=664WnAJ91EiCUZOcnVDfbTQf4uGJ4ZDZB1CbxpEUFZc,13866
269
297
  sglang/srt/layers/attention/wave_ops/decode_attention.py,sha256=oJNBG57cySgxtmJe1MSEsZKOIQOXnH0iVAcFO6DUWvY,4732
270
298
  sglang/srt/layers/attention/wave_ops/extend_attention.py,sha256=LyZQQIvFYfcIcObgy_tETK5JxRLgAkOYlF-KhGcGEoA,3877
271
299
  sglang/srt/layers/attention/wave_ops/prefill_attention.py,sha256=viTUit0rxjVV5UahuwmVAhmL66YRFJD4g1YhH_oRBu8,2344
300
+ sglang/srt/layers/deep_gemm_wrapper/__init__.py,sha256=esJMd0Yuj68t6QYOpmIFuiWP2J2dxTMC4bRBNH0Xk6I,26
301
+ sglang/srt/layers/deep_gemm_wrapper/compile_utils.py,sha256=EoRu5a-eiXcBZV9bVJ0x8ATLpKLt_AUeTNixdeJ1bSw,8070
302
+ sglang/srt/layers/deep_gemm_wrapper/configurer.py,sha256=vkMBNZx3RqukEtxMUAbTfKJii3MDXLBs83ZlsgtxNiU,559
303
+ sglang/srt/layers/deep_gemm_wrapper/entrypoint.py,sha256=5VTBfCU6wTBS2uMJc-luyqawh1478w3Jh1qk39qhjlI,3199
272
304
  sglang/srt/layers/moe/__init__.py,sha256=P8OC-pUE5yeEr80QUDqSPwF9a9BAYPuaK7GNlQovsJw,863
273
- sglang/srt/layers/moe/cutlass_moe.py,sha256=JKJED-4709ndP5AwhQ7Vi04GJjw5d9Xl_mWOsZPZ3U4,14298
305
+ sglang/srt/layers/moe/cutlass_moe.py,sha256=335MeGbcVPsAI9oaEQCVSMxzzQ9YV1qPiNxINXtvO48,14206
274
306
  sglang/srt/layers/moe/cutlass_moe_params.py,sha256=9NRCmgP_Ug3gGqCcpi-x-QRbLjCNpw8792gKXwZsbEU,6522
275
- sglang/srt/layers/moe/cutlass_w4a8_moe.py,sha256=psvH2RhUQkK4oyaSE7xe0EncCqLvNbd_NwR4XHxk79w,7017
276
- sglang/srt/layers/moe/flashinfer_cutedsl_moe.py,sha256=4TS3YLrmxn5dEHYUKeY7aohBXYeAsU8UCx846NXFTw8,6197
307
+ sglang/srt/layers/moe/cutlass_w4a8_moe.py,sha256=2vVS2bhUuKRsDnPR2cNUKli9Pbi32lzQ--0jRpyYB_I,19210
308
+ sglang/srt/layers/moe/flashinfer_cutedsl_moe.py,sha256=ULLAdfRad_sG2ZYXE4qMCOutQX0eckQt0fwwhfcsckA,6186
277
309
  sglang/srt/layers/moe/fused_moe_native.py,sha256=XzJPM9Z6YQ4ejrMrBFt3l1i7guBcdQTXo9-gT5H8AIA,3479
278
- sglang/srt/layers/moe/rocm_moe_utils.py,sha256=07Z99bTV3B-b2Cbm-odhGpx2twxtnVpYvaDMBE1K3LM,4555
279
- sglang/srt/layers/moe/router.py,sha256=eUNu_Uz5VB2FOZzZyYuZo5pokCVBS17_fcjHQbmvDSE,12181
280
- sglang/srt/layers/moe/topk.py,sha256=HcvKwbew1W4NJ-IGCp2aietW3o3KQPRuC7siRrjavt4,32240
281
- sglang/srt/layers/moe/utils.py,sha256=HPRJy9cYYPAV5jU4dPYidIpVuSyk1HgaJrePQyD21Fo,6361
310
+ sglang/srt/layers/moe/rocm_moe_utils.py,sha256=SglTXIzpiWKFKVEf9gS8SEocJYcSOmeKUKjHznfC_nI,4527
311
+ sglang/srt/layers/moe/router.py,sha256=ouSNu8XU2w-BICyAYPpFq2zPb11LyTDalZElh0AXGus,13675
312
+ sglang/srt/layers/moe/topk.py,sha256=bjmeGhdwlSOeQpzb2XjBVNcpCX-L0chN5aanzXmTw3Q,32310
313
+ sglang/srt/layers/moe/utils.py,sha256=UZsd1KCXNZ4XFWNnxZiNywsuYEtA7xOQLd52c6RZC9U,6701
282
314
  sglang/srt/layers/moe/ep_moe/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
283
- sglang/srt/layers/moe/ep_moe/kernels.py,sha256=WfHn5Kt3NH6MzawvtycMSgo_WDqg1aJQXp1HuqgNAP4,46168
284
- sglang/srt/layers/moe/ep_moe/layer.py,sha256=7Aekn8YmGXThshcbMY7dk4fMVNLsTQ1_MnDLWwn5S6E,35667
315
+ sglang/srt/layers/moe/ep_moe/kernels.py,sha256=jsSLb_D7u60_8NIHxTEoEerRAbQFJXPWJHMpRVsEyOU,37898
316
+ sglang/srt/layers/moe/ep_moe/layer.py,sha256=jra2o5MZ2od5T4J3CiJH7XZor2zW94fvcP7j4IvvqCU,19836
285
317
  sglang/srt/layers/moe/fused_moe_triton/__init__.py,sha256=tis0ZJmih7gKHCurbLtY_o-bY3K4MOzQLYLC3ftIOf0,977
286
318
  sglang/srt/layers/moe/fused_moe_triton/fused_moe.py,sha256=mKH6zTTuh_Z8Ceg6d1VWjGBI3iPBn1YfGO6udxIRAtU,23306
287
- sglang/srt/layers/moe/fused_moe_triton/fused_moe_triton_config.py,sha256=1iX5ox2KT5sgLHrN6l4svsgtn1-q_6514Q_F1v83-iY,7747
319
+ sglang/srt/layers/moe/fused_moe_triton/fused_moe_triton_config.py,sha256=0jTqnuw8v6uwr4g2IJ6bc3PRq77HF96mEYaSOBmpTAQ,7983
288
320
  sglang/srt/layers/moe/fused_moe_triton/fused_moe_triton_kernels.py,sha256=QOdl5uhZ8--aryXnKObdspKonGcF6Tc_U9o_lC_opo8,27760
289
- sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=1FGnf9QRSEPYdOZzvu-DFuz2DYDY0u7TaW0IuDYm-i0,39690
321
+ sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=QvljwzkINsJEt9q5HkS-0KC0QDq_vuTIMJh2QAkH_18,39827
290
322
  sglang/srt/layers/moe/fused_moe_triton/moe_align_block_size.py,sha256=U93mxPPU2RP7d3QRSvoG3OCtUQIK8YhQfHf1ZGeREmY,3284
291
- sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py,sha256=Ai06BZ7uxMnk0nPWQelgvi1rV9Z72FetRo6p7E3rsYs,10986
323
+ sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py,sha256=g1duB_VckkfiqyB5ePWRv8Nndwr5OoqnN9pEiVUrVXo,10408
292
324
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_1_0/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json",sha256=iNGsE2ZeVnQEnN4A8UJ9Jv0d3hbRF2MJ9oBgjup5Szk,2737
293
325
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_1_0/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB.json",sha256=JJN0hryyLr5Zv3dSS7C8cPFhAwTT6XxUVnBGMZvV6JA,2752
294
326
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_1_0/E=1,N=1792,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json",sha256=ouRyZ5PEMPP2njPftCNhs-1g1y6wueWLmhI7G1SjV1k,4131
@@ -473,6 +505,7 @@ sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py,sha256=Ai06BZ7uxMnk
473
505
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=385,N=128,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=rgF-KSAUXmI7QGrhMUywPVfeTxz_j8_IP4N-6bkYdak,3260
474
506
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=385,N=128,device_name=NVIDIA_H200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=7aaoi0MI2xC5ZJkflkTZAH4tawTPdmUpmcBOgOInKxs,3268
475
507
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=8,N=7168,device_name=NVIDIA_H100_80GB_HBM3.json",sha256=a9XJZ0XudUTebAdN5guVq-3XSvZetHIRjatO1-_0xCk,3257
508
+ "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=128,N=192,device_name=NVIDIA_H200,dtype=fp8_w8a8.json",sha256=-MZaZ4R9r5Rk8a9OEa1eM_S6INlcsX68Bj5_pM4Aa0U,3257
476
509
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=128,N=352,device_name=NVIDIA_RTX_5880_Ada_Generation,dtype=fp8_w8a8.json",sha256=L7acUMDmYZOeA-riEds1-r9Wsq2KBWJlG7X7rilWjfA,3254
477
510
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=128,N=384,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=6JYGN4imwzIrQAEgboSO93wWYBuguzTgBjfTedq2c_Q,3250
478
511
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=129,N=352,device_name=NVIDIA_B200,dtype=fp8_w8a8.json",sha256=ClPogINm5AsnjDqx6Hz_rHrmnnCdUPid-jYIdIgjZxs,3250
@@ -480,6 +513,7 @@ sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py,sha256=Ai06BZ7uxMnk
480
513
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=129,N=704,device_name=NVIDIA_B200,dtype=fp8_w8a8.json",sha256=W8C1GtP4K43SK9128U52DD5WWofvPleAJE4us2Qju1k,3251
481
514
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=161,N=384,device_name=NVIDIA_RTX_PRO_6000_Blackwell_Max-Q_Workstation_Edition,dtype=fp8_w8a8.json",sha256=RMYwqtB7hYeaCyuZ1feVnRhBGlN4jMcmNQX2hqUqBlk,3254
482
515
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=256,N=256,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=T6kCtCUytCxiW8JOLfEF3YgdCD9_mKccJ85IqT0b8LU,3253
516
+ "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=256,N=256,device_name=NVIDIA_B200.json",sha256=NkLVci5u2GGeuFbC3d_6PicBS3mSuV77JICCSzU_8cc,3238
483
517
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=256,N=256,device_name=NVIDIA_H800,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=M3W1OQU6RgKAQL2EoYivAIidtz1cvgoK6_6ntNfn_lY,3265
484
518
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=256,N=512,device_name=NVIDIA_H20.json",sha256=bSe-KUwiVT3yM9jQuXlDmxe_KUft7FUn5zOby8bpSkc,3233
485
519
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=257,N=128,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=RbJYTRfjP_3-ytfj53W_w2jFpZ9xwMaqoKW52pkgP3c,3257
@@ -496,49 +530,54 @@ sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py,sha256=Ai06BZ7uxMnk
496
530
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=512,N=64,device_name=NVIDIA_H200.json",sha256=phmhkQNz8DcLHPqN5tjmJqOgbX0BhQx9cP82fp_jyIQ,3236
497
531
  sglang/srt/layers/moe/moe_runner/__init__.py,sha256=Dc4PH6HfzQDjJWL7iuZ-0qh8oRu7OtnH6IEl675pYiU,172
498
532
  sglang/srt/layers/moe/moe_runner/base.py,sha256=GMdFI74BGO5HDjtel5QWI7W4CFix0BHkw_HrjVswhcw,8905
499
- sglang/srt/layers/moe/moe_runner/runner.py,sha256=7ZOqDu0r1GY-9ra1VICq4WmH1nJVSQoE5yBXuSUr2CI,2669
500
- sglang/srt/layers/moe/moe_runner/triton.py,sha256=YaPqGIX-5y25nxmjF54_ASYbr9Dw4RYze2cNV4cUg-Q,14433
501
- sglang/srt/layers/moe/token_dispatcher/__init__.py,sha256=I5I1ySCHbyAW5cFQy9mpuqkSWqLclLmi2AspCkoP8ig,993
502
- sglang/srt/layers/moe/token_dispatcher/base.py,sha256=BqqwuSETP47vTaHkUoQWTEeZcAkg0n_Dgka-PkFM4uc,4029
503
- sglang/srt/layers/moe/token_dispatcher/deepep.py,sha256=LtsaJ3bR-HBQL9ZWjgbw-HaP-hcAqAgrmpO-829PL94,26293
504
- sglang/srt/layers/moe/token_dispatcher/standard.py,sha256=_OSudEOHA5qHqR5TJqnylQxUYyk7ZnhRMGOf7sMCyt0,1526
505
- sglang/srt/layers/quantization/__init__.py,sha256=GmJvVSlkJXf2AmTfWBN6EBrOhhYlxPYNE_eAEXMZfjs,7813
506
- sglang/srt/layers/quantization/awq.py,sha256=YuAkweqSvQQGTGQvg4VpNXevSaJvT8CROpiNzmY_3tQ,26980
507
- sglang/srt/layers/quantization/awq_triton.py,sha256=4XwJbRNlFmlvjbMGtWF1Wvk26Kf96162vNEmuI5Kars,11737
508
- sglang/srt/layers/quantization/base_config.py,sha256=ql3kwwnjVzZGh8BUcimMt8K6kFxQtVbR5WgZHXqkOqA,7245
533
+ sglang/srt/layers/moe/moe_runner/deep_gemm.py,sha256=Ntif63j3HYofgc8f1FED5sRQrzGsnBKiwuTdalGGWp8,18123
534
+ sglang/srt/layers/moe/moe_runner/runner.py,sha256=eJhOjzbKwcNSGztwTKAJxpcSYm9pqv_C60MJGmPkr_g,3041
535
+ sglang/srt/layers/moe/moe_runner/triton.py,sha256=pYzFyJDocnBfNiF6kp1cnSZmKKTsLOYXpAUXFZYKOsI,14464
536
+ sglang/srt/layers/moe/moe_runner/triton_kernels.py,sha256=qsV9-k9iblqxE8J4JWyJS3Mfd7he7aZUYbIa8QTY1vo,6350
537
+ sglang/srt/layers/moe/token_dispatcher/__init__.py,sha256=rFv-j_zeUrKEOniMaODRi3EUaRAIufj5jIMGt45JdwE,1305
538
+ sglang/srt/layers/moe/token_dispatcher/base.py,sha256=joEgkYGDKlyYyb8hCOTYI_jAnZ1M_IRaT8WshXiolZQ,4253
539
+ sglang/srt/layers/moe/token_dispatcher/deepep.py,sha256=S1ucIB4erQgOqfAC21cB3e-WAFCxaSFH7DgxNUlXbgQ,26705
540
+ sglang/srt/layers/moe/token_dispatcher/mooncake.py,sha256=ZQpjlv-WvEvTgFE6R_zuzFZXOfbRwVvXFYpOnWuCBXk,11855
541
+ sglang/srt/layers/moe/token_dispatcher/standard.py,sha256=fbYsC4iBmRL49ha-wPSL24hP9qEZMUMeHTxIj9By9Ko,3462
542
+ sglang/srt/layers/quantization/__init__.py,sha256=4kFbEgYmLsV0H5pwU-M-yJSYzSzaBI7dFOF6N4CRB90,6301
543
+ sglang/srt/layers/quantization/awq.py,sha256=zm3wcy7k90cNlFvPT7uY2JsravExXaZuC4a3nsRdKss,33343
544
+ sglang/srt/layers/quantization/awq_triton.py,sha256=1QwpxPoqcfe3sDU8uRs3LXBRcDZvq-M9xQ7NE9RV0Mc,12658
545
+ sglang/srt/layers/quantization/base_config.py,sha256=NP7QyI1lCq5JxerPIDTy8TYQqOwSRGreNeD-Sye2Zus,8214
509
546
  sglang/srt/layers/quantization/blockwise_int8.py,sha256=pqSLo4gwazZ4ajdVzyouwh_Z5oVDbWq9wo8RnrMdY8o,13998
510
- sglang/srt/layers/quantization/fp8.py,sha256=pMr42f5f4QDQcOYmo3g2VBv_Dh8li85KpnbKYa2oNyo,50739
511
- sglang/srt/layers/quantization/fp8_kernel.py,sha256=Mgigb6GmF66oCrgjS97IvDDSacNYb0u-VYAf4FChhqM,54849
512
- sglang/srt/layers/quantization/fp8_utils.py,sha256=sxsjlqL7sWXwbgsxwfzFSkojyN3w8KQh1R99JEWdBl0,29191
513
- sglang/srt/layers/quantization/fpgemm_fp8.py,sha256=dq7rJz-QB9LovmZZLBMK8YJEOr05wjVrtWLmSTkXjYw,7004
514
- sglang/srt/layers/quantization/gptq.py,sha256=Qe6XfBWd9aOW7jkLmQR61AjmJRe5MJi6FJvGno1HH4k,39433
515
- sglang/srt/layers/quantization/int8_kernel.py,sha256=GfRC9FOn9exNvK4QHbUeBj3Hhv32VcyGphapFPt5b84,12625
547
+ sglang/srt/layers/quantization/fp8.py,sha256=75F0a9xRIGCmZTY_KGsEEYu0VXQFJTJyWMLo2BTOjhQ,53658
548
+ sglang/srt/layers/quantization/fp8_kernel.py,sha256=noTju6oEzKQ4mOcgWF8s0sFL5g-PuxLrCivvSbKQJWI,56181
549
+ sglang/srt/layers/quantization/fp8_utils.py,sha256=enZUimrleDg7RJhoh7uxVLRYd1dSMKeCUhaXuwWAYyE,29831
550
+ sglang/srt/layers/quantization/fpgemm_fp8.py,sha256=OpDJAOBpy3PtAvDwG3ZIA4ItMFvrodxAHTkHQnT_cso,6967
551
+ sglang/srt/layers/quantization/gguf.py,sha256=XCjW3-Xe63mwNUDT02U09JiBUMdxxX_slmeaoWMEIP4,19824
552
+ sglang/srt/layers/quantization/gptq.py,sha256=oAlxR3qX06Pwc9-kkrzu7W4j0K-zWfi2JQL3yO0HHCI,39377
553
+ sglang/srt/layers/quantization/int8_kernel.py,sha256=nl3bmwcgvs8SCe3_jz0hC5f6HfdohhEMyeWM_t8Zx5Q,13124
516
554
  sglang/srt/layers/quantization/int8_utils.py,sha256=YK9CS-lb_n91kNCTKK5o5apYF31V2giDg5G5VKrpcUA,2356
517
555
  sglang/srt/layers/quantization/kv_cache.py,sha256=_9pF5rwvB7ta6Gdc5YKVVGbNzYwqmhIx4TrX1-xnodQ,3261
518
- sglang/srt/layers/quantization/marlin_utils.py,sha256=aM3GU7b7rHNZE-tZjRSrtOaPWzSaMcLxck4he8MlEVI,26344
556
+ sglang/srt/layers/quantization/marlin_utils.py,sha256=Zvasw0DpgMQKTNJm1ZNGLt3P1AKgDfYhTpePdI9BbQ4,26634
519
557
  sglang/srt/layers/quantization/marlin_utils_fp8.py,sha256=iSjq-ikPOTU5plrWNTW4MletKLySIrNl5NhQmY6FyAo,12508
520
- sglang/srt/layers/quantization/modelopt_quant.py,sha256=qDCoZxsZnZmi6RM3LbIw61Zzm3UM_vM9nRvIUOwcmCA,59352
558
+ sglang/srt/layers/quantization/modelopt_quant.py,sha256=yKs6xczPfjKV1UKB5S50nol4rRURMX4m7_7pYIYJZU4,60689
521
559
  sglang/srt/layers/quantization/moe_wna16.py,sha256=uoRhxJ8W_U_VFpbn03YEp0aCjbzqquWwonjuN7KBucw,19117
522
- sglang/srt/layers/quantization/mxfp4.py,sha256=mb_DeJgrmEBS2CREZ09WsQVetxLozq3a4HhxqMq2amY,32993
560
+ sglang/srt/layers/quantization/mxfp4.py,sha256=9DurnjCX2BBWveFfE-ISTAhE4VOW0BB0ZNPMsrgxYEM,31337
523
561
  sglang/srt/layers/quantization/mxfp4_tensor.py,sha256=bGeCXlIOhmFZFGWp_lITkIRDEgGUaLpawDvMy1cTOmA,5389
524
- sglang/srt/layers/quantization/petit.py,sha256=74Jn0eICq23v_b4rEctDaYTINtbqkdM6IXycT-_FbbI,8954
562
+ sglang/srt/layers/quantization/petit.py,sha256=foRPfOfhq02h6yMt-8yHKofQB6l16Pz-bRCqUD3iiHU,8944
525
563
  sglang/srt/layers/quantization/petit_utils.py,sha256=-gy4zMhqNoIA1R0n7-5C0efV54jHonCUgPDUUFjGsyM,3245
526
564
  sglang/srt/layers/quantization/qoq.py,sha256=jM96uJfKz3vo1B6SSIrQXNT3vnD3UJrepK2eY-tSQU4,8139
527
565
  sglang/srt/layers/quantization/rocm_mxfp4_utils.py,sha256=Z4pYWl6ExOXq2qfTHorW16hVbJ-Rk4G8Wrxn_x8boHE,327
528
- sglang/srt/layers/quantization/unquant.py,sha256=T8w0mPvtBM1JhGhle6NoDY9C4xfmPWHU_VEJZWSnUNY,16079
529
- sglang/srt/layers/quantization/utils.py,sha256=d4eaS4-Z4q3GRgb4HDMr2EoWEdQCefrVdJufK6n_NQY,18509
530
- sglang/srt/layers/quantization/w4afp8.py,sha256=uSVtBXYIKPMa_Li1HHyZEifdaNzVCr-lTiEwRnIexD0,12148
566
+ sglang/srt/layers/quantization/unquant.py,sha256=FtgCj24edm9AhrPpEqMAIf8w1Sz83EQ5dgBYXnRuGCk,15043
567
+ sglang/srt/layers/quantization/utils.py,sha256=yqgmoLvrrp5aRj-LTJZ6dI1hmP1UFgbpyjVWJJdomZQ,18472
568
+ sglang/srt/layers/quantization/w4afp8.py,sha256=dm8Um2oraXdrNXiyrdDshg-z3_aSTs_V7Eh-z3o9PuU,14155
531
569
  sglang/srt/layers/quantization/w8a8_fp8.py,sha256=ugLV4G4MDog-UuLqSnEasBqE3Hh6AqE5ZYI371ean90,10415
532
- sglang/srt/layers/quantization/w8a8_int8.py,sha256=e5mrRf7AWfit-5dOn3Ul9nTLt6OJth6SgrVpEdnVdE8,37076
533
- sglang/srt/layers/quantization/compressed_tensors/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
534
- sglang/srt/layers/quantization/compressed_tensors/compressed_tensors.py,sha256=Jfvvu0xL9WR075I2Qx8prTfGp77hKwkDH--V3R5pBpE,25928
535
- sglang/srt/layers/quantization/compressed_tensors/compressed_tensors_moe.py,sha256=tFw8PIF5r8yjdJFt2_3Ou72vUJvgLd3bXFOWdgsCeno,26732
570
+ sglang/srt/layers/quantization/w8a8_int8.py,sha256=WkhbRVnEamh78uyj9WyS9OfeSpZTsWh51kDCH4HICa4,37534
571
+ sglang/srt/layers/quantization/compressed_tensors/__init__.py,sha256=zMpLnf9GiRhV-jg1H2UiZ6OUMSKMcmLtrr2A4XjhuUs,217
572
+ sglang/srt/layers/quantization/compressed_tensors/compressed_tensors.py,sha256=P8RmY91K2a__xNQI69zqTuGFnFCBE41DGUlp9WutKJQ,24948
573
+ sglang/srt/layers/quantization/compressed_tensors/compressed_tensors_moe.py,sha256=yUITBLC024lXAkVh3qfvd6bX_U0prVMbX4me_gtqUWI,38895
536
574
  sglang/srt/layers/quantization/compressed_tensors/utils.py,sha256=mnUmKWFQUnY8bVoFHUuNVwqsfS-cefeR-ofyaihCXcY,7621
537
- sglang/srt/layers/quantization/compressed_tensors/schemes/__init__.py,sha256=ipQ5M4UkFHVsuAm2u4yZJd86NHtOenyeeahBtiLBLaM,448
575
+ sglang/srt/layers/quantization/compressed_tensors/schemes/__init__.py,sha256=qhx1YhMH6dzvnzLSSN1uQDE3wDHMoOA_HRkjn6lsvzU,589
538
576
  sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_scheme.py,sha256=tdKJC8c3SX8T3z8JL-1YCsg4ftcv55Wxt0vZrYftpX8,1635
539
- sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a16_fp8.py,sha256=VvqVpAr66AlS5IPVuIR5Nu0ESH0oAoKo545jNart6lI,5493
577
+ sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a16_fp8.py,sha256=kDkks4z5zCh3bBoAo0_I3Yyp0--a_sQBY2zNs2wzJ0w,4982
540
578
  sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a8_fp8.py,sha256=4cfB6pv7kt8Ek0e88vLyXymSW6VqbAUpIjNt_-KK9-M,6318
541
579
  sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a8_int8.py,sha256=6usNdpr8mL5QRlTK_pZQtGwgmSMNi0KdMfm57kq3lw0,6908
580
+ sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_wNa16.py,sha256=uG3dvlNuP5ZC3_NxIhjWWkrUVw4FQxlt5jobzaofAHM,12884
542
581
  "sglang/srt/layers/quantization/configs/N=1536,K=1536,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a8,block_shape=[128, 128].json",sha256=RdHQxWXwXqvio31192vsLaKjEr4f_DjpMPKlarY1IAk,3251
543
582
  "sglang/srt/layers/quantization/configs/N=1536,K=1536,device_name=NVIDIA_A800-SXM4-80GB,dtype=int8_w8a8,block_shape=[128, 128].json",sha256=0vLaJgo5B9ti-XMFKJuvSoMGjsZQ-RhHSx4cC8Xji-U,3254
544
583
  "sglang/srt/layers/quantization/configs/N=1536,K=1536,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=tkLjwLC_aVXhzuvo-2QHkojXZauPJsf3jNHFn1S7uRA,3244
@@ -691,325 +730,350 @@ sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a
691
730
  "sglang/srt/layers/quantization/configs/N=7168,K=256,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=PD4AJYCkHfy2ivv9baMouFXzBTy0eKMumbAfxfm91HI,3256
692
731
  "sglang/srt/layers/quantization/configs/N=7168,K=256,device_name=NVIDIA_H20,dtype=int8_w8a8,block_shape=[128, 128].json",sha256=FImA-TJ_tQDjqwoNWxS--sRDoKDXf9gamlME3tkxH58,3252
693
732
  "sglang/srt/layers/quantization/configs/N=7168,K=256,device_name=NVIDIA_H200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=FFBjSWlpKXMxfAUUYUqXbOK_Hd7qBeBsfbcaa9uB4qY,3249
694
- sglang/srt/layers/quantization/deep_gemm_wrapper/__init__.py,sha256=esJMd0Yuj68t6QYOpmIFuiWP2J2dxTMC4bRBNH0Xk6I,26
695
- sglang/srt/layers/quantization/deep_gemm_wrapper/compile_utils.py,sha256=PI9r3PHCMK9EgpoFuBgR4jvokA5sBz8zyC47ps3wet4,8164
696
- sglang/srt/layers/quantization/deep_gemm_wrapper/configurer.py,sha256=a1b2P8-5PRNwW1ykXR7jJF94aUF3u3t3P9ad_R1k2PI,549
697
- sglang/srt/layers/quantization/deep_gemm_wrapper/entrypoint.py,sha256=qiUuQn-InDLYVNDPFOxde2XB-qlE0fol0HPTkY5KN8g,3197
698
733
  sglang/srt/layers/quantization/quark/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
699
- sglang/srt/layers/quantization/quark/quark.py,sha256=EqQvWzAc6nd_yl6UIMIwmozKif4I8fRNfBum040UUEQ,14613
700
- sglang/srt/layers/quantization/quark/quark_moe.py,sha256=fWUAEvLoaiw_6oNC7TQW2pUuR2AeNI9AaGWNcUGDiSQ,7446
734
+ sglang/srt/layers/quantization/quark/quark.py,sha256=Xt8e8Ds7wKV2UyQ3rJq9cFUtSNmTSAnRLnC2OgTBLds,14687
735
+ sglang/srt/layers/quantization/quark/quark_moe.py,sha256=-XW9mKSisXmqs7Ep9exPAFlGgCfZ0-N3P35B9HZdamA,7371
701
736
  sglang/srt/layers/quantization/quark/utils.py,sha256=zZHRe9mjxGp16_OJ5Qy_UtnQgipl3ZRZUmruYvyEm_w,7445
702
737
  sglang/srt/layers/quantization/quark/schemes/__init__.py,sha256=z1LHBPqkxAS6Wp70DWwESOSixWpIhIQwz1IHcWDdURQ,167
703
738
  sglang/srt/layers/quantization/quark/schemes/quark_scheme.py,sha256=b8-Djo-UQAwgxSWViKDoEP5dOSesnEBPyozX-osB3WY,1478
704
- sglang/srt/layers/quantization/quark/schemes/quark_w4a4_mxfp4.py,sha256=sW57dU7HoxQGVbzUhyhRirGWA8oVpENB4NTzO7URGgU,4198
739
+ sglang/srt/layers/quantization/quark/schemes/quark_w4a4_mxfp4.py,sha256=aASlSjoLgmEmiSAULaehpNOCSGy1OYiAFazWLmJB970,3935
740
+ sglang/srt/lora/eviction_policy.py,sha256=IaG1tlchPeT2iYwuaMGdHuma91wraO1K9qRIFoV4yko,5378
705
741
  sglang/srt/lora/layers.py,sha256=0XlVcBTT1InMsBoLfiOO7yOnlDrnpXD_08wKo84T4B4,11852
706
742
  sglang/srt/lora/lora.py,sha256=FooB4hOW5uvZJrDrdqKwBExb-lX5Uw_Y1gjU9an8hzc,7669
707
743
  sglang/srt/lora/lora_config.py,sha256=qDgMTx_69jyJUl29O5FxLzYa0BMhqYVXWXfyyVOvGm0,1684
708
- sglang/srt/lora/lora_manager.py,sha256=F5kO3A6NFNFfu0hFZcn4Yr6Hum6si_kH6eE3Aw_Wxjk,19247
709
- sglang/srt/lora/lora_registry.py,sha256=osbau-sQZ7BuCeGGpBMFy4w40GO5FGqRgRwDyxxgNmg,8167
710
- sglang/srt/lora/mem_pool.py,sha256=qh-AA7HhJDKG_xF5-67WGhrV6ohMM4TQU5oY40LVulc,11485
744
+ sglang/srt/lora/lora_manager.py,sha256=WkSFWbyWtR2jkG7Erled9PBLTMqkB3keVjaN31Cluq8,19950
745
+ sglang/srt/lora/lora_registry.py,sha256=Ox1n6ZmGAWGThpDVd8WjQbJACejnA8n2lGNCVzKReaQ,8173
746
+ sglang/srt/lora/mem_pool.py,sha256=WQex5E9lQ2Arzkc9X52EHx3OLWzMwQfoepv3OdL7Fv0,12412
711
747
  sglang/srt/lora/utils.py,sha256=FeIb51m5EIcetP1Pgn8X17EfuE5tGipm5iurRg3RAZw,4424
712
748
  sglang/srt/lora/backend/base_backend.py,sha256=kfkr-OxdPyUwMzi0HgjTNfX9bZC4z_ljt3srzRPgMfI,6139
713
749
  sglang/srt/lora/backend/chunked_backend.py,sha256=x2VNkjLHmrOXwI67v_2LgjpCH8R5wuSmY5jdTWV4K7g,12701
714
- sglang/srt/lora/backend/triton_backend.py,sha256=bKH8DPo6fg7JVZt73iFV5BHc8amEJkr4FopbCnJer94,6072
750
+ sglang/srt/lora/backend/triton_backend.py,sha256=XrOaZLlwldwvGjE1h0OOVKIwYIS98Ph0aWQetub3udo,6026
715
751
  sglang/srt/lora/triton_ops/__init__.py,sha256=no7N7uWnmCvHHbNZ6PZEadXDujIjHGP2jp_3N9j6vHM,495
716
- sglang/srt/lora/triton_ops/chunked_sgmv_expand.py,sha256=sW7vsjOvyoI_00KJLZ5g0JwjTY7-AGzPTpKo3tuYC6U,6812
717
- sglang/srt/lora/triton_ops/chunked_sgmv_shrink.py,sha256=sF9PzxK7XN3-MVqiz-S0DyVU2u1ADDhgnvpBe3GTaGI,5411
752
+ sglang/srt/lora/triton_ops/chunked_sgmv_expand.py,sha256=rllqrhX3NQTmFNXnfxm0v7sY06-hggZkNWIjU9TRBc4,6844
753
+ sglang/srt/lora/triton_ops/chunked_sgmv_shrink.py,sha256=n5ANXoEciOFgXuQkRZzZcW1WmdV2qtFDH7Yx83GYHUA,5462
718
754
  sglang/srt/lora/triton_ops/gate_up_lora_b.py,sha256=QURCYxHNR8Ls4SQtt3dvdgjvdDVhywI9tOzsK8SV9m8,5779
719
755
  sglang/srt/lora/triton_ops/qkv_lora_b.py,sha256=z9BB84Xu_MjwCu5v9Yvji-FkIzfEjDySAFybc4WYv7A,6483
720
756
  sglang/srt/lora/triton_ops/sgemm_lora_a.py,sha256=Ksova04wgeGsFqGOXWqJtMYaHgyUYcx8VU42BZQOkVA,5129
721
757
  sglang/srt/lora/triton_ops/sgemm_lora_b.py,sha256=VqCAFvUtq_l-0RGIkx3W_fzD55QcW2FAcqpvSHOBFp4,5115
722
758
  sglang/srt/managers/async_dynamic_batch_tokenizer.py,sha256=btIWhI15a3QCLabdZZhrJVEWZ3zZTgldbv7pGjAPZqo,7236
723
- sglang/srt/managers/cache_controller.py,sha256=G-2292PKRRUQR6Co3sFt0oGs7zk6bqJ6RldEH0JQMGA,29300
759
+ sglang/srt/managers/cache_controller.py,sha256=Wy0ygZ5FAiXLrz1xzczeinfJATk7aPkH6yvXqOzH5_A,30478
724
760
  sglang/srt/managers/configure_logging.py,sha256=8sNXZ2z9pBWOwn-X3wyz013Ob8Nbm1zDxRkxoZjH-l4,1633
725
- sglang/srt/managers/data_parallel_controller.py,sha256=YalvihRIJwph7OdSHf24rBsWYvmLQzUnJiDL261fyMM,14880
726
- sglang/srt/managers/detokenizer_manager.py,sha256=QhJDFju95xTw7epUXvBH0t2DfwU-sR13v4i4ZAcFyQo,11815
761
+ sglang/srt/managers/data_parallel_controller.py,sha256=TAJErsNQUomHFnekrPceMZbN95PfFadticjSup3JiLY,19236
762
+ sglang/srt/managers/detokenizer_manager.py,sha256=K6TLeBtDb8geRVKvTlFqZJN-26saYJxxLlRspvEOFe8,13080
727
763
  sglang/srt/managers/disagg_service.py,sha256=7VyRva5oniAPs8G-DYg2fv-mdjSxk9cLZPzl_TmB_2Q,1588
728
- sglang/srt/managers/io_struct.py,sha256=ZkxZpLbdEJTl92GtmaGfG0TDuuNpcC6YrvOXG6X75hI,48748
729
- sglang/srt/managers/mm_utils.py,sha256=b6n39SlbaFP2XdUvJYOfRQL1Gch8fP--VxpOGsRJ8tc,30917
730
- sglang/srt/managers/multi_tokenizer_mixin.py,sha256=audn1iSNNVu3d0DamslN1e-KGvhRJ5d_pw68nucQOUU,21676
764
+ sglang/srt/managers/io_struct.py,sha256=2RMpLqiZbI27kR1p9yJKZT1u1sA0NZWukfU4U0WM6gU,50932
765
+ sglang/srt/managers/mm_utils.py,sha256=xJ7Pbk1ZxIyodLyeNv_t0JeSKCqrP7u5hpMcC-0Rpzc,31283
766
+ sglang/srt/managers/multi_tokenizer_mixin.py,sha256=dELw8-Ka4-gY6ek5CSVW0DLK8Kq6jJDO6qMTNm5bOxk,21545
731
767
  sglang/srt/managers/multimodal_processor.py,sha256=0mLkwu6CGRQtt3G2T1tS3PSsh6dpyivV-vAfIHfcMbQ,1764
732
- sglang/srt/managers/overlap_utils.py,sha256=QHeF3rQPI_kgMngPfDpAO8m80ZKSXOxB2G6r4Znyi2U,1809
733
- sglang/srt/managers/schedule_batch.py,sha256=qQVFsvoJev5vgoOkFS4Zo_3tjv-5Vg0zxdxQlFYWS1Y,81929
734
- sglang/srt/managers/schedule_policy.py,sha256=tdb81t-_zILXSGe5E3zNqg7N0_pbLWa8lfV1V7lAGnY,28192
735
- sglang/srt/managers/scheduler.py,sha256=9hjS_FeM7Qfy1EYqvCmdrkuANFGFhNXvIXibDmGlZHE,119572
768
+ sglang/srt/managers/overlap_utils.py,sha256=dDz1zUBlJ9Ohw4TPHgOxnuh6LPCsN037c14XIw3E-J8,5050
769
+ sglang/srt/managers/schedule_batch.py,sha256=0oWPNVtdgoX2bFHOc1RN_1IYyoIE1yKwCImll65dAbQ,72622
770
+ sglang/srt/managers/schedule_policy.py,sha256=BFWoHG3m-lkeVvOkLGoMeEbRplq4vF4thsjv-P8MG84,28818
771
+ sglang/srt/managers/scheduler.py,sha256=aJnk_T9_ZNHCMhRs0cJqfkTH7EbW_B7OhXK2WV20UFE,115088
736
772
  sglang/srt/managers/scheduler_input_blocker.py,sha256=SYZ91JNTHtqiBHUpkk_MboAiBFyl5U7ardLcYDAQ0OU,3689
737
- sglang/srt/managers/scheduler_metrics_mixin.py,sha256=tvDovTLhtf8svgqVXIyoAc1xuf4PrH0AuCb0SPMYrGg,13197
738
- sglang/srt/managers/scheduler_output_processor_mixin.py,sha256=-ObOi1TK7WBwbGOzB5usSKmnGYjAqMPsYXMP81hPC44,33753
739
- sglang/srt/managers/scheduler_profiler_mixin.py,sha256=62dv-rLS3acUncFNJd6S0P4jglJ5XY3CFIauB08xuJ4,11405
773
+ sglang/srt/managers/scheduler_metrics_mixin.py,sha256=OJKCTqNX5gxragq_774EeTSrNEPYp3N7udhE51pukFg,15337
774
+ sglang/srt/managers/scheduler_output_processor_mixin.py,sha256=n6zvLqu-TpTaZuWfYxz7ivCBPP3Z7okTOOshTq0d4CQ,42449
775
+ sglang/srt/managers/scheduler_pp_mixin.py,sha256=oUl5oxbFPd2gxqn4JXk-Bn-uLrmJZ6_Km5SMpSe9Gtk,16433
776
+ sglang/srt/managers/scheduler_profiler_mixin.py,sha256=4yhFzHO8ir4TbnYluDFYvCl8RgH0L-AihdIYuMLtBcw,13453
740
777
  sglang/srt/managers/scheduler_recv_skipper.py,sha256=8rVQCBjn9f26Th4XbeUS3fEsvo1GI029Me28wMjcKRY,1103
741
- sglang/srt/managers/scheduler_update_weights_mixin.py,sha256=K9gCx16TaoeRah4fSYpIw_sOzRKuNUw2AJa6__dt5Bk,6194
778
+ sglang/srt/managers/scheduler_runtime_checker_mixin.py,sha256=54z5p36M2BgTQYrEz30aAtQVXWCBI9VHBjgzOf19QPo,8521
779
+ sglang/srt/managers/scheduler_update_weights_mixin.py,sha256=AuOKrV943inXe5s4cPb4_BQiNAFwkiQGlpaBS-aal-M,6957
742
780
  sglang/srt/managers/session_controller.py,sha256=FGADRGSkRmS76o_BQ2fivpgw0Q5Q-K0Ws3aezH41YSc,6041
743
781
  sglang/srt/managers/template_manager.py,sha256=M4EshVv1OhKxUAGQPP4OntRkSkUVvG93457xsYfWnQk,11968
744
- sglang/srt/managers/tokenizer_communicator_mixin.py,sha256=NshY8ibxS7EQQGSYEp1PAAli0UL0-J_XZFtpQr9BIS8,25048
745
- sglang/srt/managers/tokenizer_manager.py,sha256=YVCCbNP9g_56neSBcLnQCN1vtcmAp3apd7XLUq-NCig,77943
746
- sglang/srt/managers/tp_worker.py,sha256=Qprdf6QhbddbKiKtO6Huu6J9a6jpWB_BH5qXADHvkas,14145
747
- sglang/srt/managers/tp_worker_overlap_thread.py,sha256=9EoJ5ZbolfC8atvs6i6AFz9L9xHGj6OseaSLPezkVX8,11858
748
- sglang/srt/managers/utils.py,sha256=fE_RZl5q0sZl9EQZNLlX9VNOHINxh-TJLQoH26GW2Lo,4279
749
- sglang/srt/mem_cache/allocator.py,sha256=O-te5k_xLVB7o_GhBWCvperdm0_hJAlsxmw1QD3d9o4,18038
750
- sglang/srt/mem_cache/allocator_ascend.py,sha256=aGsh_VMI0eYoAy3uKCYbpAMFxyXVTyu4JmdeGDWLLbw,4997
751
- sglang/srt/mem_cache/base_prefix_cache.py,sha256=Bv84HD6e_yYdtmIQemK1m1OUViO0PnuAvOS9tDpQOJM,2795
752
- sglang/srt/mem_cache/chunk_cache.py,sha256=5_yPQMGDP6TGLSxrEhOrBcrpd_7Z15Qewh6DOC6WyA8,3487
753
- sglang/srt/mem_cache/evict_policy.py,sha256=yX8hFNQ_pdzuN4rMjYcByhQZLs-lRZdD0qDLkPe2ht0,627
782
+ sglang/srt/managers/tokenizer_communicator_mixin.py,sha256=CHry04ONVx3YMGNN5KtNJFaafxnw4LfXHceMR1q2Nwc,26088
783
+ sglang/srt/managers/tokenizer_manager.py,sha256=UM54r6Ox-dfTOesahpm6QmyXtvUTDCJyTRK4n903MFo,90468
784
+ sglang/srt/managers/tp_worker.py,sha256=qENe8zAagoTs50RJmCJi2il9JsQtuQqBHII6XBBPLJg,16212
785
+ sglang/srt/managers/utils.py,sha256=HRPecRiWLHTX6QbkyYRY-tjlpJEb9N1k0fSJsqBxJl8,7324
786
+ sglang/srt/mem_cache/allocator.py,sha256=TEAkK32vyYz7wow5bpZLlrzb3KHVXtw9h1KtGWg6kIo,18246
787
+ sglang/srt/mem_cache/allocator_ascend.py,sha256=GVI1HbNQRy_rIlUHEn-6oRe2WS_OBXfqmoco2Hxta_w,5017
788
+ sglang/srt/mem_cache/base_prefix_cache.py,sha256=Z6c9YKJjInVxvZAZpIh8KRAPlOyE0-aowncm4JMXE70,2813
789
+ sglang/srt/mem_cache/chunk_cache.py,sha256=u4EIGuWNonVoCItF2wrKnXzh2OtoDM04XhoffEK6ykE,3923
790
+ sglang/srt/mem_cache/common.py,sha256=PEFKzoawIIPRVboyInPKWG56qht-inp34vcj6q_fsfg,16283
791
+ sglang/srt/mem_cache/evict_policy.py,sha256=FVI4QsFJoRR1CaxE9jpX4OzBPt4w9ftfM2Ndu4BSfhA,1012
754
792
  sglang/srt/mem_cache/flush_cache.py,sha256=GYcxmNXh4hsMpFfNOuCTpKilW7guZwTtAg_usVeM3J0,979
755
- sglang/srt/mem_cache/hicache_storage.py,sha256=5L57L_vzqYyNk5PRdKikxyaaMj1LkCkWD38Sd93IAe8,7958
756
- sglang/srt/mem_cache/hiradix_cache.py,sha256=hSsz8k1foizh-wJUxDi9h0NQZNNmSQoH_YP4A4uLtms,35414
757
- sglang/srt/mem_cache/memory_pool.py,sha256=FiJzy8V39Jt7mIkyMiaq8OEhhnwP_GggOUm8nLiY3Ws,57038
758
- sglang/srt/mem_cache/memory_pool_host.py,sha256=T3lgq0dyjyvOGdx4nGSGZzm6fqkX9H0S0JzYaNGJJ7k,27659
759
- sglang/srt/mem_cache/multimodal_cache.py,sha256=zPnQLQhBZ6zsUpCQPSoNkrB9EEvpoDQS4mU7c3sRWjE,2171
760
- sglang/srt/mem_cache/radix_cache.py,sha256=1K1MvZZOLZVrbDti3pRrI1-pHJMlxxB3Scz9d9XNMo4,26390
761
- sglang/srt/mem_cache/radix_cache_cpp.py,sha256=0twLAAR2EYWyfRiUVsb__s01ITraNEF9bXBPZFvul1U,9454
762
- sglang/srt/mem_cache/swa_radix_cache.py,sha256=Kf5HAfnwJl1mr86pT7Y03o4RBKtUXfI6udbii9xAirs,40138
793
+ sglang/srt/mem_cache/hicache_storage.py,sha256=lvRaZesRhHQopBoNBbWlXxs4IbRwcWnpEP51MjowtWs,8366
794
+ sglang/srt/mem_cache/hiradix_cache.py,sha256=BK52hyQjPoXKzn_PDn_LRk_3a0AjWBie1Xk4yAO1B3s,35984
795
+ sglang/srt/mem_cache/mamba_radix_cache.py,sha256=mpKTxCzA1_u4eoHk0SvXPPNVVG_JivEAb44miY3aNuw,38678
796
+ sglang/srt/mem_cache/memory_pool.py,sha256=v0zHcqaOp1cUX2jNaNJOR5lnk0sdj7S4aViPjewpXJs,67163
797
+ sglang/srt/mem_cache/memory_pool_host.py,sha256=IBUKHCmU_Fu8d22_V5ssYp4Ff97w3EaMSpyFZvPD0Go,27634
798
+ sglang/srt/mem_cache/multimodal_cache.py,sha256=23d34nWEDtgiOM6fqAhmkQ8-OHnrNR1-n8Ert0K0n3U,2147
799
+ sglang/srt/mem_cache/radix_cache.py,sha256=7NQHMUKjdKaAGMFdx1z0pCPBPvwux9KcqymFRxFUAY4,28181
800
+ sglang/srt/mem_cache/radix_cache_cpp.py,sha256=PIJenIaR_ouY-pAmyYuI84KY0tDaLg6VAPvKBaNttPM,9663
801
+ sglang/srt/mem_cache/swa_radix_cache.py,sha256=xYK1K6tgyUErhWvfTDfm_TWDRiAWbRNWM1Wd4LSzv4Q,43420
763
802
  sglang/srt/mem_cache/cpp_radix_tree/radix_tree.py,sha256=tQZpz-H6HxNAQe9mYqt6aX8mfDZyu_fbJTcCNK-Ns1M,7179
764
803
  sglang/srt/mem_cache/storage/__init__.py,sha256=HDzHFUVeOHlry7HlfL5tRd5HUA02N94p8uzA_Va8nlM,251
765
- sglang/srt/mem_cache/storage/backend_factory.py,sha256=rN8OfnkROk1rFQpJeCkiXMucuI--Ez35h4physV6Ys4,7822
766
- sglang/srt/mem_cache/storage/aibrix_kvcache/aibrix_kvcache_storage.py,sha256=kYqfXHdWwmL8WPZ9Z5RtwPzKgb0Vq-QOTE-6YXndd5U,5463
767
- sglang/srt/mem_cache/storage/aibrix_kvcache/unit_test.py,sha256=X7-GU8X5-t9adyVuD09obHQUo8d_Rfu--7R0C631p_g,3718
768
- sglang/srt/mem_cache/storage/eic/eic_storage.py,sha256=V2isvEuzCsEZd1XzYFlwIyLbOm0P6rs4QXVqCDjRcPs,28628
804
+ sglang/srt/mem_cache/storage/backend_factory.py,sha256=ItY0f0YY7fto-oW_yuRxE7lxsv0e6Y3qnWCjgtr2BWE,7859
805
+ sglang/srt/mem_cache/storage/aibrix_kvcache/aibrix_kvcache_storage.py,sha256=0n8jH9Rrcv73X-qcQnaM4ozkb35UMWdxkmeBGfl-O1A,5573
806
+ sglang/srt/mem_cache/storage/aibrix_kvcache/unit_test.py,sha256=asSKZdmlPYxrEzQOqsscfx7fpzV8ueqYwO0npE20otk,3420
807
+ sglang/srt/mem_cache/storage/eic/eic_storage.py,sha256=UVPr5gMfm8TxaxRY2eYf9CsB8JM9VKVO6pI6MrpCvH8,28534
769
808
  sglang/srt/mem_cache/storage/eic/test_unit.py,sha256=PfNPpL624t23tyVgtmS5F1pGiuWDMrC39ZD6ZbkN828,3607
770
- sglang/srt/mem_cache/storage/hf3fs/hf3fs_client.py,sha256=le_iTE5HZAbQNToa5E_dq_3U5ztu60ej-58tmzRtndM,5245
809
+ sglang/srt/mem_cache/storage/hf3fs/hf3fs_client.py,sha256=3xG0dV5JmnbIJ8kB1_lk8jAeqshOcU7tXES27ldyb8I,5228
771
810
  sglang/srt/mem_cache/storage/hf3fs/hf3fs_usrbio_client.py,sha256=6oH4v_WF_pKH4FMSr252v6QPhBCnRHztHqzuS8j6_QI,5323
772
811
  sglang/srt/mem_cache/storage/hf3fs/hf3fs_utils.cpp,sha256=dDYPtxmL6OFhEyv_GuTgzkTDpBjcD0EK8kphnn7eaGc,1133
773
- sglang/srt/mem_cache/storage/hf3fs/mini_3fs_metadata_server.py,sha256=lJ9Jp2kOgQQaUihxlO9l-W8fYfOMa1h1y0WAtzzFGLM,17850
774
- sglang/srt/mem_cache/storage/hf3fs/storage_hf3fs.py,sha256=IeEc09wmBI5iRnN3rUSyfBxlFeHc92hHcA96dGRgCgM,21351
812
+ sglang/srt/mem_cache/storage/hf3fs/mini_3fs_metadata_server.py,sha256=IKIm5uQ9XyWx19YflkYZvBSjbVpYbMpeg3Mg7wYMwNM,17880
813
+ sglang/srt/mem_cache/storage/hf3fs/storage_hf3fs.py,sha256=MI-x2979lvJL8d4aJluTCx6DofIe0tkLTNbrAJbV0FI,21514
775
814
  sglang/srt/mem_cache/storage/hf3fs/test_hf3fs_utils.py,sha256=g2h0Woa2CK39pRTigHCVR_hq095dTaC70lCIAIs9THM,1089
776
- sglang/srt/mem_cache/storage/lmcache/lmc_radix_cache.py,sha256=AdujdsJ_3ODf11O0LpA59X6yWWJLPQELelxE4hKU5-U,9925
815
+ sglang/srt/mem_cache/storage/lmcache/lmc_radix_cache.py,sha256=pd5NC37FORcF-yHmOjbARZGGPcpc-Xd3iu3KGjgYnc4,10009
777
816
  sglang/srt/mem_cache/storage/lmcache/unit_test.py,sha256=DCSZDMJAe-HehL9hWzsP759pck36Q-8ijxWZKfgXmA8,3590
778
- sglang/srt/mem_cache/storage/mooncake_store/mooncake_store.py,sha256=OWHraCjil547NYf6SjTrB6dteznqJL8kPoCFA1DCgwc,16885
817
+ sglang/srt/mem_cache/storage/mooncake_store/mooncake_store.py,sha256=j4KVka-45-RaTnBoGLS8BQnGTxnTLPDOaT-jrFriPKg,20216
779
818
  sglang/srt/mem_cache/storage/mooncake_store/test_mooncake_store.py,sha256=6TiqbzEIL71DC7wL1B-Q-SMMZRYsz08sg-dZYeMzmAc,4930
780
- sglang/srt/mem_cache/storage/nixl/hicache_nixl.py,sha256=bau9Jsp50lpEiy_osgb-dYzeoUkPWM03x7Q8z2BpKaU,9920
781
- sglang/srt/mem_cache/storage/nixl/nixl_utils.py,sha256=KXkwMrbWwIOUOASINnUo4HyheiMd-93smmwGLv0CacU,7463
782
- sglang/srt/mem_cache/storage/nixl/test_hicache_nixl_storage.py,sha256=vENVvGAd3PqcQEFA812wPoSBYhRemLr8Sfh1LQa0INU,9609
783
- sglang/srt/metrics/collector.py,sha256=s1BpU0cLgG1nHWYH5Y0PT0NbqRVHIs_IWql-UxOEEYY,34078
784
- sglang/srt/metrics/func_timer.py,sha256=6-PYCeItVhsET6lc0BcFQfd0Tc3_wvJ8VHdp3mlWz7Y,3306
819
+ sglang/srt/mem_cache/storage/nixl/hicache_nixl.py,sha256=kfGOqJPtq_kiLO2m_bDMFGID9iO79D8iBWadPIgsanY,10911
820
+ sglang/srt/mem_cache/storage/nixl/nixl_utils.py,sha256=3ouXVNJ17nilYF5gKDqphWux2sHqdqD5ztusCv4aP9w,7457
821
+ sglang/srt/mem_cache/storage/nixl/test_hicache_nixl_storage.py,sha256=Jj3o2zkPZBBUYzbQeHWV1ujjlC70GYHXmQL_SPStp7Q,10031
822
+ sglang/srt/metrics/collector.py,sha256=Qvwsn5POBDbxsaNRfjwssLszdACtxNeIojq0zfy8O4Q,35327
823
+ sglang/srt/metrics/func_timer.py,sha256=Om9o4svdyPfUpgcwMt6tL560qmbPBQvkDPhPzTwCmvE,3300
785
824
  sglang/srt/metrics/startup_func_log_and_timer.py,sha256=PRVg3Z2d5GBMFifZXR-VhzGcn9nmKTkqEU41VJKZmaI,4937
786
825
  sglang/srt/metrics/utils.py,sha256=MGb3quRI39n4tgJS1e0UHI5TBX3D0MwsgiZFMW2EsSQ,1903
787
826
  sglang/srt/model_executor/cpu_graph_runner.py,sha256=ypp5yIW2OhRX-Xmido5mWuzEFpd-ohlq2c2wEuSW71I,23415
788
- sglang/srt/model_executor/cuda_graph_runner.py,sha256=GcD2FkWG6CJRO3A23HY3Cu24ZE2c2MSpCD1NbtoLLgY,34348
789
- sglang/srt/model_executor/forward_batch_info.py,sha256=834WSjXwpIeHGTgldRaBJ0R-YIjr8bops4YMzTHi9t4,42236
790
- sglang/srt/model_executor/model_runner.py,sha256=sTRCfbndxVaUXFOaBUy9u6VPOoFFZHvm0_RBKuBF2Y8,89531
791
- sglang/srt/model_executor/npu_graph_runner.py,sha256=HstTsIQF2QHCPMQH_AxKOu1Ulykw8q8Cpx7Q-u9Kq8I,3673
792
- sglang/srt/model_loader/__init__.py,sha256=_1Y5sUZGxEEG_bmvLbSgYGa__qO60_d0blGB8sIdOgo,1020
793
- sglang/srt/model_loader/loader.py,sha256=MhrqysDMxBTAuwoLbYyCfLJOluk_KSZWPhgiD-rP2Cw,64789
827
+ sglang/srt/model_executor/cuda_graph_runner.py,sha256=hz7y3q5J7e8lnDhDPxiJIGvtGG7Ws0Og8ztbaZ_mqXw,35580
828
+ sglang/srt/model_executor/forward_batch_info.py,sha256=wLkiWTAMgq-4xQFvimvRnQK9eDQKS0UurtooqueBbx4,44306
829
+ sglang/srt/model_executor/model_runner.py,sha256=82SAlFp14XbUocqGxcEkH4ToGL10Rh0Oz1YQtJ9R0rc,93938
830
+ sglang/srt/model_executor/npu_graph_runner.py,sha256=B1YQla4jW9PiciBBisKg-qoC-vmnldRr8ut_aSmUB-E,3664
831
+ sglang/srt/model_executor/piecewise_cuda_graph_runner.py,sha256=yYOuLLI8hscmpnlxEKrrIpGnirMIncoy0dHBWi7XcB8,22684
832
+ sglang/srt/model_loader/__init__.py,sha256=Y4gehllriF0JNjly4rGhQPSkUrA9u9Lr-WbfZfBIs6k,1034
833
+ sglang/srt/model_loader/loader.py,sha256=73Pd71im3E56u9SCZmrMgeq5ZJxadeb-ENIIQW4LW9I,80809
794
834
  sglang/srt/model_loader/remote_instance_weight_loader_utils.py,sha256=_HnQD1Ab-Wv9oATOmwJe6aQaQD_Gs_yG9EsDCGJQWfs,2881
795
- sglang/srt/model_loader/utils.py,sha256=KrOpyd_eefZC3zFnhnwxIKNTx9G-MmA6jIK3NQbTW0E,5002
796
- sglang/srt/model_loader/weight_utils.py,sha256=QbeiJY8VXIM1iLdG8X_JAjuy37mZzAUQzhBY_HHsxMw,44383
797
- sglang/srt/models/apertus.py,sha256=UL2Rd1TDDXPb2N4rWyymI3JThG7KlrGIyBuDIFCitPE,26002
798
- sglang/srt/models/arcee.py,sha256=Q6fujRESEnljzs8ls3XGsPtWxzfKfUa0QAvAekYzeBY,18981
835
+ sglang/srt/model_loader/utils.py,sha256=cfMXqVGRppD7CglcFqdMzwhCeB__FHWovYN0IBqkMuw,5001
836
+ sglang/srt/model_loader/weight_utils.py,sha256=O8cdxYdEjMyXgZT0Jz0PdagQGnIgPwnSvAWsyovOHsA,45019
837
+ sglang/srt/models/apertus.py,sha256=Wuz4H8EQUMlqlcCTM3Fe7E0lE0eodb-cX9us1avQxwI,25937
838
+ sglang/srt/models/arcee.py,sha256=O5yGtgAeIdcmYwZNLURWVE6Hu1O0k34gNiUEtux8ozU,18966
799
839
  sglang/srt/models/baichuan.py,sha256=HbvlErnkCSK4pRQYCSDxMcrn-1DQyfiNoeDcnRrJas8,15807
800
- sglang/srt/models/bailing_moe.py,sha256=IbG4BCgll0f5LUPkKZttizPU2wbtV5E9-dciUmjZ-EM,37726
801
- sglang/srt/models/bailing_moe_nextn.py,sha256=ntuaXP8PXc_X_oqmd4fp_FzpRmnajKoWQynXwjsEN5M,6000
802
- sglang/srt/models/bert.py,sha256=ODJe8YfNRP-hHsomFWk4_QpcuiSsNfjzGf256EDS0Pc,15802
840
+ sglang/srt/models/bailing_moe.py,sha256=Av6psy73-ZzsHnYLI4OTFshDVvjWtitGn_KQ_CY0fjQ,36313
841
+ sglang/srt/models/bailing_moe_nextn.py,sha256=rzHElrOiXJTV90khQUdx74u4RTXXu07_JUIY_zTRbaw,5930
842
+ sglang/srt/models/bert.py,sha256=2aUAVMT-43VGIbrI8keRBZZdCMOi5PzssykHO00zT94,15791
803
843
  sglang/srt/models/chatglm.py,sha256=cajLN9caBl09e0TwOFkiTTKDqwlbmHo_yS-NCjdeQW8,13957
804
844
  sglang/srt/models/clip.py,sha256=kOPSXnmgH_QKu2-ENn49HLDS9yf7Gm1HCOE_YvoNhlA,19858
805
845
  sglang/srt/models/commandr.py,sha256=5Y_b3K0QY7D37nFGkyiGgY38RleRui_GJUYcHSuHUZo,15315
806
846
  sglang/srt/models/dbrx.py,sha256=117gwrB_o8VlACwDH5YlXkPfuS7t2Mh-nyJvpNpIYxs,15903
807
847
  sglang/srt/models/deepseek.py,sha256=M7nyHcAbTIs8vc1g6u00oy22-pp704Xp4T3clBzu4xM,17460
808
848
  sglang/srt/models/deepseek_janus_pro.py,sha256=td8xGs6ARfJ8AQCYwUhMOZoWigrAs7m3trF5-kXCqik,70418
809
- sglang/srt/models/deepseek_nextn.py,sha256=QRcl5mWGDbYblV1dmo8MxPVeEUQQ_UhXumB5FEgj4M4,6255
810
- sglang/srt/models/deepseek_v2.py,sha256=K6QdBihJEF64gurObwIVfJJ2icJroO538D2LQvSmoBw,132581
849
+ sglang/srt/models/deepseek_nextn.py,sha256=B-Xk9mh7op-Gx42yJKV353yzWzL68iwwR08r6jbNZ6A,6710
850
+ sglang/srt/models/deepseek_ocr.py,sha256=WAPLXeg3S1UB3x3iP-tiandHk5AEnCUMeMs0ak302Gg,52416
851
+ sglang/srt/models/deepseek_v2.py,sha256=XZ2oYlX5GQ3dsRKlfr4g6RQMnXMf02S9ihszbn8ph9M,143886
811
852
  sglang/srt/models/deepseek_vl2.py,sha256=7X3gI4DE7guUtNJvMLf06jO8MUHKa2Aan8evZg5hsXc,13061
812
- sglang/srt/models/dots_ocr.py,sha256=Dr9O-VBY1aSOFoIzEKcqs_QKRipjs8OQTfKrO5fJd-I,6792
813
- sglang/srt/models/dots_vlm.py,sha256=0tbeQHbJryUMVqEnWelawDabzhcdwSj3Bb9-nj4YOKs,7242
814
- sglang/srt/models/dots_vlm_vit.py,sha256=K6QzcHx38XAq9fmNRJ-iApScZ9FoV0lkn3JYkRsxplk,12044
853
+ sglang/srt/models/dots_ocr.py,sha256=sWkFsENjX5b_CecLCqXjepsr6iyyCbNTmjZbRfoB4ek,6683
854
+ sglang/srt/models/dots_vlm.py,sha256=3uLSXO7W8UPKU7a3ixkC_gwSVDGYecCHK0kZAoD6vNs,7192
855
+ sglang/srt/models/dots_vlm_vit.py,sha256=JhX2E0UmjhdelDvR46-_ns5GCYsfnEpeqyDb9NNKUh4,12058
815
856
  sglang/srt/models/ernie4.py,sha256=3z14KFdYLR8J-zsm9oO1uBUeLlWrlkHoFKEYvKKJLKM,16079
816
857
  sglang/srt/models/ernie4_eagle.py,sha256=E7f-ygCcY8pIoyTMKFyVC2uRcG59-_RaQTO4gd5_uWI,7223
817
858
  sglang/srt/models/exaone.py,sha256=TpO-rtCpEZ8Ua7hGFnS8l2oAYhY0Pij50grc9WQ2mvc,13576
818
- sglang/srt/models/falcon_h1.py,sha256=vtFgy-P6Jc6VoUibjpLNDi7633rcw61Fdyo8RDabiUE,20825
859
+ sglang/srt/models/falcon_h1.py,sha256=UQZ8454btjoZ1kbktaqtIjHY1xdvaUZ1ZRnZZ2APlg4,20759
819
860
  sglang/srt/models/gemma.py,sha256=2atKwFN5wCsJCmBRmURX9vaCcFjxlFirL7xsnG5KPlI,14180
820
861
  sglang/srt/models/gemma2.py,sha256=n2s3WLGVM3XDvOXwbi_h7tgeh5SDDv1VvifH680DmV0,16785
821
862
  sglang/srt/models/gemma2_reward.py,sha256=V8U3_ADUHWPdOwvEe1jhGW-oJmBgL8t1TY3-67Ksv2A,2618
822
863
  sglang/srt/models/gemma3_causal.py,sha256=o46BNbaiOeoOv2xVU6-lWZhrrjyGskdebve0_wviWfU,27338
823
- sglang/srt/models/gemma3_mm.py,sha256=r4r7OcYqKE-ZpDBuPZCF4TnLmG10MCwXupKRDR3E76w,17195
864
+ sglang/srt/models/gemma3_mm.py,sha256=9JpkNj_u-8Af9RJJQbUNGOxWmvW3TbXUceoI6omb8jc,18030
824
865
  sglang/srt/models/gemma3n_audio.py,sha256=isgKfjA5UieYawxU6medL2ssXlzYPqAbagDBnLcemC0,36405
825
866
  sglang/srt/models/gemma3n_causal.py,sha256=kBDlpSWAg6ZDmUPe08Q7sj5CbdVD_0h07zwJw8sKu7I,36335
826
- sglang/srt/models/gemma3n_mm.py,sha256=94QLW3FfAcqhz0E-gti8rTizTL9ci6CjMTxYOv2vHac,20371
867
+ sglang/srt/models/gemma3n_mm.py,sha256=Il5LHjZdbHEXueUVdBp5lpSJHt56W7fpfPHD0Y7RED4,20301
827
868
  sglang/srt/models/glm4.py,sha256=dijzVTTgg8zyJ3gga95MKY0WwqwnuAaf-VIV93OFAmc,11433
828
- sglang/srt/models/glm4_moe.py,sha256=_H_ldIZCuR22kQJ-5wZ3D-NW8rg7Mi8crSzWdBGO_RE,42037
829
- sglang/srt/models/glm4_moe_nextn.py,sha256=pE9G2xr_hLBu6PpvWlyTVZ1BP_Eax2bVqwFHLv2d7kY,5962
830
- sglang/srt/models/glm4v.py,sha256=gn2a4Sb_txTKOguYIzIgw_3DQX8IG1vhJMulh2gfvPs,23761
831
- sglang/srt/models/glm4v_moe.py,sha256=wXbO-C3Kx6CEKGbzcs7CfdgH5giLjgrDDjJ7Nq7_rpw,17396
869
+ sglang/srt/models/glm4_moe.py,sha256=x8Y5gD4GMr6wvx3tzllMQ9dz7cWcq18rII986f_Bke8,38217
870
+ sglang/srt/models/glm4_moe_nextn.py,sha256=H-z8CKc1v_9oR6PzKE7aX6L1PHG8hHNrgyVgFO1ZZWE,5601
871
+ sglang/srt/models/glm4v.py,sha256=LwiFQxYm2ksmaePeO57i5d4YGQjiQX52e-Dsjyh_P7I,23834
872
+ sglang/srt/models/glm4v_moe.py,sha256=px1wUjDCU7Ro8GnxpjkGh8yQS0Tr_IjYmV2C8iPqhfM,9594
832
873
  sglang/srt/models/gpt2.py,sha256=kclhxEs8oJk1KCyhmAqo7rZqecVGGHYkc-a1WZi3aIk,9841
833
874
  sglang/srt/models/gpt_bigcode.py,sha256=1D6bi8Zu760gCRZkvdLHFcg8kCkY35ARwQYaMDtYhl4,10307
834
- sglang/srt/models/gpt_oss.py,sha256=7cjyN1v2cxP9vZNrMqeDorX20U9_I4YcSpz_b4x0zj8,43720
875
+ sglang/srt/models/gpt_oss.py,sha256=K9g2c9xTE2eM74isijM-KSvGPHt6Cjgjl8L8EzBTLmM,43711
835
876
  sglang/srt/models/granite.py,sha256=8q92shxVPAp_cJDohJATffSGd7Z0Oi-vF5jpY6DlK4s,19840
836
877
  sglang/srt/models/granitemoe.py,sha256=j1rgZ62CbBioECjUblDCw_NneDQgY_QJODsI0fqXVO8,13779
837
- sglang/srt/models/grok.py,sha256=8KCR13LtdnhswJrIwgb0sdFW0OxCA8GQ0fbN8gb856E,40518
838
- sglang/srt/models/hunyuan.py,sha256=RSZErx-Swt65kmfvSXJQJJ6KhjucuNY4UUVLWC8hWaA,31102
878
+ sglang/srt/models/grok.py,sha256=qEuuoVg5aaVGPyjuYvx_rTRcAiUToDNv0IQ8XbCXOr4,40021
879
+ sglang/srt/models/hunyuan.py,sha256=i4RUEDDwvflGV6hciBjTS46G10ew0DJcmaUpONkxlF4,30950
839
880
  sglang/srt/models/idefics2.py,sha256=U3khd3hbdawJeRNXsxmaKHdssOCT5TPOZ1D-2_zHoQo,12079
840
881
  sglang/srt/models/internlm2.py,sha256=F_iNY1gUqzAjAuUatcE47gnrcoTh5_08PY2Rw9tKr9M,13150
841
882
  sglang/srt/models/internlm2_reward.py,sha256=ndfGmyqYZbVZ7C7rJ-v9oK3wa-EpoBGybS8MlyKZi2E,2522
842
- sglang/srt/models/interns1.py,sha256=E4SyJWocXZ5rAuAV8kj569OHo57r04W4hmq1CF6oiFs,12516
883
+ sglang/srt/models/interns1.py,sha256=VZAGsvjkjPhdUvvLuSy9qV40KXsBTy0KdiXg00EeOnE,12450
843
884
  sglang/srt/models/internvl.py,sha256=iQm2wDtkcyjPYoV9oY_jQ3_7WvhP315eP_vZEiQX3uw,27062
844
- sglang/srt/models/kimi_vl.py,sha256=XulRiufQzOSWZe8-bUl2OEdznvsVU9OBsEYipaX3YkM,12877
845
- sglang/srt/models/kimi_vl_moonvit.py,sha256=0X07KnCsp9m8ZxVpdMSDSMH_yDZXkToIjwDtoyGX0Mo,23894
846
- sglang/srt/models/llama.py,sha256=ZQc5XgkAtgr4etZ8tVp1B_hTk0pz_IehkVlCoaI5BXo,28263
885
+ sglang/srt/models/kimi_vl.py,sha256=Tm0-cZXzD3FNW6YEoAFGqCX7ExW4hni-RGFsK3GOCcg,12707
886
+ sglang/srt/models/kimi_vl_moonvit.py,sha256=qtS8ANHYJ_VPrnzg7oSN30nGAnxfn6LA7xQ8GPH9uQM,23939
887
+ sglang/srt/models/llama.py,sha256=Et_i6a1A3TL0pS6ccD8NIOiBpqTxjmSMl1KUQsAXotE,28248
847
888
  sglang/srt/models/llama4.py,sha256=i4-Vo5FVE9zf_6Y80dyft5VjPOQ-a-xWYfEV8s-ltKQ,19872
848
889
  sglang/srt/models/llama_classification.py,sha256=4QWTFaUZIFKYZvEzs8bx8VkOZNIwdYCLrnwrdAw4QK0,3108
849
890
  sglang/srt/models/llama_eagle.py,sha256=Ubh_jmtfiOnriwvHgQT0ZGID7JvYvdSi_QGHOIkEgPE,5028
850
- sglang/srt/models/llama_eagle3.py,sha256=lutyS4UaPg5QussPu08En3iO5e1lhsSm4dBXTm4R_XI,9201
891
+ sglang/srt/models/llama_eagle3.py,sha256=yezjnua5fBjTwJT2lKmybn0uAE7dKOJtazN2fWxqY_k,9182
851
892
  sglang/srt/models/llama_embedding.py,sha256=zq-_lNu35VBFc7eemiam0zdkGIE8fzrgk5OWYfirZnA,3254
852
893
  sglang/srt/models/llama_reward.py,sha256=LF2nqMV5XOrljGjAwJg43mBv3z6Q040I2EYlgZeCp8k,4681
853
894
  sglang/srt/models/llava.py,sha256=xzYip_BAwpzSIdZre43LZiyTpFISa0ZCLdO6LUSbaCg,37702
854
895
  sglang/srt/models/llavavid.py,sha256=-CSk0RJ2MQeb81sh-RISeVJFaI-XWY6nR6_I594MkME,12818
855
- sglang/srt/models/longcat_flash.py,sha256=g_WX1UQgvkAtGGkw0Zk5NmDU9ew35zWKXn50CptKsh4,41016
856
- sglang/srt/models/longcat_flash_nextn.py,sha256=MdXz-KDjvNexD1rT3tSjVCgAe1p0G24HKkO613fIG2k,29605
857
- sglang/srt/models/mimo.py,sha256=Mp-iFp4YHuiuq-H8enUF5K5QbMnVcvEa6mURH6vM3yM,6140
858
- sglang/srt/models/mimo_mtp.py,sha256=jSmqJAXu7G3OO7jW1oa2suI4H_Yl7u5ZT7w4lHFbHhg,7292
896
+ sglang/srt/models/longcat_flash.py,sha256=CjlGMrV5IYZ98DoCByiN61rVn2CFtVKEEH7oWNp0OwY,40507
897
+ sglang/srt/models/longcat_flash_nextn.py,sha256=tbM7UYNs8iP_N2SN3tgP1GA3S9oEEq9KDkVPV-DF4hY,29353
898
+ sglang/srt/models/mimo.py,sha256=TdiflXteo_HLH7Q1Yf6xDAOXRzNrOpLR4kjVXMueltM,5662
899
+ sglang/srt/models/mimo_mtp.py,sha256=HbdSi0ZXW30YfQYhubnU6JmUI0zceJLvRjI2ptmqbVw,7251
859
900
  sglang/srt/models/minicpm.py,sha256=CzBJyZtfMpp8jvlEl29DHI7HLVq-CxuqP1UHwxIbaUI,14567
860
901
  sglang/srt/models/minicpm3.py,sha256=Cflu4Tb2hxpjapRBZ5n4kX8a1nnFwffK-M8uHPRUra4,19276
861
- sglang/srt/models/minicpmo.py,sha256=st8I13Ere5RkRHHQQN1LgZh1ybUA3_buxaaE4XlV8ag,76123
902
+ sglang/srt/models/minicpmo.py,sha256=1bNtbJM5wbMjV4ax8gesVsYVbMz4ozaIHAvvi8_d0iE,76175
862
903
  sglang/srt/models/minicpmv.py,sha256=_CnCR2y3RaYxhONAKFpBIuPQBrqn9Od4o7QnJw8CLR4,35884
904
+ sglang/srt/models/minimax_m2.py,sha256=cmdTbRl1VIBDb27t4glkhVwSy-2c3SikIcWociu5aD4,33995
863
905
  sglang/srt/models/mistral.py,sha256=ni7PppA_5X4ivTnIps3yoEaMEL-G6Gaf9b5hGC1vU5Q,3475
864
- sglang/srt/models/mixtral.py,sha256=ohZVFJ75QWuE2kBKD7Sd4fcx9YbbjA7JxnYAsOIfORU,17166
906
+ sglang/srt/models/mixtral.py,sha256=bZdsTw4A3B-MIHSR8U26mBv3sLYkawVM4V1VXEyBrmE,16992
865
907
  sglang/srt/models/mixtral_quant.py,sha256=UUIq7lpUonD9IoGePyl59oJYEcVwT9wUXvtVp5tjQ9Y,15406
866
- sglang/srt/models/mllama.py,sha256=OdX7brhyfGiMFPulxF77QOUi-Kcscg3Qo4ipyxzs9yA,39670
867
- sglang/srt/models/mllama4.py,sha256=ux93c-eLcG9LuL91f0euYHcMtYUt64VYmWXOo4JRzHQ,36255
908
+ sglang/srt/models/mllama.py,sha256=mMhDrLd1jJ-4lwMMHKRC5Uzcs3kWdzRJJzdjhQN4LOw,39671
909
+ sglang/srt/models/mllama4.py,sha256=z6YKfmHu0lJ-oyALZNlL9-EcHzFvNgkxWU_mURyS7z4,36694
910
+ sglang/srt/models/nemotron_h.py,sha256=clbTirOxve6yefRaf2eE0dT0IqhPDfknOtnsAEsnZOM,17904
868
911
  sglang/srt/models/nemotron_nas.py,sha256=CoSAKqlbej4Xe30uY4w76iASBqeuJf8-imisDK00zEU,15964
912
+ sglang/srt/models/nvila.py,sha256=2IVELp0pFTnN8Yz1GVns03aoLsgb8_7X_x5gQd02Vqg,12077
913
+ sglang/srt/models/nvila_lite.py,sha256=Cl7wey1bXUyyaDjntCytS4Z-cRVljK4WJU_Z-exjD1s,6206
869
914
  sglang/srt/models/olmo.py,sha256=7-q_fA6XXdG7kPUjpUzYkzMUWJobuSjhqjYw9xSUs_c,12671
870
- sglang/srt/models/olmo2.py,sha256=azmljhJF4ivcQfUtfsAUxq3ducE4tRKTL6iwe0IKYMg,14327
915
+ sglang/srt/models/olmo2.py,sha256=zprucQEogxPV38E_IU0edcTYP-d-dqLVeTmt2kRLznA,15448
871
916
  sglang/srt/models/olmoe.py,sha256=zryYUQEhEdhd6xcR_HyLV7gHCcKt-HWHeEeIUqmhmcc,16100
872
- sglang/srt/models/opt.py,sha256=1fdsQU7yXSN9HEWb0ZVdiAF8wLzAunW4XomIrlHyu2o,23476
917
+ sglang/srt/models/opt.py,sha256=-nCg_g2I84JtJQ7Fhh2eyp1cko3TxxicheM7gGpX0A0,23415
873
918
  sglang/srt/models/persimmon.py,sha256=86Duo3HiZqDj9O2UzWbJgUEhQOXzGBUdhUofQhcs1VE,11244
874
- sglang/srt/models/phi.py,sha256=n6A1d47MvnR1lmSsZ3TuzXk5kT1Lntj_YQ5uNvR0s5o,10287
919
+ sglang/srt/models/phi.py,sha256=tnhdiD_zo7KeHMTI8UxDfJN5brpHSAaKPSN-2e2iGk0,10280
875
920
  sglang/srt/models/phi3_small.py,sha256=eJb8aS_3KLObrq3PNkoIyVHaQ6SZTAJe42rbpC54QKg,16012
876
- sglang/srt/models/phi4mm.py,sha256=TKOFM4k8o_JGwYM5mBb2hHbbOMLjbveu5izIHCbT7ug,20617
921
+ sglang/srt/models/phi4mm.py,sha256=Pe5IjZcu7N8w_UmEXO0Mb98-tihc50ih6y5cS7b6BIY,20597
877
922
  sglang/srt/models/phi4mm_audio.py,sha256=0ChekwoYudAnbY0-JyNwz_inzMlxM8FmULqR9mwkPhQ,48877
878
923
  sglang/srt/models/phi4mm_utils.py,sha256=bW3un4x3SHDvSkAOHQEFO286FGdOPeKhBpJCOmNlC9E,66956
879
- sglang/srt/models/phimoe.py,sha256=EGaKFi02MZP20qFrILA4o2SJ0wb1HoJagFTSqVUbJcQ,19223
880
- sglang/srt/models/pixtral.py,sha256=ZkZrV0mEfmbBdgRko2AvsMFZbAVskgp_5a5p1xCSRN0,16835
881
- sglang/srt/models/qwen.py,sha256=j0OU3JjznWi_TbayI09yYGM-Obov6mQzJO82Hs0qBGw,11868
882
- sglang/srt/models/qwen2.py,sha256=kHNZCtT0jnQXC2aJN7Bp1DzaEzKWuhUAGL3hAmt8OU8,23598
883
- sglang/srt/models/qwen2_5_vl.py,sha256=rMmmoc1ba3GjIE5bfcaEBSh62hNuBZT0tlEpiY-9N8Y,25031
884
- sglang/srt/models/qwen2_audio.py,sha256=Q6zUfBdUTXDa7qx_aDVw6et7wonJsvBbrABmxLa_1YA,7782
924
+ sglang/srt/models/phimoe.py,sha256=cZQIGjEvArPDiJzC3uKYje-o48QZC699P8TTLwfVIas,19172
925
+ sglang/srt/models/pixtral.py,sha256=H378jvdhwjgdAuUszhCe5tmcEPYvw2YPhg_d8QrjLZE,16776
926
+ sglang/srt/models/points_v15_chat.py,sha256=HV_GRgLTcetKh0B2agJry02N_atcWI5NPjjQELarUGk,6415
927
+ sglang/srt/models/qwen.py,sha256=_X1mUt_MczEE2jFK7rfGyRRtpd4U93jdD1SVpCTNsns,11856
928
+ sglang/srt/models/qwen2.py,sha256=ryMQxd10i41JWYTzxXPZMBu68XK_7wpHRQg7_fmlmy4,24361
929
+ sglang/srt/models/qwen2_5_vl.py,sha256=X7Hh-75gsoGqaK2iJg7eBUFR_8qwJRLhhkii3yxc-KA,25084
930
+ sglang/srt/models/qwen2_audio.py,sha256=Hr4j9W-q23XjQUX4kk1NxUGA-EQkj8AKDqKVK741TjI,7097
885
931
  sglang/srt/models/qwen2_classification.py,sha256=dGrMm4ebd30_lBhHOhaV57ig2iOTx3nqB4GEzsrRIM8,2747
886
932
  sglang/srt/models/qwen2_eagle.py,sha256=6spFg6JYQGeUXLv2Q5eMkVzZvnqGyvW6SdVBtFMxlTM,4806
887
- sglang/srt/models/qwen2_moe.py,sha256=LfqgHflkQFhiRVSuRnKBaCHW-zf4HKRN7q5ZGm6bGl8,30854
933
+ sglang/srt/models/qwen2_moe.py,sha256=-pkURmqiLazr7oq11-3hQCFKrdj1crx30Z7iK7DBs90,30920
888
934
  sglang/srt/models/qwen2_rm.py,sha256=-mQXDEv11p-I1HXgYLTtY6ROem6UYorO958WsDrzsgs,2837
889
- sglang/srt/models/qwen2_vl.py,sha256=HwNc08L3zgVfpD59QFcyrDefbems_dfLgapJpTBRhRw,21372
890
- sglang/srt/models/qwen3.py,sha256=2OSKkk-AdIpg6ZnNcQ9tqZLlF-VH-QxncY1J_g8k-bc,19637
935
+ sglang/srt/models/qwen2_vl.py,sha256=xV8s6kgyjZ37SqLi9nF9J6n3gq9piUmlXOe2PVPQqjI,21488
936
+ sglang/srt/models/qwen3.py,sha256=XWFC8O9WCP6oRkwUGMG5s87lGVyGa3pRQx8YwdTQzPI,20617
891
937
  sglang/srt/models/qwen3_classification.py,sha256=bdjAylXJCjXKjAho74nmtIMpEG0Af98N-aZQ-pKKMY0,3262
892
- sglang/srt/models/qwen3_moe.py,sha256=AcOGpft3b-p31LII8jA2sRDK497fIicxFNIDGQbKG28,34083
893
- sglang/srt/models/qwen3_next.py,sha256=nvQ2VVUNjHvU5cxXgx5Bh5EWMtkPMfHPYP9Ni45J3hI,37364
894
- sglang/srt/models/qwen3_next_mtp.py,sha256=F-NnFGer8KxijNKIZoKICDfp6iFwct-XV0-q0KxAApg,4465
895
- sglang/srt/models/qwen3_vl.py,sha256=2kFQAZ9yq9GNj7aVF9ktyghsTFtNOyHczBYLNF2X4UQ,29368
896
- sglang/srt/models/qwen3_vl_moe.py,sha256=Bvx7dqzg0XzipiYqioCtVkwqxGSh8Y1zyvbMQ6D7HL0,18625
938
+ sglang/srt/models/qwen3_moe.py,sha256=jm5ntkmhdkTujJEwmIRLnaHgAEC5f4pmwMASU_Ru9-c,33211
939
+ sglang/srt/models/qwen3_next.py,sha256=hbIiLXcPBNa41lRnqZqdXa7Q8FDYX9JlaviXIZN_BEk,37279
940
+ sglang/srt/models/qwen3_next_mtp.py,sha256=nua9MgSa0_2Dz2Zju0chk6VXGDndBqr-1xMQ-_OirTU,4387
941
+ sglang/srt/models/qwen3_omni_moe.py,sha256=X5dB2zB1LAAD6_baK84y6MGvEm5ArgcFDmarUyoaS9c,25444
942
+ sglang/srt/models/qwen3_vl.py,sha256=fNTKorRODMDFOkARN0vcC8sLrcwLZlLpNCf_JQJKohM,29489
943
+ sglang/srt/models/qwen3_vl_moe.py,sha256=rY87FpfVOpHw0PuYu7l5nt3sFdSIHrn964XLVQjLyLY,13708
897
944
  sglang/srt/models/registry.py,sha256=BpYy-E2m5jPmCNmue_o3G9lCQza1ge7ftmTJQ78pFGc,4276
898
- sglang/srt/models/roberta.py,sha256=3k53V2Gbezk3jU-D03thXx8csGn5DxFK01ZQ9WFiWPI,9828
899
- sglang/srt/models/sarashina2_vision.py,sha256=P71n-U3XqUcavrWNBAjpQ2V4P1fkZJOKMOqrIvfbNSg,10945
945
+ sglang/srt/models/roberta.py,sha256=h5lLKiLIjBxYEFgUORWXWdW6bJ8skKyFWNnEqVJXBt4,11907
946
+ sglang/srt/models/sarashina2_vision.py,sha256=tvH4Zb-U9pgcrxm_7Uurnmr5Xeo0xXcWYHuucIDseks,10913
900
947
  sglang/srt/models/siglip.py,sha256=DIVJRwdtpLD2QT1kVPIHw7Bn9BE40xJbkHujDNzkjgA,9892
901
948
  sglang/srt/models/solar.py,sha256=BM30Eyn5Ptc0PCA6Lx3Hn7LZ_fV05n0rVm0vY_ILv5Y,18347
902
949
  sglang/srt/models/stablelm.py,sha256=0x_31uIr3WcWwecdPAI3ek9KkyKBJS7VwknTk2y0gjY,12281
903
950
  sglang/srt/models/starcoder2.py,sha256=ts6LDIjQ2FVnyLk4s2K9COD01RRhewJDW-VlvoyAk24,12377
904
- sglang/srt/models/step3_vl.py,sha256=4j7drPJT2h-QwFH7tK7zR96xnuGvrxNbestuZsflCxg,35666
951
+ sglang/srt/models/step3_vl.py,sha256=QeU7RQ5YnU6FcAi4c-ICVABpM1PJ5E65w5XE3UJmIbE,35557
905
952
  sglang/srt/models/torch_native_llama.py,sha256=3xf6CzCiizJ8i94GIChpOLq9q64Xa519RtuEspPTZQk,18501
906
953
  sglang/srt/models/transformers.py,sha256=laA2h39MPeiAWKv4DEg0ydre-1pyXWFSRga-nwy1HUk,10244
907
- sglang/srt/models/utils.py,sha256=NNKR-N_BGXRxbO6hCSwcq9kF9gZXCOfFc_8PPyo_aFs,1748
908
- sglang/srt/models/vila.py,sha256=3NiRHWOqXnCRjXmswAldsNtiE5zRILbScEsbhUzLZF4,9846
954
+ sglang/srt/models/utils.py,sha256=yB1rHC9Xk6hTQ59Fy2ExdrtntuSn6vkm-idf3CFrYP4,2032
909
955
  sglang/srt/models/xverse.py,sha256=DsNVI9JpzN4jj0Ry6aTrj7r-xq5YLOoDX2kH4YLJA-I,14035
910
956
  sglang/srt/models/xverse_moe.py,sha256=nBtG_PAK8wcp1tW2l2Zby2oEOmtWAYzH5COH-_N5IAM,17072
911
957
  sglang/srt/models/yivl.py,sha256=oToK7-u5IGO7xwpJIQ7VtudlK6-zPqJX4bt6_wv0SH8,4850
912
958
  sglang/srt/multimodal/mm_utils.py,sha256=6bV1_a7Iet9W0y3qdd0E-hFM78zalIzNZCYbLzJX2y8,12640
913
- sglang/srt/multimodal/processors/base_processor.py,sha256=1u6ewRgHL-svE1JSZ95iJVDFZIslfvBZne_LDR8YMPc,24902
959
+ sglang/srt/multimodal/processors/base_processor.py,sha256=h914TZNxWT8-wT0bQRXUCYE4wBTylJs9ip36nFNz_KI,25096
914
960
  sglang/srt/multimodal/processors/clip.py,sha256=5nXZuQYbyf-5mlqPwjhQrlWqxvswImWZQXivChsiHfQ,1057
915
- sglang/srt/multimodal/processors/deepseek_vl_v2.py,sha256=Pymag9f0U5L_bBOTFs2q94BbuPJ-VwqSixs3meO0nsM,2569
916
- sglang/srt/multimodal/processors/dots_vlm.py,sha256=1Lk8eE7y4g1Sdn_1CfR4EOI4deVHeJRlgHLmS7UUNBw,3533
961
+ sglang/srt/multimodal/processors/deepseek_ocr.py,sha256=ZuP-zHNjPV3-lb6NkmNIitwIiXtNopNIwOLPttLjBYI,1234
962
+ sglang/srt/multimodal/processors/deepseek_vl_v2.py,sha256=nKqWQ9PmtY66cMx0YhIHGPaGIW-VyPKt_KeRqFLU60c,2479
963
+ sglang/srt/multimodal/processors/dots_vlm.py,sha256=azazFc_lFj40NJKWf1X1MGgJ5FXgv2RlgVS-R6IhFdk,3521
917
964
  sglang/srt/multimodal/processors/gemma3.py,sha256=7aD6cR60iSC_MqjzdCDMAgtrb_cmy9YJyqLgVRClBT8,1986
918
965
  sglang/srt/multimodal/processors/gemma3n.py,sha256=mtmvBasOMxb3Y2NLZR02nMYX30RLUXhDYJ5uVOElr10,2776
919
- sglang/srt/multimodal/processors/glm4v.py,sha256=SQXatu6t-YgE8wNSavBRliN7J4DqiP57lmA47-zRlYQ,4953
920
- sglang/srt/multimodal/processors/internvl.py,sha256=Po3_Dv71vKJidyyTY-KJRzGtxU2mCYIsETtcg9GhDg0,9853
921
- sglang/srt/multimodal/processors/janus_pro.py,sha256=_4ltWmdtFjbh1VCMRbcgxW61eWIABIzHG-YgwHWaYq8,1471
966
+ sglang/srt/multimodal/processors/glm4v.py,sha256=Q9ifVo4DMsxsysta2cqUGwHGdx3pT5fS_jVB31pUfP8,4883
967
+ sglang/srt/multimodal/processors/internvl.py,sha256=vvOlWmJ4AzbXnDxHED1NkRgHQfOnZlmEaWMA3-1_2cQ,9765
968
+ sglang/srt/multimodal/processors/janus_pro.py,sha256=nd1v0--5733pOwWTpArnOHCfh4aHHVBUOJPOhk9rLd4,1395
922
969
  sglang/srt/multimodal/processors/kimi_vl.py,sha256=5i8KmGxnnDtQc7XqUBNyanAfGxhxj8iRFBFONHmpiFg,1565
923
970
  sglang/srt/multimodal/processors/llava.py,sha256=-YtDc_7TsMWmwKkD4KJZW2Y0jPFlZtbQ38K_N24hk0w,8231
924
971
  sglang/srt/multimodal/processors/minicpm.py,sha256=ysJlUaxcBcWjKliz5VmXKVv0ec4QWRHXZk4ga-hXVf0,5354
925
972
  sglang/srt/multimodal/processors/mlama.py,sha256=FgPm2JQzfPFDcGYDm0mqfDfO_eJKy-NiVgF-vId6w8Y,1233
926
- sglang/srt/multimodal/processors/mllama4.py,sha256=1YGETKSzMZIa7BOwq3T9cbsYjUcW5sopcpc9JNJ000g,1911
927
- sglang/srt/multimodal/processors/phi4mm.py,sha256=8GaUVpGucV4UKoa0XkxN0gDpMZax6UyCiRBX_QaJK78,3857
973
+ sglang/srt/multimodal/processors/mllama4.py,sha256=pYzqbuV9Hb5RMYNLRabTMIMTwL8C5SCToZdhSg403go,1653
974
+ sglang/srt/multimodal/processors/nvila.py,sha256=MqpZmj2fO9U8DQSFGVkrUYqK7HBrhx5nIlMCdrZShfY,2524
975
+ sglang/srt/multimodal/processors/phi4mm.py,sha256=8Co-UPT8Am2P5dfW8bjZcy-pVAPqFXW7hbK8v23NMiA,3781
928
976
  sglang/srt/multimodal/processors/pixtral.py,sha256=Lx5Z-9NkovLDTHlRBznHxGn4r2XhDz8am2XpOskOVQY,3203
977
+ sglang/srt/multimodal/processors/points_v15_chat.py,sha256=bd_gpgkpcMcl6gxugqfQSJwyr50szjKOAHrsVrBnuPg,1575
929
978
  sglang/srt/multimodal/processors/qwen_audio.py,sha256=xkIFrHepF8Ok6MB-1OwVz1BmzPmEPgUe8lIb0azO2Bc,2411
930
- sglang/srt/multimodal/processors/qwen_vl.py,sha256=3ZjxgINjukJ953Vj6c67v8_x0Kh_9xq-1jOgVO-mqa8,10983
979
+ sglang/srt/multimodal/processors/qwen_vl.py,sha256=h26WSDFJiXvyCmUxNwetjgDANxXoQGxocdd_uudC2Vw,13537
931
980
  sglang/srt/multimodal/processors/sarashina2_vision.py,sha256=E0KSOw_yzc7prHkQfMHS_DzOcYL1GZJ77NopVkd_V5M,3024
932
- sglang/srt/multimodal/processors/step3_vl.py,sha256=9OI6UW9ybGbAnYN_S-5jh7TN8BGM_bQkvh1AHBJKzAQ,18350
933
- sglang/srt/multimodal/processors/vila.py,sha256=vWgV1lTdjiFiTR8w-7fC66-L_tpOOD59c-c9NljGelE,2192
981
+ sglang/srt/multimodal/processors/step3_vl.py,sha256=2zNf1gT-fSrA88-cvkr6xJDE0sEWFKdBDUWsMiFx_uY,18330
934
982
  sglang/srt/parser/code_completion_parser.py,sha256=KFa95OU0TeVjJkOqIgS4xV3kaJ5dFWOmAAgISyc1oEc,3803
935
- sglang/srt/parser/conversation.py,sha256=cmVT4SCqRYxprYvmftUC_z_TkhXCqYC9B2rVZsmQe30,38869
983
+ sglang/srt/parser/conversation.py,sha256=r5Fp4BGNjGeuvBw7dAUt-aUl3ExsTSG00Gq8dS8_hj0,40089
936
984
  sglang/srt/parser/harmony_parser.py,sha256=YweG4azWm5jmzYGaAHEXSaORpgWctPpSGQk_jp5H-CE,23227
937
985
  sglang/srt/parser/jinja_template_utils.py,sha256=_rtLpriMmodo-tBD8B9ifu3BsZFdaQQCDPRUqF26pIg,8006
938
- sglang/srt/parser/reasoning_parser.py,sha256=3P5viZ4oCsz695rZULWnRKSYBJxouHjihdpZMBuY9yc,11159
939
- sglang/srt/sampling/custom_logit_processor.py,sha256=AwODYVJdRkcQ8PGtJrhzKsqAgn8XZLQbAmR9fGiQzmc,1608
940
- sglang/srt/sampling/sampling_batch_info.py,sha256=a-t8Al8D4x4DRqTnvmnTA4jHzOVp6JEFNJxUat7mDqE,15498
941
- sglang/srt/sampling/sampling_params.py,sha256=yRkiwoZz0OrmmdMn2v63O5qkbns3Gv9MonxKYvyYcKc,6690
986
+ sglang/srt/parser/reasoning_parser.py,sha256=sGHGN8UUYjv6qW3HtHlgGGwf_5NRzlBF1jvCEiG-5vI,12180
987
+ sglang/srt/sampling/custom_logit_processor.py,sha256=phIOI0ttJHQ_yCZhnqD5qNs98QG0gdY9evbXkgS3544,4272
988
+ sglang/srt/sampling/sampling_batch_info.py,sha256=xlkEs3zgrwZCNBs69JHL3og9-jJnFbDD3_RLJJ-M36U,15544
989
+ sglang/srt/sampling/sampling_params.py,sha256=ULhZRhA9C1oK34T3cbwqaODV3iMX8HL1VOlo_gewzZw,9193
942
990
  sglang/srt/sampling/penaltylib/__init__.py,sha256=mtN8grFEcaBUhl4yBHmw8NNirt_i6uKO2cDNLHOpZQE,496
943
991
  sglang/srt/sampling/penaltylib/frequency_penalty.py,sha256=Loc3qjJTksNc5s-DV7QZHjgqoo5pxk7-nZzxwyhD2tQ,2144
944
992
  sglang/srt/sampling/penaltylib/min_new_tokens.py,sha256=rdU_D7RoIcrQPhysNQEzmr4TO2OoEi___p-i3QdwkgU,3331
945
993
  sglang/srt/sampling/penaltylib/orchestrator.py,sha256=Romk41ahToaVlNMnnd1Enko7_kRA4KdMGO94qnEbDHA,6061
946
994
  sglang/srt/sampling/penaltylib/presence_penalty.py,sha256=NRh10AJrrQlGJ6S-enGdRefrTrWpyqrSm-aNnyqQNQQ,2119
947
- sglang/srt/speculative/build_eagle_tree.py,sha256=O9LJNaBflgJdWT94D-rGH1gJFJ18nst2oOD8HnA2mZ4,12859
948
- sglang/srt/speculative/eagle_draft_cuda_graph_runner.py,sha256=7QpNIGrZE8GEqe_B1vuLhpWPCAV9jY0Kr67Imbirycs,14201
949
- sglang/srt/speculative/eagle_draft_extend_cuda_graph_runner.py,sha256=nqnlTLzqfz-zYJvIFALXzfgbCJdrtslIhfCnxEkvQ5I,15897
950
- sglang/srt/speculative/eagle_info.py,sha256=3JtRb60iCQzzi1JgreRhpGzC1aTs5Zbqv8XBDknnGHQ,29942
951
- sglang/srt/speculative/eagle_worker.py,sha256=bAvFoMs1Mc5YcwEQhfysuaKIPvZOLdb6QqUeqNSrrFA,46909
952
- sglang/srt/speculative/ngram_utils.py,sha256=U3a-c2bhNeIqZV4sKbzh3Hz_lAiqN1YFuFrbiaf0nsU,16600
953
- sglang/srt/speculative/ngram_worker.py,sha256=F4TDjVNiwzD-iQrqFArTybODtITdZLpFUYTtGdCPc2I,9727
954
- sglang/srt/speculative/spec_info.py,sha256=R3FK3ghFBUDSIUuNUYf41kFwEzP2fDBIlGdc45sRc4Y,2608
955
- sglang/srt/speculative/spec_utils.py,sha256=7l-jkBg-of_5NJJ1boH98GN4YyAbjxfs39gZzykfK_o,20072
956
- sglang/srt/speculative/standalone_worker.py,sha256=jcM_-7DMtRUMC9R0YeD6815kaWuftkFe8LIo7ThLVCc,4069
995
+ sglang/srt/speculative/base_spec_worker.py,sha256=M2hIHGmno1ew_gbgsU7rcIsNzR7pixDkN0UDJpZneEY,698
996
+ sglang/srt/speculative/draft_utils.py,sha256=E7u9u_-lrjOu82bBqmLB6zsbygRbWuLHO0Y1NwfbH4o,8261
997
+ sglang/srt/speculative/eagle_draft_cuda_graph_runner.py,sha256=LmqXLmMxLBuAFz8XiJpBQAsjpX77ZLrcDlv2hCXDRKs,14995
998
+ sglang/srt/speculative/eagle_draft_extend_cuda_graph_runner.py,sha256=AucQHsYM9hktPgmjtygPCxjMyQhFikJX_pc41APXR4M,16737
999
+ sglang/srt/speculative/eagle_info.py,sha256=ucS_hYCxoKlHA8pGtDN5mdk9i6z-NHYq4vAz1uLGcwk,31479
1000
+ sglang/srt/speculative/eagle_info_v2.py,sha256=2PmbYzDrMkgNky0xeTIVaL04hDI15JaEqaE8pUlsu8c,16548
1001
+ sglang/srt/speculative/eagle_utils.py,sha256=HA_h9dkO9RLOBXn4dFFQHY3yiSw4CwjuYewer5BchHI,4581
1002
+ sglang/srt/speculative/eagle_worker.py,sha256=m40xi1IAWZQLX48D297BZy7ohlCWbptqkOszXmWC9JA,39344
1003
+ sglang/srt/speculative/eagle_worker_v2.py,sha256=nzW7KQFBwU8F7F4CRlBGr7i_7_uCJzjcdMA5zCHqdB8,26315
1004
+ sglang/srt/speculative/ngram_info.py,sha256=WEpR-I6dGbzKPvH915pPysONO5TodtyfrX0mN9LNBMU,16777
1005
+ sglang/srt/speculative/ngram_worker.py,sha256=t05lgkBATs-mo45eloiqvMalsJKdHI7fZ2BTYEpXoxg,9720
1006
+ sglang/srt/speculative/spec_info.py,sha256=1AkkpJwifuOtB1ZEjLctrzzjC46O1qtJIkoAdY2rmas,2669
1007
+ sglang/srt/speculative/spec_utils.py,sha256=hxm84b37ADwntrlpJ6JOxVGdZ22Ek4uBICnHUy82AxU,21345
1008
+ sglang/srt/speculative/standalone_worker.py,sha256=9PfG1-aXG3W4j43vLnSvBuaOqgqs-MsfWRH1e7nbkSg,3745
957
1009
  sglang/srt/speculative/cpp_ngram/ngram.cpp,sha256=j8D4xNaa8dv8CN9F5TG_yHxil-A79XiuMjyEE3ZUOSs,12962
958
1010
  sglang/srt/speculative/cpp_ngram/ngram.h,sha256=9OMOzO3KXEVbT5gEXjK-IRATI63in54LjeT_Xba5DSU,2492
959
1011
  sglang/srt/speculative/cpp_ngram/ngram_cache.py,sha256=Y22AM1CC0zOOarMWJzZQKz1-IMk3d4isSGkk-Uti74I,4383
960
1012
  sglang/srt/speculative/cpp_ngram/ngram_cache_binding.cpp,sha256=yrRXulpjivoSveCRL5ORfZ0hj2yXqjdVqc88APUJllg,1911
961
1013
  sglang/srt/speculative/cpp_ngram/param.h,sha256=tLSD_Ke1c2GjTY9tl3p1UgpbrBfaZqPRsHfw2YJ87hw,4375
962
1014
  sglang/srt/speculative/cpp_ngram/queue.h,sha256=m8OK4Nd6_yWnJkWxx-JRqUIOfzQwi3apy_3TvyxSY4Q,1288
963
- sglang/srt/tokenizer/tiktoken_tokenizer.py,sha256=KJwr6Xlc7AdHegMTnAVKJlPpW59Z7AE27GTzFL78GwI,6222
1015
+ sglang/srt/tokenizer/tiktoken_tokenizer.py,sha256=xIi7o38MB-pWPLC6sTdmGC9NN_kgRDvMStIo0nJZulw,6246
964
1016
  sglang/srt/tracing/trace.py,sha256=5SKy8XA4KLaTcBO6ZJvJSP_IYK5--2RJN0Q6O6Vg10g,16110
965
- sglang/srt/utils/__init__.py,sha256=M47TWjBX488QHsDCOTKHv-979SGOsnSu1wIWEqUaXnI,86
966
- sglang/srt/utils/common.py,sha256=gbj2-BL4ffLEkdQBqBs93NYU8QWwA3UN8qOEVZua2w0,108529
967
- sglang/srt/utils/hf_transformers_utils.py,sha256=7nUwqdrlkJMbi4aB5Ebvcf5NDVkLTzX4VVTNZav9Nps,17263
1017
+ sglang/srt/utils/__init__.py,sha256=zuoHoZnKrciwFy11a6p5Ua8mYU67QUI_09L0SfEjpeo,102
1018
+ sglang/srt/utils/aio_rwlock.py,sha256=6LYtOdeTUY3hkfa1dmYkgsaF2ttrwIF3hUWz2AZ2fqw,2970
1019
+ sglang/srt/utils/bench_utils.py,sha256=0xXUeDk61RynxbOV0P_okb-5rLPpc-ZqfCGx3W35K4I,4421
1020
+ sglang/srt/utils/common.py,sha256=sAN5cre5l1b8IuUSQSzXVOOu2swU8k1ZEEVxWXbPBDw,114705
1021
+ sglang/srt/utils/hf_transformers_utils.py,sha256=E-K0S1ykwqxFNLmXCSmQ6taFYlbncN0EuvS1EPBcvmY,17793
1022
+ sglang/srt/utils/host_shared_memory.py,sha256=0tO3qMlbmEIs11XvdI7BB0AtH4Z5hm9vWEkEyau4vlM,2264
1023
+ sglang/srt/utils/offloader.py,sha256=mKN1Vd0ftr2mjcVIXKCZnc51pcQ6bfYvhqFvdAUyRC4,18771
968
1024
  sglang/srt/utils/patch_torch.py,sha256=yaVs6YNm63rFYBw-v59usYR3cmb_qX6F69L5dMfQCxg,3307
969
1025
  sglang/srt/utils/poll_based_barrier.py,sha256=9vjn32ROlSueEk7EuZjWKUrrL7XVR9KJsSVliGTYB_4,937
1026
+ sglang/srt/utils/profile_merger.py,sha256=bvnz-yHMb7zHE1Bv09JKgCgYZY1n4h_UK7Wz2wNAmro,7202
970
1027
  sglang/srt/utils/rpd_utils.py,sha256=F8FWL_mT05xKQYLrzCJ8Q_5zfZJ86dHxX6LEqpwC7rw,20743
971
1028
  sglang/srt/utils/slow_rank_detector.py,sha256=81-KXp33wevk4jG2QuThsc17fLdmdeMouxwVfSXscic,2052
1029
+ sglang/srt/utils/torch_memory_saver_adapter.py,sha256=WFwPsOBvnWu6N2yTHmiOjLbDAYosslHwNSfyFHjz-7w,2511
972
1030
  sglang/srt/weight_sync/tensor_bucket.py,sha256=vp_LRrhULNnxiw9Tf56FcEckgUg07lifgv1lasG6y7o,3695
973
1031
  sglang/srt/weight_sync/utils.py,sha256=1FHM5kBav1GJUyYQLKHSJAh9MXwsuizDWxAVJMg1ZgE,4155
974
1032
  sglang/test/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
975
1033
  sglang/test/doc_patch.py,sha256=P9PYjBIVlZHvP9M34qS-8m1scmDP27ciNJNvZOdrUKE,1614
976
1034
  sglang/test/few_shot_gsm8k.py,sha256=zalplyHOYCnIwAnSQg-xlZl-Q-wGuMfjLdl9EJnUN7U,4333
977
- sglang/test/few_shot_gsm8k_engine.py,sha256=h88s3HzEStA1zjQkR-AgIEOQMwJMSnPHkX_wGBWXUYw,3907
1035
+ sglang/test/few_shot_gsm8k_engine.py,sha256=Vgs0SBguumrdlGOY1Hjjc8nTIdv5mxiTAmR4Isa4g4I,3793
978
1036
  sglang/test/get_logits_ut.py,sha256=XotfHBDbQDRuSrJLRErsrdIOA0WDflnrK9171E-2iWE,1822
979
- sglang/test/run_eval.py,sha256=1WaGfgsxCQWrvaIWS-m4lWjfTW-Y7IcASKvTG0Q-9gM,6420
980
- sglang/test/runners.py,sha256=Tn__rDchJRP7pAorTS6gAAtqdPIeexpoEvwOwohTsB8,34105
981
- sglang/test/send_one.py,sha256=XNZdfZs21tXDBwrDj2pq46WQd5smiKoYETY8U09c1Z8,5079
982
- sglang/test/simple_eval_common.py,sha256=Fm9PYFk6bYCb8RyMWr-ODfoNMUIftahTTOCBh84qiM0,12888
983
- sglang/test/simple_eval_gpqa.py,sha256=M6hpPs8l2Z4wUiyE7rCU1zyKoImXB4Z395Hgz43uvvQ,3293
984
- sglang/test/simple_eval_humaneval.py,sha256=s8YuKIBkNUEOBP4XKsTMRdXGv5aRhl0oJyl-89lGk1w,5687
1037
+ sglang/test/kit_matched_stop.py,sha256=60YESivdEqn6XXUa9oLu1UeLozp4ahteEEvWyOUVDx8,5382
1038
+ sglang/test/run_eval.py,sha256=88EUq7X9L1jN83IO9kijEoBXq9CS0DHgKaiX4QtgmUk,7829
1039
+ sglang/test/runners.py,sha256=dz4ZlbsF7BePTrS84BmlVt8LnxkoZhkyCPdjGg1hd04,34203
1040
+ sglang/test/send_one.py,sha256=sxdAVh6nxq8IgPf1behPiWF7ZVugwoOE4DjdJyY6qzo,6392
1041
+ sglang/test/simple_eval_common.py,sha256=06wMMTLf8kpbySBtImD9xdjmYCPuJSghhKcJ_D_KdB4,12976
1042
+ sglang/test/simple_eval_gpqa.py,sha256=Ui416_9Fh8TYU_51bClhEXi6wVCLEhLG28a7qPJfJYQ,3276
1043
+ sglang/test/simple_eval_humaneval.py,sha256=AhB-0dimur6_vSH9qHVyCRag_VZ8Jf3gH6PdmTkPHAU,5658
1044
+ sglang/test/simple_eval_longbench_v2.py,sha256=LLa3qAmF8PF1HGC-ubNcaB4jaz22NhZBY67rIzTH5Dk,12169
985
1045
  sglang/test/simple_eval_math.py,sha256=6kGKNwNbLN-Af3Wj8WTimWhH-Xp3enDmSvvSjsgWUpk,2550
986
1046
  sglang/test/simple_eval_mgsm.py,sha256=rd7TSUyxdKbrXaVoewo24V8lCo_6kO8zxPhhmvylpw8,10259
987
1047
  sglang/test/simple_eval_mmlu.py,sha256=FkwamjGMjueTixymkedF-YiPloSLiy4ftILFUrKZ9XI,4357
988
1048
  sglang/test/simple_eval_mmmu_vlm.py,sha256=XpADoB825LUX-n4hDFOR3wkuowdLPB6sMHJEvM2dah8,15195
989
1049
  sglang/test/test_activation.py,sha256=bDBFl4Y30siXj7Ifl66fc2HytOrcZdHFiP2i9K8TIsY,3140
990
- sglang/test/test_block_fp8.py,sha256=CNQE3CildtLO49ZegwhWBIN3QyvA0qI6p25xQeuUrWE,21824
991
- sglang/test/test_block_fp8_deep_gemm_blackwell.py,sha256=Hnhq4kkyINHb4ONedkp5Kf7Xx0MjOoOBYL8J7ETvOVA,8180
992
- sglang/test/test_block_fp8_ep.py,sha256=n4X6ZKwuUUbV5Ofjg64ptlaFGI1LbRXDfFiJW1ELHgY,10546
1050
+ sglang/test/test_block_fp8.py,sha256=z7cVJLy9jfD-xer3lALeBWkzRxhseqSboBAw75LZGgE,21828
1051
+ sglang/test/test_block_fp8_deep_gemm_blackwell.py,sha256=G6Yw6npnUO8OSuu4L2fOl-vP3mYCI7Mcrst6hc96t4s,8170
993
1052
  sglang/test/test_custom_ops.py,sha256=PenQ8zM1wj5xwiVEPVzD37pO-x90aOfFMpCRZenaKsY,5709
994
- sglang/test/test_cutlass_moe.py,sha256=WHCruIMzxzRzxQEeFEUtk0e0IefjiO0Kjfgnx42r0UI,10069
995
- sglang/test/test_cutlass_w4a8_moe.py,sha256=Ku9VCXEMJ3BwXtvb1A3FzY-zek-S-A4thWyX6m-1v-A,9219
1053
+ sglang/test/test_cutlass_moe.py,sha256=0kzalShZCSSbV1JLKv77mx8bXgK2wvskTuPGqK_qNnQ,10051
1054
+ sglang/test/test_cutlass_w4a8_moe.py,sha256=iQIZ1K43emzqI9WVKlb2fplLPcvlpm3D7qCNK-wJfa4,8924
996
1055
  sglang/test/test_deepep_utils.py,sha256=749ysTBGNzh6rYUCJhhZBtZpeD15eWTeNHYCytcvZtc,7448
997
- sglang/test/test_deterministic.py,sha256=3TW6QogzSrvARizRRwELesKy-_NM3NfQkLEGoAvpadI,10120
998
- sglang/test/test_disaggregation_utils.py,sha256=9LB6vCKr55iHhFN5saOwlKealG4ME20O3LTBbCCPbGI,2573
1056
+ sglang/test/test_deterministic.py,sha256=94QAh_y98SLjbroZ837qQ4qv2LypvbLmgX60WD9lu24,23593
1057
+ sglang/test/test_deterministic_utils.py,sha256=iGP6d7JRpk49u4l8IXI-Ix8-pfDliTt0TwD1NvIg_Y0,2212
1058
+ sglang/test/test_disaggregation_utils.py,sha256=k_V_vw6qCEw3iZyUeujozMBkUgGRfCWxkLyCb9ktIbk,5588
999
1059
  sglang/test/test_dynamic_grad_mode.py,sha256=L76yUCuk_ymNpXD2CmO8r2GiGjIvD_gtTsuFDs2NolI,1638
1000
1060
  sglang/test/test_fp4_moe.py,sha256=wvHbGMH1UBr_XVWYgX57Y2bLy9h2DPQH10_Hmf2q6iw,22436
1001
1061
  sglang/test/test_layernorm.py,sha256=2GMWqqNDuGvSMSsEBF5eDCzwVSYA9E6hGhRo6s4ecKg,3764
1002
- sglang/test/test_marlin_moe.py,sha256=TOuYlVMx2Lv_IN3AMWsg5aGaxQF472E1B9ev_vvfU2Q,7971
1062
+ sglang/test/test_marlin_moe.py,sha256=d3LsMn9qT-r-DzHKhHikRTzSPSDWDtBNuIpz35AeM20,7958
1003
1063
  sglang/test/test_marlin_utils.py,sha256=kC7IzN364mJT9xw0nKUP1V1OK1hkw6fQTBvD4nRaOz4,5151
1004
1064
  sglang/test/test_programs.py,sha256=R-pzgNB-h_jjdJiW50hn83-nY7z5q5XcqPwugPnVF5Y,18916
1005
- sglang/test/test_utils.py,sha256=ED7Kktyg5tgaOv8UAFCg29XKMz0MLd7Zgl8ctQFwHOQ,54542
1065
+ sglang/test/test_utils.py,sha256=-i5Jh91gO7fDkr6PM1Lb7s7tyUqcI5v_qdhCKyDbgNg,56381
1006
1066
  sglang/test/attention/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
1007
- sglang/test/attention/test_flashattn_backend.py,sha256=_rTG849FwQdVTyGKkqhczaOqngBmRWXFmkl5NnuK1GM,13914
1008
- sglang/test/attention/test_flashattn_mla_backend.py,sha256=g4O50WblTpM7_Gq2b76k0i25_z01BOUBQ4i6PmyxpO4,10774
1009
- sglang/test/attention/test_prefix_chunk_info.py,sha256=hpoDe2wfSa6RlUbfyri_c0iyBTb35UXGL9I2Xh6jamM,7772
1010
- sglang/test/attention/test_trtllm_mla_backend.py,sha256=wp2_LSTwQ_vIdNPUCbEz7PA4doDU8sTWs6s6XVI0YnI,48874
1011
- sglang-0.5.3rc2.dist-info/licenses/LICENSE,sha256=FJXh51fvTQklojUFY89XVLsjxRcBqOxPs8XNy-2uZ0c,11346
1012
- sglang-0.5.3rc2.dist-info/METADATA,sha256=9jumtyFrtne6z3uEpBy23xFvdJ59YgHVrXclky7_43k,24609
1013
- sglang-0.5.3rc2.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
1014
- sglang-0.5.3rc2.dist-info/top_level.txt,sha256=yxhh3pYQkcnA7v3Bg889C2jZhvtJdEincysO7PEB09M,7
1015
- sglang-0.5.3rc2.dist-info/RECORD,,
1067
+ sglang/test/attention/test_flashattn_backend.py,sha256=Uh895KymXiRFH1pJ1NR9eSfoi6UI41YdPc4viLdUTBA,13904
1068
+ sglang/test/attention/test_flashattn_mla_backend.py,sha256=XW12ALYv2Ncs4t-Bz6omhYzNUQGe_P10K0gyqp9Y37U,10690
1069
+ sglang/test/attention/test_prefix_chunk_info.py,sha256=er0i3KGHMkw-4UZB1GCFd4oYwRcXfU5wpO1ORqpNGGA,7626
1070
+ sglang/test/attention/test_trtllm_mla_backend.py,sha256=UbtvkzTAqP-kHHEhhtPxVpuzG9QmyWBrFuJa0S7Z52g,54951
1071
+ sglang/test/longbench_v2/__init__.py,sha256=ZcOIPSyqbDI_tzB-qltXF67-4uMMPwCkkiWDVcDBDvQ,63
1072
+ sglang/test/longbench_v2/test_longbench_v2_eval.py,sha256=NI_Om4ODw5utUNsYjrj6nueebI4U5u4N2PKBtT5O27k,7352
1073
+ sglang/test/longbench_v2/validate_longbench_v2.py,sha256=mJa5Lh8XiSTXKrf5qopKuAfspSVbhoacnCkz6u4lYFQ,11635
1074
+ sglang/test/longbench_v2/validate_longbench_v2_standalone.py,sha256=gr0zif2c680hSyIHDVJ_NHYcrMquM3fpJ26mBtbm7zs,10909
1075
+ sglang-0.5.4.post1.dist-info/licenses/LICENSE,sha256=FJXh51fvTQklojUFY89XVLsjxRcBqOxPs8XNy-2uZ0c,11346
1076
+ sglang-0.5.4.post1.dist-info/METADATA,sha256=NblJNZ18C87lGtQ0Ofds9W374PcXOVZ_4lljf_zeWCU,25916
1077
+ sglang-0.5.4.post1.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
1078
+ sglang-0.5.4.post1.dist-info/top_level.txt,sha256=yxhh3pYQkcnA7v3Bg889C2jZhvtJdEincysO7PEB09M,7
1079
+ sglang-0.5.4.post1.dist-info/RECORD,,