sglang 0.5.3rc2__py3-none-any.whl → 0.5.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (408) hide show
  1. sglang/bench_one_batch.py +47 -28
  2. sglang/bench_one_batch_server.py +41 -25
  3. sglang/bench_serving.py +330 -156
  4. sglang/check_env.py +1 -1
  5. sglang/compile_deep_gemm.py +6 -2
  6. sglang/global_config.py +1 -25
  7. sglang/lang/api.py +6 -0
  8. sglang/lang/interpreter.py +1 -0
  9. sglang/lang/ir.py +13 -0
  10. sglang/launch_server.py +8 -15
  11. sglang/profiler.py +18 -1
  12. sglang/srt/_custom_ops.py +1 -1
  13. sglang/srt/batch_invariant_ops/batch_invariant_ops.py +4 -6
  14. sglang/srt/checkpoint_engine/checkpoint_engine_worker.py +142 -0
  15. sglang/srt/compilation/backend.py +437 -0
  16. sglang/srt/compilation/compilation_config.py +20 -0
  17. sglang/srt/compilation/compilation_counter.py +47 -0
  18. sglang/srt/compilation/compile.py +210 -0
  19. sglang/srt/compilation/compiler_interface.py +503 -0
  20. sglang/srt/compilation/cuda_piecewise_backend.py +228 -0
  21. sglang/srt/compilation/fix_functionalization.py +134 -0
  22. sglang/srt/compilation/fx_utils.py +83 -0
  23. sglang/srt/compilation/inductor_pass.py +140 -0
  24. sglang/srt/compilation/pass_manager.py +66 -0
  25. sglang/srt/compilation/piecewise_context_manager.py +40 -0
  26. sglang/srt/compilation/weak_ref_tensor_jit.py +16 -0
  27. sglang/srt/configs/__init__.py +4 -0
  28. sglang/srt/configs/deepseek_ocr.py +262 -0
  29. sglang/srt/configs/deepseekvl2.py +194 -96
  30. sglang/srt/configs/dots_vlm.py +2 -7
  31. sglang/srt/configs/falcon_h1.py +13 -64
  32. sglang/srt/configs/load_config.py +25 -2
  33. sglang/srt/configs/mamba_utils.py +117 -0
  34. sglang/srt/configs/model_config.py +134 -23
  35. sglang/srt/configs/modelopt_config.py +30 -0
  36. sglang/srt/configs/nemotron_h.py +286 -0
  37. sglang/srt/configs/olmo3.py +105 -0
  38. sglang/srt/configs/points_v15_chat.py +29 -0
  39. sglang/srt/configs/qwen3_next.py +11 -47
  40. sglang/srt/configs/qwen3_omni.py +613 -0
  41. sglang/srt/configs/qwen3_vl.py +0 -10
  42. sglang/srt/connector/remote_instance.py +1 -1
  43. sglang/srt/constrained/base_grammar_backend.py +5 -1
  44. sglang/srt/constrained/llguidance_backend.py +5 -0
  45. sglang/srt/constrained/outlines_backend.py +1 -1
  46. sglang/srt/constrained/reasoner_grammar_backend.py +9 -6
  47. sglang/srt/constrained/utils.py +12 -0
  48. sglang/srt/constrained/xgrammar_backend.py +20 -11
  49. sglang/srt/disaggregation/ascend/transfer_engine.py +1 -1
  50. sglang/srt/disaggregation/base/conn.py +17 -4
  51. sglang/srt/disaggregation/common/conn.py +4 -2
  52. sglang/srt/disaggregation/decode.py +123 -31
  53. sglang/srt/disaggregation/decode_kvcache_offload_manager.py +1 -1
  54. sglang/srt/disaggregation/fake/conn.py +11 -3
  55. sglang/srt/disaggregation/mooncake/conn.py +157 -19
  56. sglang/srt/disaggregation/nixl/conn.py +69 -24
  57. sglang/srt/disaggregation/prefill.py +96 -270
  58. sglang/srt/distributed/device_communicators/all_reduce_utils.py +4 -4
  59. sglang/srt/distributed/device_communicators/custom_all_reduce.py +6 -6
  60. sglang/srt/distributed/device_communicators/pymscclpp.py +2 -2
  61. sglang/srt/distributed/device_communicators/pynccl.py +24 -12
  62. sglang/srt/distributed/device_communicators/pynccl_allocator.py +2 -2
  63. sglang/srt/distributed/device_communicators/symm_mem.py +1 -1
  64. sglang/srt/distributed/naive_distributed.py +5 -4
  65. sglang/srt/distributed/parallel_state.py +70 -19
  66. sglang/srt/elastic_ep/elastic_ep.py +74 -0
  67. sglang/srt/entrypoints/context.py +3 -2
  68. sglang/srt/entrypoints/engine.py +66 -66
  69. sglang/srt/entrypoints/grpc_server.py +431 -234
  70. sglang/srt/entrypoints/harmony_utils.py +2 -2
  71. sglang/srt/entrypoints/http_server.py +120 -8
  72. sglang/srt/entrypoints/http_server_engine.py +1 -7
  73. sglang/srt/entrypoints/openai/protocol.py +225 -37
  74. sglang/srt/entrypoints/openai/serving_base.py +49 -2
  75. sglang/srt/entrypoints/openai/serving_chat.py +29 -74
  76. sglang/srt/entrypoints/openai/serving_classify.py +204 -0
  77. sglang/srt/entrypoints/openai/serving_completions.py +15 -1
  78. sglang/srt/entrypoints/openai/serving_responses.py +5 -2
  79. sglang/srt/entrypoints/openai/serving_tokenize.py +144 -0
  80. sglang/srt/environ.py +42 -4
  81. sglang/srt/eplb/eplb_algorithms/__init__.py +18 -1
  82. sglang/srt/eplb/eplb_algorithms/deepseek.py +0 -2
  83. sglang/srt/eplb/eplb_algorithms/elasticity_aware.py +87 -0
  84. sglang/srt/eplb/expert_distribution.py +3 -4
  85. sglang/srt/eplb/expert_location_dispatch.py +2 -2
  86. sglang/srt/eplb/expert_location_updater.py +2 -2
  87. sglang/srt/function_call/base_format_detector.py +17 -18
  88. sglang/srt/function_call/function_call_parser.py +18 -14
  89. sglang/srt/function_call/glm4_moe_detector.py +1 -5
  90. sglang/srt/function_call/gpt_oss_detector.py +1 -1
  91. sglang/srt/function_call/json_array_parser.py +0 -2
  92. sglang/srt/function_call/utils.py +2 -2
  93. sglang/srt/grpc/compile_proto.py +3 -3
  94. sglang/srt/{entrypoints → grpc}/grpc_request_manager.py +112 -52
  95. sglang/srt/grpc/health_servicer.py +189 -0
  96. sglang/srt/grpc/scheduler_launcher.py +181 -0
  97. sglang/srt/grpc/sglang_scheduler_pb2.py +78 -70
  98. sglang/srt/grpc/sglang_scheduler_pb2.pyi +66 -10
  99. sglang/srt/grpc/sglang_scheduler_pb2_grpc.py +89 -1
  100. sglang/srt/layers/activation.py +4 -1
  101. sglang/srt/layers/attention/aiter_backend.py +3 -3
  102. sglang/srt/layers/attention/ascend_backend.py +17 -1
  103. sglang/srt/layers/attention/attention_registry.py +43 -23
  104. sglang/srt/layers/attention/base_attn_backend.py +20 -1
  105. sglang/srt/layers/attention/double_sparsity_backend.py +2 -2
  106. sglang/srt/layers/attention/fla/chunk.py +0 -1
  107. sglang/srt/layers/attention/fla/chunk_o.py +1 -1
  108. sglang/srt/layers/attention/fla/index.py +0 -2
  109. sglang/srt/layers/attention/fla/layernorm_gated.py +50 -32
  110. sglang/srt/layers/attention/fla/utils.py +0 -3
  111. sglang/srt/layers/attention/fla/wy_fast.py +0 -2
  112. sglang/srt/layers/attention/flashattention_backend.py +12 -8
  113. sglang/srt/layers/attention/flashinfer_backend.py +248 -21
  114. sglang/srt/layers/attention/flashinfer_mla_backend.py +20 -18
  115. sglang/srt/layers/attention/flashmla_backend.py +2 -2
  116. sglang/srt/layers/attention/hybrid_attn_backend.py +1 -1
  117. sglang/srt/layers/attention/hybrid_linear_attn_backend.py +165 -62
  118. sglang/srt/layers/attention/intel_amx_backend.py +1 -1
  119. sglang/srt/layers/attention/mamba/causal_conv1d.py +1 -1
  120. sglang/srt/layers/attention/mamba/causal_conv1d_triton.py +9 -5
  121. sglang/srt/layers/attention/mamba/mamba.py +189 -241
  122. sglang/srt/layers/attention/mamba/mamba2_metadata.py +211 -0
  123. sglang/srt/layers/attention/mamba/mixer2_rms_norm_gated.py +120 -0
  124. sglang/srt/layers/attention/mamba/ops/ssd_bmm.py +0 -50
  125. sglang/srt/layers/attention/mamba/ops/ssd_chunk_scan.py +0 -60
  126. sglang/srt/layers/attention/mamba/ops/ssd_chunk_state.py +0 -111
  127. sglang/srt/layers/attention/mamba/ops/ssd_combined.py +0 -1
  128. sglang/srt/layers/attention/mamba/ops/ssd_state_passing.py +0 -11
  129. sglang/srt/layers/attention/npu_ops/mla_preprocess.py +1 -1
  130. sglang/srt/layers/attention/nsa/nsa_indexer.py +40 -83
  131. sglang/srt/layers/attention/nsa/triton_kernel.py +136 -0
  132. sglang/srt/layers/attention/nsa/utils.py +0 -1
  133. sglang/srt/layers/attention/nsa_backend.py +404 -90
  134. sglang/srt/layers/attention/triton_backend.py +208 -34
  135. sglang/srt/layers/attention/triton_ops/double_sparsity_attention.py +2 -2
  136. sglang/srt/layers/attention/triton_ops/extend_attention.py +539 -44
  137. sglang/srt/layers/attention/trtllm_mha_backend.py +2 -2
  138. sglang/srt/layers/attention/trtllm_mla_backend.py +361 -30
  139. sglang/srt/layers/attention/utils.py +11 -7
  140. sglang/srt/layers/attention/vision.py +3 -3
  141. sglang/srt/layers/attention/xpu_backend.py +1028 -0
  142. sglang/srt/layers/communicator.py +11 -7
  143. sglang/srt/layers/{quantization/deep_gemm_wrapper → deep_gemm_wrapper}/compile_utils.py +4 -8
  144. sglang/srt/layers/{quantization/deep_gemm_wrapper → deep_gemm_wrapper}/configurer.py +4 -3
  145. sglang/srt/layers/{quantization/deep_gemm_wrapper → deep_gemm_wrapper}/entrypoint.py +3 -3
  146. sglang/srt/layers/dp_attention.py +17 -0
  147. sglang/srt/layers/layernorm.py +45 -15
  148. sglang/srt/layers/linear.py +9 -1
  149. sglang/srt/layers/logits_processor.py +147 -17
  150. sglang/srt/layers/modelopt_utils.py +11 -0
  151. sglang/srt/layers/moe/cutlass_moe.py +0 -2
  152. sglang/srt/layers/moe/cutlass_w4a8_moe.py +213 -21
  153. sglang/srt/layers/moe/ep_moe/kernels.py +35 -457
  154. sglang/srt/layers/moe/ep_moe/layer.py +119 -397
  155. sglang/srt/layers/moe/flashinfer_cutedsl_moe.py +1 -1
  156. sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=128,N=192,device_name=NVIDIA_H200,dtype=fp8_w8a8.json +146 -0
  157. sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=256,N=256,device_name=NVIDIA_B200.json +146 -0
  158. sglang/srt/layers/moe/fused_moe_triton/fused_moe_triton_config.py +11 -3
  159. sglang/srt/layers/moe/fused_moe_triton/layer.py +76 -70
  160. sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py +18 -42
  161. sglang/srt/layers/moe/moe_runner/deep_gemm.py +304 -0
  162. sglang/srt/layers/moe/moe_runner/runner.py +3 -0
  163. sglang/srt/layers/moe/moe_runner/triton.py +3 -1
  164. sglang/srt/layers/moe/rocm_moe_utils.py +0 -1
  165. sglang/srt/layers/moe/router.py +51 -15
  166. sglang/srt/layers/moe/token_dispatcher/__init__.py +10 -0
  167. sglang/srt/layers/moe/token_dispatcher/base.py +1 -1
  168. sglang/srt/layers/moe/token_dispatcher/deepep.py +110 -97
  169. sglang/srt/layers/moe/token_dispatcher/mooncake.py +386 -0
  170. sglang/srt/layers/moe/token_dispatcher/standard.py +46 -0
  171. sglang/srt/layers/moe/topk.py +3 -2
  172. sglang/srt/layers/moe/utils.py +17 -1
  173. sglang/srt/layers/quantization/__init__.py +2 -53
  174. sglang/srt/layers/quantization/awq.py +183 -6
  175. sglang/srt/layers/quantization/awq_triton.py +29 -0
  176. sglang/srt/layers/quantization/base_config.py +20 -1
  177. sglang/srt/layers/quantization/compressed_tensors/__init__.py +7 -0
  178. sglang/srt/layers/quantization/compressed_tensors/compressed_tensors.py +20 -49
  179. sglang/srt/layers/quantization/compressed_tensors/compressed_tensors_moe.py +421 -70
  180. sglang/srt/layers/quantization/compressed_tensors/schemes/__init__.py +3 -0
  181. sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a16_fp8.py +4 -22
  182. sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_wNa16.py +339 -0
  183. sglang/srt/layers/quantization/fp8.py +84 -18
  184. sglang/srt/layers/quantization/fp8_kernel.py +55 -10
  185. sglang/srt/layers/quantization/fp8_utils.py +42 -14
  186. sglang/srt/layers/quantization/fpgemm_fp8.py +2 -3
  187. sglang/srt/layers/quantization/gptq.py +0 -1
  188. sglang/srt/layers/quantization/int8_kernel.py +18 -2
  189. sglang/srt/layers/quantization/marlin_utils.py +12 -0
  190. sglang/srt/layers/quantization/modelopt_quant.py +125 -100
  191. sglang/srt/layers/quantization/mxfp4.py +5 -30
  192. sglang/srt/layers/quantization/petit.py +1 -1
  193. sglang/srt/layers/quantization/quark/quark.py +3 -1
  194. sglang/srt/layers/quantization/quark/quark_moe.py +3 -3
  195. sglang/srt/layers/quantization/quark/schemes/quark_w4a4_mxfp4.py +0 -7
  196. sglang/srt/layers/quantization/unquant.py +1 -4
  197. sglang/srt/layers/quantization/utils.py +0 -1
  198. sglang/srt/layers/quantization/w4afp8.py +51 -20
  199. sglang/srt/layers/quantization/w8a8_int8.py +30 -24
  200. sglang/srt/layers/radix_attention.py +59 -9
  201. sglang/srt/layers/rotary_embedding.py +673 -16
  202. sglang/srt/layers/sampler.py +36 -16
  203. sglang/srt/layers/sparse_pooler.py +98 -0
  204. sglang/srt/layers/utils.py +0 -1
  205. sglang/srt/layers/vocab_parallel_embedding.py +4 -1
  206. sglang/srt/lora/backend/triton_backend.py +0 -1
  207. sglang/srt/lora/eviction_policy.py +139 -0
  208. sglang/srt/lora/lora_manager.py +24 -9
  209. sglang/srt/lora/lora_registry.py +1 -1
  210. sglang/srt/lora/mem_pool.py +40 -16
  211. sglang/srt/lora/triton_ops/chunked_sgmv_expand.py +1 -1
  212. sglang/srt/lora/triton_ops/chunked_sgmv_shrink.py +4 -2
  213. sglang/srt/managers/cache_controller.py +48 -17
  214. sglang/srt/managers/data_parallel_controller.py +146 -42
  215. sglang/srt/managers/detokenizer_manager.py +40 -13
  216. sglang/srt/managers/io_struct.py +66 -16
  217. sglang/srt/managers/mm_utils.py +20 -18
  218. sglang/srt/managers/multi_tokenizer_mixin.py +66 -81
  219. sglang/srt/managers/overlap_utils.py +96 -19
  220. sglang/srt/managers/schedule_batch.py +241 -511
  221. sglang/srt/managers/schedule_policy.py +15 -2
  222. sglang/srt/managers/scheduler.py +399 -499
  223. sglang/srt/managers/scheduler_metrics_mixin.py +55 -8
  224. sglang/srt/managers/scheduler_output_processor_mixin.py +317 -111
  225. sglang/srt/managers/scheduler_pp_mixin.py +341 -0
  226. sglang/srt/managers/scheduler_profiler_mixin.py +57 -10
  227. sglang/srt/managers/scheduler_runtime_checker_mixin.py +217 -0
  228. sglang/srt/managers/scheduler_update_weights_mixin.py +33 -14
  229. sglang/srt/managers/tokenizer_communicator_mixin.py +71 -55
  230. sglang/srt/managers/tokenizer_manager.py +378 -90
  231. sglang/srt/managers/tp_worker.py +212 -161
  232. sglang/srt/managers/utils.py +78 -2
  233. sglang/srt/mem_cache/allocator.py +7 -2
  234. sglang/srt/mem_cache/allocator_ascend.py +2 -2
  235. sglang/srt/mem_cache/base_prefix_cache.py +2 -2
  236. sglang/srt/mem_cache/chunk_cache.py +13 -2
  237. sglang/srt/mem_cache/common.py +480 -0
  238. sglang/srt/mem_cache/evict_policy.py +16 -1
  239. sglang/srt/mem_cache/hicache_storage.py +4 -1
  240. sglang/srt/mem_cache/hiradix_cache.py +16 -3
  241. sglang/srt/mem_cache/mamba_radix_cache.py +993 -0
  242. sglang/srt/mem_cache/memory_pool.py +435 -219
  243. sglang/srt/mem_cache/memory_pool_host.py +0 -1
  244. sglang/srt/mem_cache/multimodal_cache.py +0 -1
  245. sglang/srt/mem_cache/radix_cache.py +53 -19
  246. sglang/srt/mem_cache/radix_cache_cpp.py +19 -14
  247. sglang/srt/mem_cache/storage/aibrix_kvcache/aibrix_kvcache_storage.py +8 -2
  248. sglang/srt/mem_cache/storage/aibrix_kvcache/unit_test.py +1 -13
  249. sglang/srt/mem_cache/storage/backend_factory.py +2 -2
  250. sglang/srt/mem_cache/storage/eic/eic_storage.py +5 -6
  251. sglang/srt/mem_cache/storage/hf3fs/hf3fs_client.py +0 -1
  252. sglang/srt/mem_cache/storage/hf3fs/storage_hf3fs.py +9 -3
  253. sglang/srt/mem_cache/storage/lmcache/lmc_radix_cache.py +5 -3
  254. sglang/srt/mem_cache/storage/mooncake_store/mooncake_store.py +101 -17
  255. sglang/srt/mem_cache/storage/nixl/hicache_nixl.py +38 -9
  256. sglang/srt/mem_cache/storage/nixl/nixl_utils.py +1 -1
  257. sglang/srt/mem_cache/storage/nixl/test_hicache_nixl_storage.py +17 -2
  258. sglang/srt/mem_cache/swa_radix_cache.py +92 -26
  259. sglang/srt/metrics/collector.py +31 -0
  260. sglang/srt/metrics/func_timer.py +1 -1
  261. sglang/srt/model_executor/cuda_graph_runner.py +43 -5
  262. sglang/srt/model_executor/forward_batch_info.py +28 -23
  263. sglang/srt/model_executor/model_runner.py +379 -139
  264. sglang/srt/model_executor/npu_graph_runner.py +2 -3
  265. sglang/srt/model_executor/piecewise_cuda_graph_runner.py +539 -0
  266. sglang/srt/model_loader/__init__.py +1 -1
  267. sglang/srt/model_loader/loader.py +424 -27
  268. sglang/srt/model_loader/utils.py +0 -1
  269. sglang/srt/model_loader/weight_utils.py +47 -28
  270. sglang/srt/models/apertus.py +2 -3
  271. sglang/srt/models/arcee.py +2 -2
  272. sglang/srt/models/bailing_moe.py +13 -52
  273. sglang/srt/models/bailing_moe_nextn.py +3 -4
  274. sglang/srt/models/bert.py +1 -1
  275. sglang/srt/models/deepseek_nextn.py +19 -3
  276. sglang/srt/models/deepseek_ocr.py +1516 -0
  277. sglang/srt/models/deepseek_v2.py +273 -98
  278. sglang/srt/models/dots_ocr.py +0 -2
  279. sglang/srt/models/dots_vlm.py +0 -1
  280. sglang/srt/models/dots_vlm_vit.py +1 -1
  281. sglang/srt/models/falcon_h1.py +13 -19
  282. sglang/srt/models/gemma3_mm.py +16 -0
  283. sglang/srt/models/gemma3n_mm.py +1 -2
  284. sglang/srt/models/glm4_moe.py +14 -37
  285. sglang/srt/models/glm4_moe_nextn.py +2 -2
  286. sglang/srt/models/glm4v.py +2 -1
  287. sglang/srt/models/glm4v_moe.py +5 -5
  288. sglang/srt/models/gpt_oss.py +5 -5
  289. sglang/srt/models/grok.py +10 -23
  290. sglang/srt/models/hunyuan.py +2 -7
  291. sglang/srt/models/interns1.py +0 -1
  292. sglang/srt/models/kimi_vl.py +1 -7
  293. sglang/srt/models/kimi_vl_moonvit.py +3 -1
  294. sglang/srt/models/llama.py +2 -2
  295. sglang/srt/models/llama_eagle3.py +1 -1
  296. sglang/srt/models/longcat_flash.py +5 -22
  297. sglang/srt/models/longcat_flash_nextn.py +3 -14
  298. sglang/srt/models/mimo.py +2 -13
  299. sglang/srt/models/mimo_mtp.py +1 -2
  300. sglang/srt/models/minicpmo.py +7 -5
  301. sglang/srt/models/mixtral.py +1 -4
  302. sglang/srt/models/mllama.py +1 -1
  303. sglang/srt/models/mllama4.py +13 -3
  304. sglang/srt/models/nemotron_h.py +511 -0
  305. sglang/srt/models/olmo2.py +31 -4
  306. sglang/srt/models/opt.py +5 -5
  307. sglang/srt/models/phi.py +1 -1
  308. sglang/srt/models/phi4mm.py +1 -1
  309. sglang/srt/models/phimoe.py +0 -1
  310. sglang/srt/models/pixtral.py +0 -3
  311. sglang/srt/models/points_v15_chat.py +186 -0
  312. sglang/srt/models/qwen.py +0 -1
  313. sglang/srt/models/qwen2_5_vl.py +3 -3
  314. sglang/srt/models/qwen2_audio.py +2 -15
  315. sglang/srt/models/qwen2_moe.py +15 -12
  316. sglang/srt/models/qwen2_vl.py +5 -2
  317. sglang/srt/models/qwen3_moe.py +19 -35
  318. sglang/srt/models/qwen3_next.py +7 -12
  319. sglang/srt/models/qwen3_next_mtp.py +3 -4
  320. sglang/srt/models/qwen3_omni_moe.py +661 -0
  321. sglang/srt/models/qwen3_vl.py +37 -33
  322. sglang/srt/models/qwen3_vl_moe.py +57 -185
  323. sglang/srt/models/roberta.py +55 -3
  324. sglang/srt/models/sarashina2_vision.py +0 -1
  325. sglang/srt/models/step3_vl.py +3 -5
  326. sglang/srt/models/utils.py +11 -1
  327. sglang/srt/multimodal/processors/base_processor.py +6 -2
  328. sglang/srt/multimodal/processors/deepseek_ocr.py +37 -0
  329. sglang/srt/multimodal/processors/deepseek_vl_v2.py +0 -3
  330. sglang/srt/multimodal/processors/dots_vlm.py +0 -1
  331. sglang/srt/multimodal/processors/glm4v.py +1 -5
  332. sglang/srt/multimodal/processors/internvl.py +0 -2
  333. sglang/srt/multimodal/processors/janus_pro.py +0 -1
  334. sglang/srt/multimodal/processors/mllama4.py +0 -8
  335. sglang/srt/multimodal/processors/phi4mm.py +0 -1
  336. sglang/srt/multimodal/processors/points_v15_chat.py +52 -0
  337. sglang/srt/multimodal/processors/qwen_vl.py +75 -16
  338. sglang/srt/multimodal/processors/step3_vl.py +1 -1
  339. sglang/srt/parser/conversation.py +41 -0
  340. sglang/srt/parser/reasoning_parser.py +0 -1
  341. sglang/srt/sampling/custom_logit_processor.py +77 -2
  342. sglang/srt/sampling/sampling_batch_info.py +17 -22
  343. sglang/srt/sampling/sampling_params.py +70 -2
  344. sglang/srt/server_args.py +577 -73
  345. sglang/srt/server_args_config_parser.py +1 -1
  346. sglang/srt/single_batch_overlap.py +38 -28
  347. sglang/srt/speculative/base_spec_worker.py +34 -0
  348. sglang/srt/speculative/draft_utils.py +226 -0
  349. sglang/srt/speculative/eagle_draft_cuda_graph_runner.py +24 -7
  350. sglang/srt/speculative/eagle_draft_extend_cuda_graph_runner.py +23 -2
  351. sglang/srt/speculative/eagle_info.py +57 -18
  352. sglang/srt/speculative/eagle_info_v2.py +458 -0
  353. sglang/srt/speculative/eagle_utils.py +138 -0
  354. sglang/srt/speculative/eagle_worker.py +83 -280
  355. sglang/srt/speculative/eagle_worker_v2.py +702 -0
  356. sglang/srt/speculative/{ngram_utils.py → ngram_info.py} +14 -9
  357. sglang/srt/speculative/ngram_worker.py +12 -11
  358. sglang/srt/speculative/spec_info.py +2 -0
  359. sglang/srt/speculative/spec_utils.py +38 -3
  360. sglang/srt/speculative/standalone_worker.py +4 -14
  361. sglang/srt/tokenizer/tiktoken_tokenizer.py +2 -2
  362. sglang/srt/two_batch_overlap.py +28 -14
  363. sglang/srt/utils/__init__.py +1 -1
  364. sglang/srt/{bench_utils.py → utils/bench_utils.py} +4 -2
  365. sglang/srt/utils/common.py +192 -47
  366. sglang/srt/utils/hf_transformers_utils.py +40 -17
  367. sglang/srt/{host_shared_memory.py → utils/host_shared_memory.py} +0 -1
  368. sglang/srt/{offloader.py → utils/offloader.py} +4 -4
  369. sglang/srt/utils/profile_merger.py +199 -0
  370. sglang/test/attention/test_flashattn_backend.py +1 -1
  371. sglang/test/attention/test_flashattn_mla_backend.py +0 -1
  372. sglang/test/attention/test_prefix_chunk_info.py +0 -2
  373. sglang/test/attention/test_trtllm_mla_backend.py +221 -53
  374. sglang/test/few_shot_gsm8k_engine.py +2 -4
  375. sglang/test/kit_matched_stop.py +157 -0
  376. sglang/test/longbench_v2/__init__.py +1 -0
  377. sglang/test/longbench_v2/test_longbench_v2_eval.py +238 -0
  378. sglang/test/longbench_v2/validate_longbench_v2.py +337 -0
  379. sglang/test/longbench_v2/validate_longbench_v2_standalone.py +306 -0
  380. sglang/test/run_eval.py +41 -0
  381. sglang/test/runners.py +2 -0
  382. sglang/test/send_one.py +42 -7
  383. sglang/test/simple_eval_common.py +3 -0
  384. sglang/test/simple_eval_gpqa.py +0 -1
  385. sglang/test/simple_eval_humaneval.py +0 -3
  386. sglang/test/simple_eval_longbench_v2.py +344 -0
  387. sglang/test/test_block_fp8.py +1 -2
  388. sglang/test/test_block_fp8_deep_gemm_blackwell.py +0 -1
  389. sglang/test/test_cutlass_moe.py +1 -2
  390. sglang/test/test_cutlass_w4a8_moe.py +10 -20
  391. sglang/test/test_deterministic.py +232 -99
  392. sglang/test/test_deterministic_utils.py +73 -0
  393. sglang/test/test_disaggregation_utils.py +81 -0
  394. sglang/test/test_marlin_moe.py +0 -1
  395. sglang/test/test_utils.py +85 -20
  396. sglang/version.py +1 -1
  397. {sglang-0.5.3rc2.dist-info → sglang-0.5.4.dist-info}/METADATA +45 -33
  398. {sglang-0.5.3rc2.dist-info → sglang-0.5.4.dist-info}/RECORD +404 -345
  399. sglang/srt/layers/attention/mamba/mamba_utils.py +0 -81
  400. sglang/srt/managers/tp_worker_overlap_thread.py +0 -311
  401. sglang/srt/speculative/build_eagle_tree.py +0 -427
  402. sglang/test/test_block_fp8_ep.py +0 -358
  403. /sglang/srt/layers/{quantization/deep_gemm_wrapper → deep_gemm_wrapper}/__init__.py +0 -0
  404. /sglang/srt/{aio_rwlock.py → utils/aio_rwlock.py} +0 -0
  405. /sglang/srt/{torch_memory_saver_adapter.py → utils/torch_memory_saver_adapter.py} +0 -0
  406. {sglang-0.5.3rc2.dist-info → sglang-0.5.4.dist-info}/WHEEL +0 -0
  407. {sglang-0.5.3rc2.dist-info → sglang-0.5.4.dist-info}/licenses/LICENSE +0 -0
  408. {sglang-0.5.3rc2.dist-info → sglang-0.5.4.dist-info}/top_level.txt +0 -0
@@ -1,23 +1,23 @@
1
1
  sglang/__init__.py,sha256=CK60u1J439CJZaPihWqlDjFZ8doIC-5YgIYz-E1PIh4,1823
2
2
  sglang/bench_offline_throughput.py,sha256=Bge0KG4Uiv9CHsxDnqKdXJmG_TcxM4blz3CmvLmDRvM,14815
3
- sglang/bench_one_batch.py,sha256=TFYI_wQGFpeJMV5r4C_EABmwZD3EDNuT1ORQX3jUWlY,23109
4
- sglang/bench_one_batch_server.py,sha256=nD7GMOQE1I57BC1E7dTmqx-PMeSUPq8RF8W39s5z86I,26128
5
- sglang/bench_serving.py,sha256=0l-QrhHtIMUVyewiuvxoRx6_MIulMpadkKtbzpQMxyQ,87841
6
- sglang/check_env.py,sha256=qDMIG2rCNBH1yKnxQmF-Bp10oiFMUKMgfZLHZYOmdSY,8412
7
- sglang/compile_deep_gemm.py,sha256=EsgboGA-MK3Rvx9TlUJPLxJ5LBira4bTcHJLKEp1H6k,6488
8
- sglang/global_config.py,sha256=qnMsK6AKzl8dhEbg-Jlbp_OVY9JUV0X9BqQiOl8VkiE,1737
9
- sglang/launch_server.py,sha256=zBCKcUg4d7_-Zpp0NE9C7z8CIFYw94UH0wo7ZIilHMM,1063
10
- sglang/profiler.py,sha256=zjD9-TxnDv3yU1Qmv4vItH5Nuhiu230ssqOA43EyH2g,4420
3
+ sglang/bench_one_batch.py,sha256=cjECJgTmPcnP-b8Fcy7ldFU6FaEqBpz7Z45RTwBwNR8,23763
4
+ sglang/bench_one_batch_server.py,sha256=8zAjLFu0tgfIhhtEaPGdDhi15YCcHcaK19vz6Rmn_Jw,26565
5
+ sglang/bench_serving.py,sha256=KrPHSzFmzyhRerLBBOm-72sOr1toBQkNIOvRPdVBBc0,94023
6
+ sglang/check_env.py,sha256=6wRlWL7UwY1JjYRG307bLLJRoirPk2RVLYrDWV8Et0c,8413
7
+ sglang/compile_deep_gemm.py,sha256=v7WJZLSrJw3Vc_28lTReRDJ1WdiPKLRHizFi2l2chv8,6614
8
+ sglang/global_config.py,sha256=bVpUL_gMSA0FwJl8y8tP5CIa7d083o6Dcak-yRytzGw,767
9
+ sglang/launch_server.py,sha256=VqPi2ecJmQuvw1aYppiKEp45NC_FthgBjzhHM2pXItY,620
10
+ sglang/profiler.py,sha256=uprc8Lo-WeqrQY9u2Wj503swEp4P_2laLJ6cWGALgME,4854
11
11
  sglang/utils.py,sha256=YreOyt4-fWdDcg01abaMJ0y0ly4gYps26vRlmWhwGC8,17267
12
- sglang/version.py,sha256=PgjGjGwMjSvY5WJg-jqo1zKEBRurR4G1DY2OwoitREE,25
12
+ sglang/version.py,sha256=DITpct-LrdIsTgwx2NgH5Ghx5y8Xgz1YMimy1ZV5RTY,22
13
13
  sglang/eval/llama3_eval.py,sha256=mLNRZJIqV4CfqrY8UGnJEcHw2Xsyr1eyYZgFSUFYr1g,9997
14
14
  sglang/eval/loogle_eval.py,sha256=-CC2s2kh5qUoDrHRkQVkC_jNvBgNojXbf456ny5s78s,4557
15
- sglang/lang/api.py,sha256=rcp3GeoyZhmJ0GDLPRkuZNcxd0TBJy_wfUDpcmQoqW8,7210
15
+ sglang/lang/api.py,sha256=kyfJuErqMyle6hnx3Q_oqNSFDe0q4gFob1yd5ZLTatw,7438
16
16
  sglang/lang/chat_template.py,sha256=4_JVa7NDpHP2it6rAQS5UnCSxSMy0rtfdOgSvH_Kbdc,22549
17
17
  sglang/lang/choices.py,sha256=-W1DVw9N9ZliVpvmWrzIXG4cswAah8eMQrHWzkS3D8o,6234
18
18
  sglang/lang/compiler.py,sha256=MAuzoOOpb98njJ7Io2SDmFkhTroDYiq0te0ZpfHkMY4,7597
19
- sglang/lang/interpreter.py,sha256=F-wxyKDUnTygmJpSEYsrQermls2RyWJntOep9_P7V1I,34818
20
- sglang/lang/ir.py,sha256=FnRJ-lndAsR4GR0ONJRPDtlYx8FvL9RIk44vSA16RBk,19656
19
+ sglang/lang/interpreter.py,sha256=wy6dWNzk57Mp7U15I3VeCT_UFBSnLmff2vXRdDbh1hE,34844
20
+ sglang/lang/ir.py,sha256=wcV1dMwn-L6gK-ERu-Gg_2dqCkAuWkFNIGh0kRhFa7M,20184
21
21
  sglang/lang/tracer.py,sha256=ljBo9VZ0zVaGwzNk32qw21acyo60N0UjIjqBbT5a1WI,8175
22
22
  sglang/lang/backend/anthropic.py,sha256=qXWqqFlk0-nC62QCcYIRjLTc4AHrdTKpl7hCeDzROUs,2019
23
23
  sglang/lang/backend/base_backend.py,sha256=tEutGCU5tni1xGlrIjAVvA9aflJBt2duKrIDzqabJWc,1975
@@ -25,148 +25,167 @@ sglang/lang/backend/litellm.py,sha256=ugmL7sfUxkUHVbHtwNzHgdQAEd4UCjNQboFuE3KThc
25
25
  sglang/lang/backend/openai.py,sha256=YFs7pCDK6_DoYmjTa-vgDVdaeE4PYr7E-sIC1q7vAns,16422
26
26
  sglang/lang/backend/runtime_endpoint.py,sha256=UZRKqQ8eE_N11oiv9rViF3THNq21A_uio0N0Bt9MaY8,17487
27
27
  sglang/lang/backend/vertexai.py,sha256=gz0uNYyBb88jbPYz6ZIJ774fefrcbuVdoK33bphUZpI,4827
28
- sglang/srt/_custom_ops.py,sha256=9GPNUyqnybgvUnzdQ8n5_NgluHmQNw0Gptos0iLPfrY,5342
29
- sglang/srt/aio_rwlock.py,sha256=6LYtOdeTUY3hkfa1dmYkgsaF2ttrwIF3hUWz2AZ2fqw,2970
30
- sglang/srt/bench_utils.py,sha256=zNTsTBUta27XxojgvR5p5X9M0v1MFzZ7dcX9TMq4NvQ,4348
28
+ sglang/srt/_custom_ops.py,sha256=P4MLtuF8DzK66R_Sw88AYsiCOn7YNGZ93H7isJq0dUA,5356
31
29
  sglang/srt/constants.py,sha256=0i-tEwG2BSYNDy96MxnGHV5HnBELkYcnsVGsE-R18o0,93
32
30
  sglang/srt/custom_op.py,sha256=m5F7x3LHlnOuesmcNmJtIWsfHGFLBJ807vKc05Gu1D0,3312
33
- sglang/srt/environ.py,sha256=QaYZPUkvV-KyRWzJ6nz-kNO75Khn_pNbx2yX_YBL7-A,8894
34
- sglang/srt/host_shared_memory.py,sha256=00TgVm3PNCl4rTPJZChG5uu4I5hd_Xf587r39tibmIg,2274
35
- sglang/srt/offloader.py,sha256=cYON5jZErAp88Sh5JseaRw0B2Ho2MQz9smgvrTc-2KA,18765
31
+ sglang/srt/environ.py,sha256=2D5x1OaR_lRd-oSLilf1lZo01Pqz2_t5Bru-LHIxYys,10447
36
32
  sglang/srt/operations.py,sha256=za_h1_kcR1Te6-i_r0i_zAeumbmIRhLK2pS31sukkrw,6089
37
33
  sglang/srt/operations_strategy.py,sha256=-w6GI2VgSGvORy3pUWRAJo6244ykSW1ZBV1Dx0fZlHA,7138
38
- sglang/srt/server_args.py,sha256=pjtjMs62nnyMIRQMaL161QKDE2DViatyZNrfbYSkYuM,137969
39
- sglang/srt/server_args_config_parser.py,sha256=niM5LYNaVxQg4FKHUJ3YmMZ-ekB3bDlvTwD7KqdLZoE,5220
40
- sglang/srt/single_batch_overlap.py,sha256=m70hHl1ufIvc_9Nl2bYqnIcfoMIJkPyGjWIqJLBsKhI,4844
41
- sglang/srt/torch_memory_saver_adapter.py,sha256=WFwPsOBvnWu6N2yTHmiOjLbDAYosslHwNSfyFHjz-7w,2511
42
- sglang/srt/two_batch_overlap.py,sha256=0cHUV2ZeyCaojDRpqNcRSUIQM3_Y4H4HfssML2gt_6k,34240
34
+ sglang/srt/server_args.py,sha256=Qen-c7jcgQpTrub1ogsyxX_8Joj7WfP_rA6ZMIfsH-Q,160382
35
+ sglang/srt/server_args_config_parser.py,sha256=NW_tnD_ixnIpEhIuhn1W67pnAOJSGWKKN-jHcssKD-Q,5213
36
+ sglang/srt/single_batch_overlap.py,sha256=mUW2yBRxLWKlDlpTqIKkICWzMkcbKsmPjUtcvGiVYq4,5388
37
+ sglang/srt/two_batch_overlap.py,sha256=xDDMyE1hKQPq-yu_GkVnNXskyc1CVoPYPaB6AvoPXKA,34667
43
38
  sglang/srt/warmup.py,sha256=fQYzNp-I9mZccs2BerI6mOZd1CDQjdiuFCeUkcwiOb4,1834
44
39
  sglang/srt/batch_invariant_ops/__init__.py,sha256=Z9TvOE4BL7cAaBIePEsVglH7RcWBSBIsSHs-XbveQNE,728
45
- sglang/srt/batch_invariant_ops/batch_invariant_ops.py,sha256=5vtvEFezea4tjGFuVMkadgZxynxAZZ8yxGwpkSm7Sl4,16246
46
- sglang/srt/configs/__init__.py,sha256=aMxLOh72NAL0iQl0aPcPP2Ih9oY5vhHUHAcymE0fv-4,1142
40
+ sglang/srt/batch_invariant_ops/batch_invariant_ops.py,sha256=Kb4uxHPDwlQYg1CfEOhuRDcHTI3Yr8Kbq3GkF57iUZs,16249
41
+ sglang/srt/checkpoint_engine/checkpoint_engine_worker.py,sha256=YlyiZ46LOi5aib0N5IyrPMuGbnVi_Xnnf9r2XdR1OtY,5509
42
+ sglang/srt/compilation/backend.py,sha256=SClr9jjC8wb8vymB2cE-6DN36bEbZeBlYcFx0qe-pfM,14395
43
+ sglang/srt/compilation/compilation_config.py,sha256=9GDBY3SAV5hIJ6hmYurJ3vfYh9-gtZP3nEzp0TrUdeM,617
44
+ sglang/srt/compilation/compilation_counter.py,sha256=qrCqMCaui2eOBpxi3ZBiuvmJ6dkWah_6dYjhvu6_MqE,1623
45
+ sglang/srt/compilation/compile.py,sha256=All4G5VjYBY9MOalW5YDo17eEtho-o_BG5V86lNJ-5c,6965
46
+ sglang/srt/compilation/compiler_interface.py,sha256=k6EDIpdtEB0NCOaDxsgXwaSXH4xTLQsflFdy-sTsyRQ,19508
47
+ sglang/srt/compilation/cuda_piecewise_backend.py,sha256=_MOgUhUGg9kBDIhSJWq-vUwZrluwScy4PbCzD-X9g7g,9237
48
+ sglang/srt/compilation/fix_functionalization.py,sha256=SDQ1Pbvh5PiUg3M82NAfyXPjz21wmBRQgzM_HHKRHss,5156
49
+ sglang/srt/compilation/fx_utils.py,sha256=vv32jqNIYcdvLiz0W4yGcUyh_ko6LJwrES8ZMU2vIis,2873
50
+ sglang/srt/compilation/inductor_pass.py,sha256=zebqIifs0wvLXIUy43ablX87qh4jnn9876ZHzw4c2IQ,4041
51
+ sglang/srt/compilation/pass_manager.py,sha256=n8TIJkWIxegDd5lX6Xja4l4YuBQLZvn2_9yEY8Esp80,2213
52
+ sglang/srt/compilation/piecewise_context_manager.py,sha256=P-WpB3Ny8sMEFUpkQv4ExSoqQPPyEwhXZraDWQjP8ak,1113
53
+ sglang/srt/compilation/weak_ref_tensor_jit.py,sha256=XJLJsj5t84QLhF0Bjx0j2Iow51d8zc6inASOd9watFA,390
54
+ sglang/srt/configs/__init__.py,sha256=a8_ODqcCzMN1q_fNHKMBNHM9aGH8LF92GLGcLeViLWY,1291
47
55
  sglang/srt/configs/chatglm.py,sha256=j-b0YkdYUmQm2y1kNmMJtKeACxWKmBbvNNkDWbs6kbI,2907
48
56
  sglang/srt/configs/dbrx.py,sha256=tdhIkXAQl1yr0MxqFmsDG1E0e2puRTTKm6UTyANBLac,11005
49
- sglang/srt/configs/deepseekvl2.py,sha256=sYMmoy5_LlDXht7MTi4QGYOaiE8iMGUO44bnuOu4i8I,23683
57
+ sglang/srt/configs/deepseek_ocr.py,sha256=3nZL7pWJ-WwN6ZYqRsPy7zbxgZCggW5igVfIvJhGUXY,8102
58
+ sglang/srt/configs/deepseekvl2.py,sha256=QTZnL47wIx0mkd_HCn_Kfzu4oCHEJaYZpvVSjmaDvp8,26518
50
59
  sglang/srt/configs/device_config.py,sha256=1Iaxrk65bJsCWV3E2cDfiap_T_xJIIj9oFVn9y6v0EI,515
51
60
  sglang/srt/configs/dots_ocr.py,sha256=HSKerqzHzrKIzoNZOUXA_KiBLmL-Rs8h4Vw17pjF1Uo,1863
52
- sglang/srt/configs/dots_vlm.py,sha256=PYoSrT-sRoykfNhdXFauqv21Sb54iavjYD3F09xww3U,5176
61
+ sglang/srt/configs/dots_vlm.py,sha256=Q2qaP65sYCKGmg_bvc4g5yb-pasdZNx4xnnlzu6Ed1U,4912
53
62
  sglang/srt/configs/exaone.py,sha256=Duxd4yQoKy8GWEzZD_kCY_OzmN_67CTJL_Kgn0eXk3g,10731
54
- sglang/srt/configs/falcon_h1.py,sha256=qn_n2uLRVN4EK4gn4UoHo_1NhV6kPFdOIb5TBJ0NAYs,16395
63
+ sglang/srt/configs/falcon_h1.py,sha256=LFxN0We8Gfgk-RWVeegzvyh-R4msAYF96ioO97Ta4ig,14939
55
64
  sglang/srt/configs/internvl.py,sha256=rIC-CBWJHy-Mjmk0_H3YcvVmZzeCRbXGo3dQMex-yeg,28141
56
65
  sglang/srt/configs/janus_pro.py,sha256=yI2c_aWBIKiTcK6RZxK6hq8CIxyYRH_NN8uaSNKsrKI,19156
57
66
  sglang/srt/configs/kimi_vl.py,sha256=4W7VQI3pr888ZsFA2SqCQo4mI0seXTOrGQ-x3oTvWew,1358
58
67
  sglang/srt/configs/kimi_vl_moonvit.py,sha256=hx2Rt4JSFbvy2HUTeLjBpge87m8M6ITAhqsgdNf_Jd4,1163
59
- sglang/srt/configs/load_config.py,sha256=_XhZdoP2Kbzih3FBZiiwGhXBf2-bNrn6f8eA63zqS7Y,3840
68
+ sglang/srt/configs/load_config.py,sha256=_x9n6Rkbi3VqYmXJ7PNdce32mvUNP1ewqrkUsJ7qprw,4765
60
69
  sglang/srt/configs/longcat_flash.py,sha256=Qp25xJVLq2K72Z80cXhcJxtqhagAdiPySDoevuT0Sno,3589
61
- sglang/srt/configs/model_config.py,sha256=fICFIXWjFrS7xtQYA-8TNJigD9blBfnEKmsbDsbMenE,35245
62
- sglang/srt/configs/qwen3_next.py,sha256=MVMDzdwlxrdar_6p6n9HjaXAei_giFfXlQNJAWpSLQ4,15794
63
- sglang/srt/configs/qwen3_vl.py,sha256=FMC-SVeM_sxLdjEAfJ_oNog1P5kXm70NMHNXmzSMo_U,29008
70
+ sglang/srt/configs/mamba_utils.py,sha256=AD96wj8FCxRsEovdtGn88xzcKAw5KErbO5xFSk0xwxc,3684
71
+ sglang/srt/configs/model_config.py,sha256=7KAlFFRQr9Vsj2PzFBsGnmzXQGWo3eHtftSnaQjDruE,39695
72
+ sglang/srt/configs/modelopt_config.py,sha256=pr4Q_J4G1Ff-wy24BYRzWaN0UI34rreGef7Nt6d0X3M,1070
73
+ sglang/srt/configs/nemotron_h.py,sha256=X39hWm2KQoAcZ4HXKDCfbua9aOTlcxcK89c52cmAq-k,13072
74
+ sglang/srt/configs/olmo3.py,sha256=DOyp1cNi_n8ckz9Ohs3zUZqkk6n26UBsNQ3zngHNNNY,3600
75
+ sglang/srt/configs/points_v15_chat.py,sha256=qand7WMc3L96wg-wzA9YqnzMz7ZUM6quAuThjO1rfM8,983
76
+ sglang/srt/configs/qwen3_next.py,sha256=XQje5KTnw2aA187DNkAFRUbIPFnTsKwl64FJCW1gcLA,14884
77
+ sglang/srt/configs/qwen3_omni.py,sha256=m6NxdP-iKVkKuYARukqjNhQ01D5gmNQOsfFKU5qZEqI,22384
78
+ sglang/srt/configs/qwen3_vl.py,sha256=0Coyj3ZYUJIgEfxt_6xx8wgd5Fy1tkMAeEhIaXXaZyk,28854
64
79
  sglang/srt/configs/step3_vl.py,sha256=_Otgnym57DVgB_kZ__8c1_Ys5gSalA_K0ZuVjcG51T0,4845
65
80
  sglang/srt/configs/update_config.py,sha256=GEf-XhL8JPrbX9-Hz8V7S3M6YTg76DVdIhc_4YdMDtc,6291
66
81
  sglang/srt/configs/utils.py,sha256=3nHUfisMs_Ltuhv8OZTNCJp63YJKJVF43h1QZB1zqx8,670
67
82
  sglang/srt/connector/__init__.py,sha256=zPuaRKulJsrDyT3OtN9wUT-4fqQBX-cJr2fZUB0_KPM,1562
68
83
  sglang/srt/connector/base_connector.py,sha256=LCKsTX_yWHclPrzNNB1fLwVCN8rIDKZaZhqHQ54B9MU,2774
69
84
  sglang/srt/connector/redis.py,sha256=K3fJSm2rZsd0R_KkICV3jIWKtrwxXE1tYktWnovLbz4,2514
70
- sglang/srt/connector/remote_instance.py,sha256=X_PIZFvZPsnUZ_54AgnzR0NdUfi6ClwQVlNexZatkXU,2710
85
+ sglang/srt/connector/remote_instance.py,sha256=LpPVftvXN0xRVPthwFm2fgnuvxSlYxwE_47NRGAmkmY,2704
71
86
  sglang/srt/connector/s3.py,sha256=hn5Ow9Y6ItS8RMJDwnTQe5QaiQ7HKMgiwggE9QnUewM,3743
72
87
  sglang/srt/connector/utils.py,sha256=isTvxauz1_8no5MW6p8Bwj2H9mQkweaRO_RSwAPA7R8,983
73
88
  sglang/srt/connector/serde/__init__.py,sha256=zuleyYN-jrDyiPiXjTbQKA27llb4H7HuDTZcBwrLk1U,707
74
89
  sglang/srt/connector/serde/safe_serde.py,sha256=XSjb9mRv1HqeG6Jiw633EOQYlrcI23Q21UluYqPZaWA,760
75
90
  sglang/srt/connector/serde/serde.py,sha256=n59I2MXLa7WCyN_8pEd8L-scJk7lMhmEX-GOUIhF0ZA,1004
76
- sglang/srt/constrained/base_grammar_backend.py,sha256=FKlBqllZ-bs65DYG5l-qsuuqfXOPeuUe5_NvPlpBzUs,8114
77
- sglang/srt/constrained/llguidance_backend.py,sha256=JkA_59nZ4zd8ciGvXsZ-OEsGCyQMoIxBO8QXIUqAUn4,6161
78
- sglang/srt/constrained/outlines_backend.py,sha256=t4gkO9AX8xfYulvhNx0n-p1kUavJnCjE9XjwN1Z4BV4,6883
91
+ sglang/srt/constrained/base_grammar_backend.py,sha256=LVEaY4JrF8zCbn1chwva0zJ9cW00dZ4yVTREmzJx9Zs,8307
92
+ sglang/srt/constrained/llguidance_backend.py,sha256=OxJoMbhi1InKzxMkGQrvetWU5GR9n8C1jc74fHBFQtc,6433
93
+ sglang/srt/constrained/outlines_backend.py,sha256=1pQNeROdrFBiXIIkIYKB0xufIfp6KDxm8G7C_xMooH8,6889
79
94
  sglang/srt/constrained/outlines_jump_forward.py,sha256=dm3PVswx2oE_JfAv-tPd7irMI95VCq4cZT-AF-Ohx3s,6823
80
- sglang/srt/constrained/reasoner_grammar_backend.py,sha256=YFxWuOTTo4e6cGhxnaBwuwli6f8FTUJtszib8dBq_8I,3207
81
- sglang/srt/constrained/xgrammar_backend.py,sha256=Dhn0sROXQtybY-sJfMcleIu_Rmn0sjleGMywCD3Simk,9338
95
+ sglang/srt/constrained/reasoner_grammar_backend.py,sha256=O36HzXEB-YKgo0recrLtW36EiTZIBbpnbHBPeGkWEyI,3334
96
+ sglang/srt/constrained/utils.py,sha256=ZDXuyKjGYHfPo3ZhcgxZe7pk_Qb4_ilBV2WjbDRXKDc,418
97
+ sglang/srt/constrained/xgrammar_backend.py,sha256=x7iwMMojTI3pcMmnyUPI1k4bCRoe1IIw76_IIJTAXBs,9855
82
98
  sglang/srt/constrained/triton_ops/bitmask_ops.py,sha256=WjTen9iuuFWLzkE1mAHQZB9_7aIy5QH8Wjf-lB-Fams,4614
83
99
  sglang/srt/debug_utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
84
100
  sglang/srt/debug_utils/dump_comparator.py,sha256=3rWdv4BQXTDtB3z5ao9VPN5lK31ImKf2zMWX7f0Xe6s,5394
85
101
  sglang/srt/debug_utils/dump_loader.py,sha256=RzWpl7RsDRw98DJMEvf6U9c9fPiobyeWI8opmRaRGGA,2632
86
102
  sglang/srt/debug_utils/dumper.py,sha256=6frfI4WErneQE4RpXgAR5gZJQRdzcQjyO3McW56jgYo,3517
87
103
  sglang/srt/debug_utils/text_comparator.py,sha256=NLJdjUikW--bWnGQWIeFJesyuvZ2Vni2S53fIED-m8s,7370
88
- sglang/srt/disaggregation/decode.py,sha256=_k9uVKzFUxEJIpBQSjoBVaY-GMoc0zTW6FuVhiH05os,36936
89
- sglang/srt/disaggregation/decode_kvcache_offload_manager.py,sha256=BWjhO0CDdpU8VIC_-hL9R8CjqUk5cQ1ivfXLjPSS9jU,7029
104
+ sglang/srt/disaggregation/decode.py,sha256=EJNSz7J2hmO5VuqXu14O6k57w7WizFRK5n1uE8iSzdY,40441
105
+ sglang/srt/disaggregation/decode_kvcache_offload_manager.py,sha256=jD_O-uRaZ5cD8C9qtto6m5ZXyM86loJzkdLgwheMBao,7045
90
106
  sglang/srt/disaggregation/decode_schedule_batch_mixin.py,sha256=BeGxXbFLW_ZbuyOs0idWzlicCh6NA1pTOXgON5SAdaE,6947
91
107
  sglang/srt/disaggregation/kv_events.py,sha256=yFbtwOeblcCmOXTjg00TopxnyjkmCBQIVz46KB8jetY,13555
92
108
  sglang/srt/disaggregation/mini_lb.py,sha256=JY2uCeUM3Zk3FdGWmCQBY3LeiJ5FM1PlrqAW8wJTTHI,395
93
- sglang/srt/disaggregation/prefill.py,sha256=eOEdepYknYHO6vz-MCV-jmuTOe_qq9X_ZD_AX1SwICU,37138
109
+ sglang/srt/disaggregation/prefill.py,sha256=crU3CZ5oITm3W9dSxIsvbPIwzOM9dPDOhPTELZcYepA,28325
94
110
  sglang/srt/disaggregation/utils.py,sha256=oBMqYOMAnyK4T69fFaDIuM1AAGa2vOvoA-CBtGocOkk,12263
95
111
  sglang/srt/disaggregation/ascend/__init__.py,sha256=-lxnica6fZYmYNpKwmE8yESUpQ5Sxf2DiZoBHzboKc8,146
96
112
  sglang/srt/disaggregation/ascend/conn.py,sha256=Z0xTJjSYXal7uGA5e7ci4oxOcWdC9qrV-gMd06ikp2w,4109
97
- sglang/srt/disaggregation/ascend/transfer_engine.py,sha256=JkalkQUFCwdCjJ_k8hxJqmgJ4CfxgiQzHzplP1S6xqE,3577
113
+ sglang/srt/disaggregation/ascend/transfer_engine.py,sha256=MK9G22_YUkvpaH4XVvKe1iz7F-bzhOdtYaVQ2jKiY2s,3567
98
114
  sglang/srt/disaggregation/base/__init__.py,sha256=4VwUv0aWxwmVL1049XK82aLTNxmt0WY5RPy9li-wyVk,160
99
- sglang/srt/disaggregation/base/conn.py,sha256=0CGEv-B24woyDBdEgQwT8Gqz10Uox3gCgWiCxznXkwQ,2912
115
+ sglang/srt/disaggregation/base/conn.py,sha256=SvNYNFIjC0adxt0vs3g80P-vdVCleBPE4VKs0-hUIz4,3271
100
116
  sglang/srt/disaggregation/common/__init__.py,sha256=7yl-EGLMVKRpBUaGF_7lwAsw2J_mqpRZV0238VGxD9o,126
101
- sglang/srt/disaggregation/common/conn.py,sha256=PiYuKGYVeVxoPaQcUK673IGelN9XnK7fyHSb6y6mptY,24415
117
+ sglang/srt/disaggregation/common/conn.py,sha256=mlZJnlsvdS2WxapGtMhV1YpE9M9zLm2NXPMNuI7PSFo,24443
102
118
  sglang/srt/disaggregation/common/utils.py,sha256=SxRhAWisNK8seGhb5BXBJ5u53DF7yeKVPMWPcB5ywbE,1194
103
119
  sglang/srt/disaggregation/fake/__init__.py,sha256=jJGWdXwaQiGIoR6atKqkQfkJmVyQ09l55VUN2WjwaeY,77
104
- sglang/srt/disaggregation/fake/conn.py,sha256=qsN5SEQLMenALxYC3x7GYZprhUQyRje5ldNwjkT6OPw,2283
120
+ sglang/srt/disaggregation/fake/conn.py,sha256=C5gYCsqf-CfffDhqzbp4FL1GQ3xFo_OvKkcC4W6R1OM,2502
105
121
  sglang/srt/disaggregation/mooncake/__init__.py,sha256=0TgqkAdQI1YynbHY6c0QISvVoOSk-0SwCIq5rjPSmgE,156
106
- sglang/srt/disaggregation/mooncake/conn.py,sha256=01TcfkekA3v7ApN11ATx_YsFi6B5U1xd3yPDxRx6F9Y,50697
122
+ sglang/srt/disaggregation/mooncake/conn.py,sha256=ruE4Rb0dPIhAmpQEKkePgnyRDG0xMbySgsrCb7wFIh8,56422
107
123
  sglang/srt/disaggregation/mooncake/transfer_engine.py,sha256=O-XRmQ3QwD6RuiyRgw4ZohSrFkuPdppV_eDBMUXn0jk,5884
108
124
  sglang/srt/disaggregation/nixl/__init__.py,sha256=qODVPIGWUXKXq4zsRIcMYoAoAeg6nBIN9vdQOlVMANE,136
109
- sglang/srt/disaggregation/nixl/conn.py,sha256=_si9ryeRoDHYmomthSyztUOEYl20aa18mS9_Sm961S4,32299
125
+ sglang/srt/disaggregation/nixl/conn.py,sha256=w_kDDEB4fIvDe-Z7ufxmw_cpDR57xXJVQrqWvYe88vo,33788
110
126
  sglang/srt/distributed/__init__.py,sha256=jFOcyt-wFAPMBUAf9zkZalNQlt-4rqmT6pCKBz1E4qo,149
111
127
  sglang/srt/distributed/communication_op.py,sha256=IBnFUdMftK_VSTMMMitGveonorFUUVNL4guqO31cMSc,1130
112
- sglang/srt/distributed/naive_distributed.py,sha256=5Kcfapzz61G3TtScTZrHoWa4bf6Vr27GlMcBAGMz7tQ,3260
113
- sglang/srt/distributed/parallel_state.py,sha256=m0T-Tfqi7DnCUPEGhA8Fr-dNlbeoowvG3Ds60IoDeos,68541
128
+ sglang/srt/distributed/naive_distributed.py,sha256=GX7CHhUb9rIQuaIPX4TYm01S7XQdBXvdqaJoPdxFyAI,3317
129
+ sglang/srt/distributed/parallel_state.py,sha256=SHisHdAql3dVBFUR1zIZo3apQMejRPh0hQYn5AaA9N8,70931
114
130
  sglang/srt/distributed/utils.py,sha256=aaCxATncLGnVgB0WlGpBdee0behKW8Dy_dakqcuKSaQ,8497
115
- sglang/srt/distributed/device_communicators/all_reduce_utils.py,sha256=IxCuujkRVUGckr-PAhe2F_QfHGKhvQHo9ryB9-CQjpA,332
131
+ sglang/srt/distributed/device_communicators/all_reduce_utils.py,sha256=dk-uFaKZgVG-1dZDwMT6GvpFi2xP0DJRJ9BiRjHq0zw,336
116
132
  sglang/srt/distributed/device_communicators/cuda_wrapper.py,sha256=3jvPG-Ow5UBLiXhfx8T8snR7crSZbPpARAggsDPWq7k,7038
117
- sglang/srt/distributed/device_communicators/custom_all_reduce.py,sha256=Q1kkKPKFPV0QMmKLyjOBlOnX8-Pr4UeGBZYkG6j0gc0,16570
133
+ sglang/srt/distributed/device_communicators/custom_all_reduce.py,sha256=RCF9FzJYI9EzlNEDUZB-uL_0VKjTqNn0_MfZED-0RhA,16615
118
134
  sglang/srt/distributed/device_communicators/custom_all_reduce_utils.py,sha256=Fx9D70NO2dplyuqOxTasMwkzONN3wfC4WOny3tWSbPA,14159
119
135
  sglang/srt/distributed/device_communicators/hpu_communicator.py,sha256=gPjEH1-izoby5uDrfUlzNf21luPT0Ow7pJjhCRKnHy8,1728
120
136
  sglang/srt/distributed/device_communicators/npu_communicator.py,sha256=bRXN1Md_4SHQGzQYZa2GrHv2zbIU5vSpkueHiAZL1xQ,1345
121
- sglang/srt/distributed/device_communicators/pymscclpp.py,sha256=8Pgehd02v-BpHixTTB4OB9ZlxA7fyXiPF4Xp9F_heyU,10890
122
- sglang/srt/distributed/device_communicators/pynccl.py,sha256=7aE-pKMyJfawGo7Vzymb6Nlz3ux2G_dPflYPK2kzpaQ,12208
123
- sglang/srt/distributed/device_communicators/pynccl_allocator.py,sha256=zAxWwI73ZNsF_c4PZUnRMzwzSD88v26w8komzZ4Uatc,4771
137
+ sglang/srt/distributed/device_communicators/pymscclpp.py,sha256=8ujiWibMH36TGh0kWnJKcP_AqaVAX0dYhJHtZemRefM,10874
138
+ sglang/srt/distributed/device_communicators/pynccl.py,sha256=TqczleI5orlLfP3UkhccOIQexh_ih1b98kqUxtE42jY,12813
139
+ sglang/srt/distributed/device_communicators/pynccl_allocator.py,sha256=jNvIJiYPiEJYV6Q0kvcdbYZfxjh7wq0yWiRJuWWzYi8,4756
124
140
  sglang/srt/distributed/device_communicators/pynccl_wrapper.py,sha256=BLGEl90GZSl3K-04x7eCTaVmpZBXpcb7uJakAseteFU,18539
125
141
  sglang/srt/distributed/device_communicators/quick_all_reduce.py,sha256=4j1_E4azoxfd8wxtfFmt9rvbQncl8ny6wmTMl6gAkp0,9932
126
142
  sglang/srt/distributed/device_communicators/shm_broadcast.py,sha256=q68niUgh8zF7CgNwqny9vaZU1aHGpLSrxBMiUWZ5Nsk,20969
127
- sglang/srt/distributed/device_communicators/symm_mem.py,sha256=EFN6v2l3Hrxek_1kxDHMMmzLP-bDswhdNW53FrQm2-I,5664
143
+ sglang/srt/distributed/device_communicators/symm_mem.py,sha256=MauP4LGMIKSfoDx-L8o0kaXg7rsAuVDT92ugjlM68xM,5641
128
144
  sglang/srt/distributed/device_communicators/xpu_communicator.py,sha256=ajW6132BvA6jkeipEIgN27TFycI0U06Ih2Z8WNjlA4s,1593
145
+ sglang/srt/elastic_ep/elastic_ep.py,sha256=KaSUAi0JHB82desvcv-TW5_PYCrzQStslOCcl9_g-LM,2311
129
146
  sglang/srt/entrypoints/EngineBase.py,sha256=yKN76witT2jz1zhmLHmPNLGMpK2UiOTaKQ2KPD8l99U,2594
130
- sglang/srt/entrypoints/context.py,sha256=aD-94xkD0komuGO5gtYUoJKCHdc4hAipMxQt04yVRGA,8030
131
- sglang/srt/entrypoints/engine.py,sha256=hDuQJ5XheUZNfScFRBxKHEev_gDTiKH3f6gKtcWfj-U,34950
132
- sglang/srt/entrypoints/grpc_request_manager.py,sha256=0tVlP5eRgQTk1PGWsQtzNrlqd3-HJp67yu3o6jRkan4,32273
133
- sglang/srt/entrypoints/grpc_server.py,sha256=WjToYISgaWQwlmUz6-1PxMd84YPGmTPpbdKvNiukt4A,31208
134
- sglang/srt/entrypoints/harmony_utils.py,sha256=01T-A5GBUm2b306PcxNEg2rfx4cykBcqNYrzcXTWBlc,13590
135
- sglang/srt/entrypoints/http_server.py,sha256=8f9fJhaXGEGwMCsLp5B2Ukk_MDd5dNRYE8NJ5FbLKk0,52423
136
- sglang/srt/entrypoints/http_server_engine.py,sha256=_--j4U04OeJLlnnv1f0XmCd_Ry0z1FlhkrbePX8rYV0,4938
147
+ sglang/srt/entrypoints/context.py,sha256=YQdVLmELQD1tNT6Q1BLl04sATwTJAAomCATZyD19S8g,8035
148
+ sglang/srt/entrypoints/engine.py,sha256=yiIVBjbMLgL1s5A19bShgeqRdAQlv3OGfz5swHNTunc,35010
149
+ sglang/srt/entrypoints/grpc_server.py,sha256=CHiZDErgPHnVp8PtfH246U6Eq_BEoKANJKAttNYXjBQ,38869
150
+ sglang/srt/entrypoints/harmony_utils.py,sha256=FhpPFnwgy1-qLnu_HZAk5V_RPmQkT81dFVp8A6xINEU,13594
151
+ sglang/srt/entrypoints/http_server.py,sha256=Y1Rl71phsasv8Tot1wlKl1GpJK2b_xqT_EqPEfjKOTM,56378
152
+ sglang/srt/entrypoints/http_server_engine.py,sha256=rWgdCYLZZP89MA-Y-hfACQqdDu0LC7lLYghi2wk-nU8,4809
137
153
  sglang/srt/entrypoints/tool.py,sha256=aAXEjBqkr5j6_IgRL8fZCKgoDPY2TikM20-LQXU9TaI,2709
138
154
  sglang/srt/entrypoints/openai/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
139
- sglang/srt/entrypoints/openai/protocol.py,sha256=UmPdjkfaFYP2X5NYI0rt8L1w2pdqGYsIcIiCO1bnF7Y,33216
140
- sglang/srt/entrypoints/openai/serving_base.py,sha256=b15N627nn3me2jHzXJBFkWPpX8OJdtD66v8aSsx0i0s,7746
141
- sglang/srt/entrypoints/openai/serving_chat.py,sha256=w1awHs-msdhKEzlMHUA_e_Ptx3qlUcdiUGVLq6ryYfs,49829
142
- sglang/srt/entrypoints/openai/serving_completions.py,sha256=SBoaa9KIIL7NQCWwB1B2A9roTrQW1P9C4fkhuHymo00,18233
155
+ sglang/srt/entrypoints/openai/protocol.py,sha256=NkK_i-Njzxzp_FIVFoOJXonz0kdYLtf_crLBuj69LoI,39612
156
+ sglang/srt/entrypoints/openai/serving_base.py,sha256=-L4lcJCTCJPEmtYHtQXLFgJnvJ3CbUp80uyEI0X_C6w,9665
157
+ sglang/srt/entrypoints/openai/serving_chat.py,sha256=NQs4XRPE7JEV8Mmpe1XSVWKD4VQxr8Fcw1ItLUeO3jA,47908
158
+ sglang/srt/entrypoints/openai/serving_classify.py,sha256=ifEjD-2rq7izbgITMB_nZkrUDN8wj73ZMV634G_HJ4U,7148
159
+ sglang/srt/entrypoints/openai/serving_completions.py,sha256=-kTg3BYaKLmnneKh-1_2QVC0KPg1e2VV1DEKImG9KpM,18831
143
160
  sglang/srt/entrypoints/openai/serving_embedding.py,sha256=H7Nv1vSUuyOUXBeaNvYB4XMFxmcJc8or7MUKyuAw_XA,6435
144
161
  sglang/srt/entrypoints/openai/serving_rerank.py,sha256=G79XdomjzLhH1YCbGR4alSxWO9NNmi7U-YSPsH61cjk,3379
145
- sglang/srt/entrypoints/openai/serving_responses.py,sha256=ro1VwdazJNqm5RRVbMKI7NliPsVMFcrNEsRD23QiADc,54989
162
+ sglang/srt/entrypoints/openai/serving_responses.py,sha256=LDnLzUHpNrIibmUWlqCAtosUg7X3G-AIOvnUJ6etDwg,55122
146
163
  sglang/srt/entrypoints/openai/serving_score.py,sha256=LuwXzWRAMm-xMK8ZjP3JaJ84Gxjr0Oi-e3keCsIgK38,1992
164
+ sglang/srt/entrypoints/openai/serving_tokenize.py,sha256=kgLBC8a_j16T2Gm5nv4DaUjjt9voerrbe-LrB5hJz-0,5525
147
165
  sglang/srt/entrypoints/openai/tool_server.py,sha256=rRNGELPV5RHONp55MYkO4_b0NPsPffJnWg-gMYwDSTc,5659
148
166
  sglang/srt/entrypoints/openai/usage_processor.py,sha256=9LTB5rqdRuMKyZrIXiUBuF_WKaSg9X45YdzERDxbtCY,2746
149
167
  sglang/srt/entrypoints/openai/utils.py,sha256=DT9quW0F1DX1P9NAuMxpERgXcNYKKtm7rd7J1m7EaDQ,2112
150
168
  sglang/srt/eplb/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
151
169
  sglang/srt/eplb/eplb_manager.py,sha256=e8HMGzZb2QFRGdS7JZIFSy8cOIlxOlGRY-ef7Wei0Sw,4364
152
- sglang/srt/eplb/expert_distribution.py,sha256=gd3PktGCSqHLjB5XHhTSA-OtaDVYw-taExCe7NOHM9E,32939
170
+ sglang/srt/eplb/expert_distribution.py,sha256=lU1Pw8qVooiyv3LPIW1Jec09wLs22_eKdxs0kuS6vgc,32901
153
171
  sglang/srt/eplb/expert_location.py,sha256=WoOmsZ4u9le44km3nbjJjF6BVBxN3cKRz9nQM0uWH_s,18386
154
- sglang/srt/eplb/expert_location_dispatch.py,sha256=vA0o-7bXf847BQAVCqElWKEpofZLAIsir_d0pew2KNQ,4178
155
- sglang/srt/eplb/expert_location_updater.py,sha256=ScoyCJbtJNQLriQXJNZTV2-5G8-tR3AocZDK3ujMaJk,21172
156
- sglang/srt/eplb/eplb_algorithms/__init__.py,sha256=c6fo4qM8N0p5DyyfGp9fxqc2wkxvzSJBzJFRG1I1leg,1959
157
- sglang/srt/eplb/eplb_algorithms/deepseek.py,sha256=mMZT7zAAArccdRS0xXxifvMb3qn9enSt426uUTKeiq4,8340
172
+ sglang/srt/eplb/expert_location_dispatch.py,sha256=mZUH-jvz7yvxC-5bwMFQalfKbbJiZujMiRK_M9oGOT8,4163
173
+ sglang/srt/eplb/expert_location_updater.py,sha256=7LOmLtY_YWYySI2GgFuTJ__Qde0LEKq70E77Q608OFU,21157
174
+ sglang/srt/eplb/eplb_algorithms/__init__.py,sha256=FBO0vEaWbpURbrSV6Uq753Zm2ukiCTUkDvOd292xU_E,2695
175
+ sglang/srt/eplb/eplb_algorithms/deepseek.py,sha256=LHEW_v5vA6FgH-oFqG4Cu113T-5ZPVdGV791MrM4K20,8293
158
176
  sglang/srt/eplb/eplb_algorithms/deepseek_vec.py,sha256=Vzy5Iarua1VgVHzjBNZaVV_vt1LY1BLtJz7PmzB701k,10654
177
+ sglang/srt/eplb/eplb_algorithms/elasticity_aware.py,sha256=x6ab8G_CCaUnkFDmI6JdzQqaNIXyETW1oCsCx4PPxKY,3230
159
178
  sglang/srt/eplb/eplb_simulator/__init__.py,sha256=HIZaXqsvsOCMMJ81dSs1afSGZ5G6OiOZEtHpltyzzjY,21
160
179
  sglang/srt/eplb/eplb_simulator/reader.py,sha256=OlsWqsuXqVQY7PfvvrP-vsl2Ww2Kg4vD_K9BltM_QHo,1828
161
- sglang/srt/function_call/base_format_detector.py,sha256=DunwyYJxLcwrD-iHDXX9uqJ5S8zMJhUXfzHiBgbXaZ0,15728
180
+ sglang/srt/function_call/base_format_detector.py,sha256=pQjF8ri_i7wc8diX-sGC4FkKi6eOqSUUi39Wu2Q3-AM,15585
162
181
  sglang/srt/function_call/core_types.py,sha256=wLUsW8mUA-i-ISz5QUDL7Ejq72W-K1HIhFa9Wm-_oA8,786
163
182
  sglang/srt/function_call/deepseekv31_detector.py,sha256=hpRjjv219mH0v1PQpMvj_gezrP7PwvLiNbBKOTCSC3U,9731
164
183
  sglang/srt/function_call/deepseekv3_detector.py,sha256=DhO3tUX1nvFlfRkHJ1Vm_7OMXFFTvWBA9u9SZKFAwuQ,9710
165
184
  sglang/srt/function_call/ebnf_composer.py,sha256=OpjfvYowLlMLnxz5fwS7zv5-d43_ZwO9ucGAMsILvm4,15321
166
- sglang/srt/function_call/function_call_parser.py,sha256=NUQCh7dMwRTkudRDFz3Mdr-nDL_zXqABVQYPocGI274,8592
167
- sglang/srt/function_call/glm4_moe_detector.py,sha256=fUqozcc_V2g4Vd0l3BjhZZ0MRKmLinx98-Gm8aOlVgI,6975
168
- sglang/srt/function_call/gpt_oss_detector.py,sha256=f0fjnxNKLb_TrxvNWbmCOB3_KN07NtZacazFpyIcqC8,9262
169
- sglang/srt/function_call/json_array_parser.py,sha256=i985g7MUHj1M8gJ0it3Lw663Bx1uh0biN_It13hnMxU,2227
185
+ sglang/srt/function_call/function_call_parser.py,sha256=CXP_4OEo0M9aE3vXMW-m3VJTq9uVhM2w3NOcnnmXjuA,8762
186
+ sglang/srt/function_call/glm4_moe_detector.py,sha256=B4GjjgoDVc4ETyqCowfWQamIhhUDwl6pA9xsAE3sOfo,6943
187
+ sglang/srt/function_call/gpt_oss_detector.py,sha256=ti5Dwci_3J9XzqQetMILY7R-VTCCRbGbHas3DdC5x28,9263
188
+ sglang/srt/function_call/json_array_parser.py,sha256=m37S_3bQtyAI86T3ju80dkKJxuazA1VV0J5ioK1uQbw,2205
170
189
  sglang/srt/function_call/kimik2_detector.py,sha256=VWN4Nf9l9O0uSUR0UppuoAyVObvGw-rVvklFJ1qzbRA,10641
171
190
  sglang/srt/function_call/llama32_detector.py,sha256=trZja7IXc2IWUko5PRj7p4pRU6XCVjtxr-7qJNr0EWo,3647
172
191
  sglang/srt/function_call/mistral_detector.py,sha256=Ts2HrJdu5r2lCCMVKPZfnCds9pt1K5H1EaOQrF_HD60,4686
@@ -174,121 +193,133 @@ sglang/srt/function_call/pythonic_detector.py,sha256=yAatItKtVDf9uhlB78wPWKP3fbe
174
193
  sglang/srt/function_call/qwen25_detector.py,sha256=nv83_sipZMU6Vie3J4HeNiZVCSRU5ei7601j50779HA,5181
175
194
  sglang/srt/function_call/qwen3_coder_detector.py,sha256=fyiF0WkNwozlKZQy0G903hj-ZAyvEgkFC8l20FVOVX8,14299
176
195
  sglang/srt/function_call/step3_detector.py,sha256=SAibrispu0peDQzqOG2-V93KGHtV6Ud7a38vlnhTunA,17442
177
- sglang/srt/function_call/utils.py,sha256=HeRwtWRrkwipIKM_EBfCgyNxy2It_7kAfPUcBhMERjU,4548
196
+ sglang/srt/function_call/utils.py,sha256=P-iT81YRm1zPV7Y19bkQq5VcV15-XLF1AwoeXWI7Nig,4552
178
197
  sglang/srt/grpc/__init__.py,sha256=dPeDsMRMW8WyHD6jolIpIlvlJsYLAhwewHhCTdu1MAE,21
179
- sglang/srt/grpc/compile_proto.py,sha256=kiaVgK1eEcSMVd5mCed-5cs_78JIawjJ1jQ2U6mdYkg,6997
180
- sglang/srt/grpc/sglang_scheduler_pb2.py,sha256=Q0QVnMvRovwWpFmd3j2-fNLZfuvX_4Hq8iRKM6sz-s4,14182
181
- sglang/srt/grpc/sglang_scheduler_pb2.pyi,sha256=RN5UOWYzxPBFUUcWAaiXPeOB9iclizo7ehFzNrI5P94,23095
182
- sglang/srt/grpc/sglang_scheduler_pb2_grpc.py,sha256=s8WXOFE0a0zGkcfVUxHxa28yA8VOZxua5K31dEXqt_A,9051
183
- sglang/srt/layers/activation.py,sha256=iWEi9wIdAf0xov0KU27JUB5FIl6dqCGQjbIm_9dVSfQ,13368
198
+ sglang/srt/grpc/compile_proto.py,sha256=ZRH11Wodv4BbYo0F-JqA-ymIM-FwkkiAjwM_7msI2uA,7011
199
+ sglang/srt/grpc/grpc_request_manager.py,sha256=ZX4p3ewoUAd9vGG3lNKv9MknFV4BtXJQtP1u8hDJrKk,34849
200
+ sglang/srt/grpc/health_servicer.py,sha256=6h0JFrvVKz5hRBh3pzz_N1Hsj2WgM_Kyd7kfHuJqlDI,7278
201
+ sglang/srt/grpc/scheduler_launcher.py,sha256=GMuNCfF4MYYjJL3O8NqQrg1N9P7T2QyRmpxxXOAYeDw,6563
202
+ sglang/srt/grpc/sglang_scheduler_pb2.py,sha256=ALq0gD19OUC4CdjbOU2YYHGmgTlkJvWX3exX_SOXSv4,16016
203
+ sglang/srt/grpc/sglang_scheduler_pb2.pyi,sha256=ibYeIZPchbx4fcLDeAa-LSnq6MZi-mh4DgzIGg-SUWY,26274
204
+ sglang/srt/grpc/sglang_scheduler_pb2_grpc.py,sha256=8FQtALiqSyWkqL6P_rKerievE9q19V3675AEEomNSe8,12633
205
+ sglang/srt/layers/activation.py,sha256=Qg-goR7CSwQeBhS4IO56wCA7jMR_bPNZJHnLDZNnm5s,13407
184
206
  sglang/srt/layers/amx_utils.py,sha256=1mENgHK2B8mgaD1oMtgbZ15Jmy_Uu1QueBmo09Ff2iA,2865
185
- sglang/srt/layers/communicator.py,sha256=KzmCXRknuxlRnwdA3G38wRlVHYD_kf76mOZWhaIU5lo,24366
186
- sglang/srt/layers/dp_attention.py,sha256=ly-EMgb_I0neGA0Y4Hq9Z_sp1plIRwoBM3feTqLJob4,16322
207
+ sglang/srt/layers/communicator.py,sha256=dmoydeyHoiVQCr1PvMcTwM1Kirv71PZOa-JSeVD6n50,24465
208
+ sglang/srt/layers/dp_attention.py,sha256=dBfEtofjY9MlCDF5B-y_zrX-owfZ46mSBYioCzlIoHM,16817
187
209
  sglang/srt/layers/elementwise.py,sha256=tGbN7bbK2s-j3DoJeJfkfyPNmKdVAutAd0J3TbxUPAQ,18849
188
210
  sglang/srt/layers/flashinfer_comm_fusion.py,sha256=hnVVS_VsWukTYhREubWs2KcJ1GjVMEI9ECqxqOMXZv8,6729
189
- sglang/srt/layers/layernorm.py,sha256=WKAv4N6LFDLu9x62XBqGT9xEcrj2W53GtP8ji4zTbTM,11335
190
- sglang/srt/layers/linear.py,sha256=z15L32URxbPUb34_urGDwSWIZNfh1jmyKUF1A9lzI9I,55761
191
- sglang/srt/layers/logits_processor.py,sha256=BYDSuqVCrpo67JFCSvmATfegVwgtJ-2_Bgwp23y-Ds8,28094
211
+ sglang/srt/layers/layernorm.py,sha256=Kf18oGBMTyqjaeeTJMeCYhyrQb-8NsSjhG0QDswM8rM,12334
212
+ sglang/srt/layers/linear.py,sha256=1g5vEFHqSd1TPb0VxQiZ5oga45QorYxvj2CZl_NM9wc,56084
213
+ sglang/srt/layers/logits_processor.py,sha256=VNMPpyxVNNXtOxd9nui0Yrm8MUkjrGBEL1cmUYXLyM0,34499
192
214
  sglang/srt/layers/model_parallel.py,sha256=eLXZhvJ4wG6dh0FontNCIdVZvHYdWgaeY-5cu7TD9tE,6078
215
+ sglang/srt/layers/modelopt_utils.py,sha256=Abhiwmu1VOoSePJWytgFxRw_6qTtN2rqT61DPDboCIw,335
193
216
  sglang/srt/layers/multimodal.py,sha256=vNswe0J0maeBiN8ehlmxfs-YYlrmMllYl6Nc_Y57Neg,5114
194
217
  sglang/srt/layers/parameter.py,sha256=6ce1lx2urWJKz87g2qg_oce_S5BV0IcguSiOGGHbcC8,18378
195
218
  sglang/srt/layers/pooler.py,sha256=uZ6WX1FLMEafZwusyZdm6KuVlIwSjbKrdwk2qzgqNGk,3812
196
- sglang/srt/layers/radix_attention.py,sha256=MpugwaqiY2zPTeg7FVW41OljljCXmYVvHZ2MvneF6PI,3745
219
+ sglang/srt/layers/radix_attention.py,sha256=HvTa-gSz86XdN9mcK7H3lrQXjGfAMnBzI1lM8WKaIUc,5203
197
220
  sglang/srt/layers/rocm_linear_utils.py,sha256=7PPh-5H2IYjiLp_g_szzVBsmiMacZ1RtjVtjdrdFJKI,1374
198
- sglang/srt/layers/rotary_embedding.py,sha256=D6X_HmwtGShR_XKuOBPXtRSmfrUU_VMuJ58HycmRUxY,75058
199
- sglang/srt/layers/sampler.py,sha256=C4iNOK42sfUGKhA9xBZA4xXHDsciC3V_5aPoJr-kpJM,19805
221
+ sglang/srt/layers/rotary_embedding.py,sha256=ZekORUqqnej3PP8-ETIhvlkweLMhrP1nZTH4Qz3fB-E,101467
222
+ sglang/srt/layers/sampler.py,sha256=bnfa0jtHBWcXeDALGGYR6t1DOejaG2LBqgG6kmXP7Fc,20632
223
+ sglang/srt/layers/sparse_pooler.py,sha256=9gB8duR48R-FGtA4Q7D1fIDSvbKlD70N38S3Lvg773s,3424
200
224
  sglang/srt/layers/torchao_utils.py,sha256=Ws24FdRBSkTpyeyA6bQrdDm-W5wfDxKvSIPUSahyMfA,4063
201
- sglang/srt/layers/utils.py,sha256=58yO8aKsAvS0jJ3nhOWVR_WAc5oTFiMeAERWNkXGR-I,1945
202
- sglang/srt/layers/vocab_parallel_embedding.py,sha256=x0421kNUgnAb5LnkJR6O67vGZ0ikSD-ThluV3QGsZ_8,22673
203
- sglang/srt/layers/attention/aiter_backend.py,sha256=oovonzjvnijaegNmkyTlWlEhCuhXAMNd85EykvKvvow,43923
204
- sglang/srt/layers/attention/ascend_backend.py,sha256=JwbuW4a-urczuVHEP7oRGOehJOcfUO71LCG3BiQq-zA,27206
205
- sglang/srt/layers/attention/attention_registry.py,sha256=RT9Z1Jg0pM65FO08S9Vs3K_7BxfOYpFsgbl3_FZ-uZ4,6795
206
- sglang/srt/layers/attention/base_attn_backend.py,sha256=AGCPd_VqvvZ0tLExCEs_9RenwhP7nB47nNcbR9VuSJw,3831
225
+ sglang/srt/layers/utils.py,sha256=F_hhE514OZ4cyMklga3mipdUzlrKo3SolIcuqgqqQqQ,1913
226
+ sglang/srt/layers/vocab_parallel_embedding.py,sha256=jPZ6H45qD6ieWV2TqU65YzSaJwRWURoJQ1J-6eOOG-E,22737
227
+ sglang/srt/layers/attention/aiter_backend.py,sha256=bv9yGDu-4oLZlA3A00GDpOWU84cLJ97cW08aVoGEjn8,43935
228
+ sglang/srt/layers/attention/ascend_backend.py,sha256=lb3ZmNZmEqnmf3zng38sA48NBBLn9M9lVXW_UdB6SNw,27892
229
+ sglang/srt/layers/attention/attention_registry.py,sha256=OpiNS5eGkYK05lt0L6zm0NfHZFQKyI-fGtLl3wHqONk,7505
230
+ sglang/srt/layers/attention/base_attn_backend.py,sha256=oYk0ch5ptL2EtlhjyitKvu6H2qCHvrXSjUJVJgPnGd8,4495
207
231
  sglang/srt/layers/attention/cutlass_mla_backend.py,sha256=cb2dMTnDMmMVBG_lqFRciVDiF3PeEAcXYaKDFWszeTw,9849
208
- sglang/srt/layers/attention/double_sparsity_backend.py,sha256=2ZRL_gYz14idoVqQzeQ6N77nXer0f_8_TUYw40XUUz0,9161
232
+ sglang/srt/layers/attention/double_sparsity_backend.py,sha256=wkF1GxFuLsGUWYoPWoqdz0xpePqA_nbo7xd2ha67sng,9135
209
233
  sglang/srt/layers/attention/dual_chunk_flashattention_backend.py,sha256=20vmnq68-Cq62UWIzQU_uwJzq4B8KdJeZUPVoWPiyDs,68620
210
- sglang/srt/layers/attention/flashattention_backend.py,sha256=nuOTQ8Zl2anCrNYDLoDiBhCkd3XE4UAA9ZThcY7zFOU,105158
211
- sglang/srt/layers/attention/flashinfer_backend.py,sha256=3tX5ThHhH4Za0jhONXxxViUxN1sYmuqkdOOD0TGq9Go,52247
212
- sglang/srt/layers/attention/flashinfer_mla_backend.py,sha256=hEoTNUHPM1LJXMPNVY9FGazUnord_Bmr5WsQY0mxRx0,39403
213
- sglang/srt/layers/attention/flashmla_backend.py,sha256=QqQgWIcF90wVqcvsxJR7lHtCtAqkNd9Rdl-tLq7cHHk,20852
214
- sglang/srt/layers/attention/hybrid_attn_backend.py,sha256=Mp1M83ODwHENVvefP2JEjv47ifDt5SA1hoyrJo4OJyU,5128
215
- sglang/srt/layers/attention/hybrid_linear_attn_backend.py,sha256=e8O2h82ZDwgDEXt8QF23IznOY3vq1-LB9vcWum7Y68k,21938
216
- sglang/srt/layers/attention/intel_amx_backend.py,sha256=IU_E7HkPrBLfNG2ArhI1ozHZ_pROujUzdI6g2JuToL0,4154
234
+ sglang/srt/layers/attention/flashattention_backend.py,sha256=0bbODTKS-DADucy-GmR_1LQzwezvXuXGuP21Y6WH5EU,105314
235
+ sglang/srt/layers/attention/flashinfer_backend.py,sha256=R06qwUhhfeBL2qAD1CRS9KzmdoiGxO10QjAoAouNDjA,63332
236
+ sglang/srt/layers/attention/flashinfer_mla_backend.py,sha256=LrhlHUVn0ZlvCIhK8iAjqEEqUUvRydJn7TZ7Hs4o3B4,39462
237
+ sglang/srt/layers/attention/flashmla_backend.py,sha256=HijFHZZ-pGE75NytFXsS0MIv8d-zWJGRRdfjdF1ViJ8,20860
238
+ sglang/srt/layers/attention/hybrid_attn_backend.py,sha256=_Gol1e_m6vMKhpUw2-OQ37ymC5sIuSTntDylVKSZtpA,5121
239
+ sglang/srt/layers/attention/hybrid_linear_attn_backend.py,sha256=tqwPna30r1zriVhKlit-iVfpfy6hJGxumGKsnlJ20C8,26119
240
+ sglang/srt/layers/attention/intel_amx_backend.py,sha256=8AcbJn0u8ifvhml9iocDzjrtzLEj0oJ7V7bOmkQPefo,4168
217
241
  sglang/srt/layers/attention/merge_state.py,sha256=OnWmNV6LYTUj0y8SCy_IK7A9q6v9bZwR4_XiLOIvbrk,1423
218
- sglang/srt/layers/attention/nsa_backend.py,sha256=yyN3TRmPyxDBaYKsV-c5upK_wEVV3MyjJocw20DCAVo,33190
242
+ sglang/srt/layers/attention/nsa_backend.py,sha256=68NXSaTzqQKL7aVSgmWgDRgPc0OYI3HNU-f9JsEV79E,45516
219
243
  sglang/srt/layers/attention/tbo_backend.py,sha256=MyEQ29I41LCOHXm4_g7J7sXSs5bNKWRlSa2EfqploD4,9185
220
244
  sglang/srt/layers/attention/torch_flex_backend.py,sha256=MnnZLxi41R-d4P0cyklNyefSWOU-AdFEjr8pxJWNgdI,11711
221
245
  sglang/srt/layers/attention/torch_native_backend.py,sha256=NdWD2ArmS1lQN9mZIbS2rcHueBWColNxvhcLaQGAKGQ,9728
222
- sglang/srt/layers/attention/triton_backend.py,sha256=3nIh_oQXVPDZw07m-bkXkAAddW39exOxzNMCDQbc5YA,43564
223
- sglang/srt/layers/attention/trtllm_mha_backend.py,sha256=l6ZbRIZ9Q4rHbsULJ49_MKd32vWdr3IRF5Pi8Dnzv0M,27503
224
- sglang/srt/layers/attention/trtllm_mla_backend.py,sha256=k3e-tD-YjiVs8kOzEXaakCI7g6MDLD99NXMtAscrBZY,29396
225
- sglang/srt/layers/attention/utils.py,sha256=lx_jNw2VwlBe2VnDb1eXRRdN9WArw9rdWHTHqndUEFk,3174
226
- sglang/srt/layers/attention/vision.py,sha256=F_dBh1DpepBt97JOhvQo0sI9tSKBU3w3LOxLT66wBQg,21780
246
+ sglang/srt/layers/attention/triton_backend.py,sha256=30z1z_aJ9jUKGG3rc-2DI6h-3HO3w3hVpcFM18BVSQY,50504
247
+ sglang/srt/layers/attention/trtllm_mha_backend.py,sha256=IQUu3jkCuAY5foqvR6L1IYjjVD4qfmTwG6rfo05ZVkI,27516
248
+ sglang/srt/layers/attention/trtllm_mla_backend.py,sha256=7ceisj7_0X9mK1dDheEoVuIXHsMDjptoaw9HycBVxYQ,41679
249
+ sglang/srt/layers/attention/utils.py,sha256=uRyxLjpRMVesPDFtGHtzJDHQvWhS4AsGW5RGCsIYPBk,3230
250
+ sglang/srt/layers/attention/vision.py,sha256=-MX_K0_mX58xkpaS6O93vWIJVqha4iNgYNN5M5Yptnw,21763
227
251
  sglang/srt/layers/attention/vision_utils.py,sha256=6hPPAt8p3SOm7tgHNUesnMLxvQiKbaOM5EK6K-ig5dI,2771
228
252
  sglang/srt/layers/attention/wave_backend.py,sha256=dMsR7GsfDYgVizY8QJ94ASrxiiJ5_MNOuTUDDQzvpPQ,22915
229
- sglang/srt/layers/attention/fla/chunk.py,sha256=N8ToAspPlgR7sVJBImzpmlGV6rWsMA7aTaTa1iddcPg,8929
253
+ sglang/srt/layers/attention/xpu_backend.py,sha256=nYRnYi7ZVyeC1m5WPB8TKpux2mBxCjHOzKZ5QNnCBlo,47650
254
+ sglang/srt/layers/attention/fla/chunk.py,sha256=r8Tddl7p0ae0nH0FU1sU3EpWTtiipdzoijaTMX3_gGI,8913
230
255
  sglang/srt/layers/attention/fla/chunk_delta_h.py,sha256=Gf8RgLesGaR9GM4HTB7kDDCVirwR9XvO7O3I1HWdcuY,10681
231
- sglang/srt/layers/attention/fla/chunk_o.py,sha256=IZllM88Ap1ztEF9nOSfcx7KmRvmwIwiBMqwT9AjjH-U,4980
256
+ sglang/srt/layers/attention/fla/chunk_o.py,sha256=ngvGxIxeHhulkj_FfQgtNY0T-5cwV_4Ochc_6dP6oVo,4973
232
257
  sglang/srt/layers/attention/fla/chunk_scaled_dot_kkt.py,sha256=445twkm9l0Mu9Q_VFBIgUZQzTNLvc82gqIAe8ylip-4,4386
233
258
  sglang/srt/layers/attention/fla/cumsum.py,sha256=beIT2WTSn8Wk_wknoWM3JYQhzmzR1JJwMFzspsXvWng,8374
234
259
  sglang/srt/layers/attention/fla/fused_recurrent.py,sha256=yOSTwqcNSoPWwQD--tcCkVd2OwB5Ox0nLGnLLv8MRr8,20856
235
260
  sglang/srt/layers/attention/fla/fused_sigmoid_gating_recurrent.py,sha256=dlmOu-7DG6YoSNexT3YV8GudrFPn_RiYj-3hClWdy-c,6424
236
- sglang/srt/layers/attention/fla/index.py,sha256=kQGcR1doARV324QuA-faNoyo6u8a_wb-DfiPe_bOdhY,1050
261
+ sglang/srt/layers/attention/fla/index.py,sha256=u4yVogS7a2DrfsYwQ22t60DpO3Y7KF9eAHY1PUrfUt4,989
237
262
  sglang/srt/layers/attention/fla/l2norm.py,sha256=XOs5nGdWROp3FW4fHSObC8sa_x697yDV0jt5UKuLllE,3783
238
- sglang/srt/layers/attention/fla/layernorm_gated.py,sha256=gNAAUyRfnjf5vTx92Gkah5UeumrlgH7oCq0Tg5D_5mQ,9938
263
+ sglang/srt/layers/attention/fla/layernorm_gated.py,sha256=OJEzBNg4JQ6_Vk_ZHWnVPwy8PLbrwuBiw3rt9bLiBRc,10122
239
264
  sglang/srt/layers/attention/fla/op.py,sha256=Qc-zHwZY9-8Aw53AuuzNfpbPBwKgIvVMgtWcfJLl6A4,1695
240
265
  sglang/srt/layers/attention/fla/solve_tril.py,sha256=-Z51hFsLER_Lzn8h21WRUajbVOA1wuu5TSEvaC2AvK8,14405
241
- sglang/srt/layers/attention/fla/utils.py,sha256=yBYjW-blAsq_uZxZ961Dub3cUouIvl4DCKV9UqkQSJw,10474
242
- sglang/srt/layers/attention/fla/wy_fast.py,sha256=zf6_76vq7yYtn9Ir1Le4RVOKLaPNF_4bNST3ePuH0cU,4407
243
- sglang/srt/layers/attention/mamba/causal_conv1d.py,sha256=w1sBOwpJeDKeYK83vPaaep5Vhq2J_qey9JUaQ2vjnjU,4474
244
- sglang/srt/layers/attention/mamba/causal_conv1d_triton.py,sha256=M04m2D13KhSCvsC37vuslNpwbgS4HLaJwWzyWjqev2E,37539
245
- sglang/srt/layers/attention/mamba/mamba.py,sha256=HRGM1fFe_MzVY-6rdkYHndsaSaQB3cOWUCow8bPQYFY,24243
246
- sglang/srt/layers/attention/mamba/mamba_utils.py,sha256=3-iipUQzuHPUDlWYhse2XwtiPYgcblOsiOoozkIoOZs,2820
266
+ sglang/srt/layers/attention/fla/utils.py,sha256=CxcsCXLamjIhbCuj3NUqar1LasPsGGf8WX4acXnF_fE,10451
267
+ sglang/srt/layers/attention/fla/wy_fast.py,sha256=wS1sJq23pa5xK2tUDYRO5FhLLJ5JpHWozBghDl64pYY,4284
268
+ sglang/srt/layers/attention/mamba/causal_conv1d.py,sha256=0Im_XzEA965rT5r09-bm1We1BaPgq2g_yo5nbA7KwvI,4503
269
+ sglang/srt/layers/attention/mamba/causal_conv1d_triton.py,sha256=EqiIga4XzikCKeA9wvLAcK3uTCX-Fop9GQFyzLeNAg4,37660
270
+ sglang/srt/layers/attention/mamba/mamba.py,sha256=qGGEzMVZDDG0dEdUrLxVfWhRa1UI5OLis7dVBMqUpl0,22517
271
+ sglang/srt/layers/attention/mamba/mamba2_metadata.py,sha256=6hkbWuV0do1lFXucgGusqR5ha784g5CB7P7hZaigRNM,8551
272
+ sglang/srt/layers/attention/mamba/mixer2_rms_norm_gated.py,sha256=C60rddCKuf3eD6KVt5vB60LlGD2dYiU9WZGTlEPaoDM,4689
247
273
  sglang/srt/layers/attention/mamba/ops/__init__.py,sha256=r-IpDGRIwTqGJzZoWNGyHqsqqv8oF19pNHEb7_TZR9M,98
248
274
  sglang/srt/layers/attention/mamba/ops/layernorm_gated.py,sha256=hmuL7vQ77aWFENCDsJDB7Nki5DDdMTEiQywbaU4FC04,5229
249
275
  sglang/srt/layers/attention/mamba/ops/mamba_ssm.py,sha256=aCFsiBdBDYt3D5HT0lxt6Rru9-gPYZspBM_WpTGgHh4,13680
250
- sglang/srt/layers/attention/mamba/ops/ssd_bmm.py,sha256=xZEjoVv5zdUeu_36WcS0VO9Qkmob2BwGgJ1RqQmg6w4,8420
251
- sglang/srt/layers/attention/mamba/ops/ssd_chunk_scan.py,sha256=gyph59WoRu7rEuzARSK6731b_gCKx326vZ9X-Is1qbs,20380
252
- sglang/srt/layers/attention/mamba/ops/ssd_chunk_state.py,sha256=yaZ1Hpj3XNSvFA0wSXkEBBZZKgy0441VrHgLBcp8r6w,24392
253
- sglang/srt/layers/attention/mamba/ops/ssd_combined.py,sha256=ivE3zqD31W01W7_RgpRG8Tfh11Co4mjbz2H6fWzGBP8,8909
254
- sglang/srt/layers/attention/mamba/ops/ssd_state_passing.py,sha256=lCt7NzzUbyCcnfDB2ai_agVM_hoZvfrB1d-UbFO8WWs,10377
255
- sglang/srt/layers/attention/npu_ops/mla_preprocess.py,sha256=n6iR86qvKTYY_mC1EMxMiyHQaXZ8pF9o2iNCV68BA0E,14540
276
+ sglang/srt/layers/attention/mamba/ops/ssd_bmm.py,sha256=IGOJ67TLx2WQQwDFm9jw2OU8vTZc0daVUnQF6kcu2x4,6798
277
+ sglang/srt/layers/attention/mamba/ops/ssd_chunk_scan.py,sha256=n70BQM8Dpg7_shX87ay3QvBEUO4fEcmg1OopU88KPiE,18405
278
+ sglang/srt/layers/attention/mamba/ops/ssd_chunk_state.py,sha256=Qdzx_4DIwl1-g_c24lRWKfmLTL29rxn2aRELWfuUct0,20784
279
+ sglang/srt/layers/attention/mamba/ops/ssd_combined.py,sha256=evYcNq31qo1TeaJP8Q3yttBQODici594N4kpdgT7hrQ,8880
280
+ sglang/srt/layers/attention/mamba/ops/ssd_state_passing.py,sha256=pNjxxLYw2BsTwy5-m7RhgqTZ9H8uyQFX2GQVucWU4wE,10032
281
+ sglang/srt/layers/attention/npu_ops/mla_preprocess.py,sha256=3_jiUFd2um4mOwG2FaNHWfwbRbjko0c6EeDfdlUiGO4,14554
256
282
  sglang/srt/layers/attention/nsa/dequant_k_cache.py,sha256=ie1qLy7AAipFYS0EJFrunN8Mq97D9v-noWaJBYMiv0I,4973
257
283
  sglang/srt/layers/attention/nsa/index_buf_accessor.py,sha256=jPYRgFfTdH_g83OUs9q3ncj2Y036ikBvflMjYEjrHGw,11481
258
- sglang/srt/layers/attention/nsa/nsa_indexer.py,sha256=FgK_o31MRswHX8CQiX9jPp04z_P7GgBumC91v_pRJHM,26466
284
+ sglang/srt/layers/attention/nsa/nsa_indexer.py,sha256=qTzO557wWrB7RypNvX1i5_C5vr66X_YPjEgJiV_TP3E,25368
259
285
  sglang/srt/layers/attention/nsa/quant_k_cache.py,sha256=FYl6gp16uGU3ftIHkU5vFAjfdPnoKvWOg4l7TBKkGI4,8675
260
286
  sglang/srt/layers/attention/nsa/tilelang_kernel.py,sha256=Iifd9YYEnDGkRhjK0NH-pbyTiQX0kVpJynyGwZcnH8w,31554
261
287
  sglang/srt/layers/attention/nsa/transform_index.py,sha256=0yurXIDt5EQ9k_P5g_aDXohdzvSiBQcQpCHBcNf0ZBA,4745
262
- sglang/srt/layers/attention/nsa/utils.py,sha256=qiUetSApDNI3Qz4_3-NVh_-mknU8ZHgA9sejb6PQKfY,901
288
+ sglang/srt/layers/attention/nsa/triton_kernel.py,sha256=FyInDj54ux1IctSGlPd82iq-aGY-UfXJvd1KIPO9LTI,3974
289
+ sglang/srt/layers/attention/nsa/utils.py,sha256=_Ni-gYZTx5MXbIV2i5-7MexX6N5vsZNYTY-b0GczXRI,822
263
290
  sglang/srt/layers/attention/triton_ops/decode_attention.py,sha256=JnOtqtPXEgn_T0R4gGCROx1szlAhu_G_ODNKCazz0lE,20554
264
- sglang/srt/layers/attention/triton_ops/double_sparsity_attention.py,sha256=FbgrPO5GvEGEvojV7Ss0jX7384e9vuzX2goDCQuP1Zk,31124
265
- sglang/srt/layers/attention/triton_ops/extend_attention.py,sha256=eYg4xQoH5gBkM7bjzpBIpTdcelvUK3BujJ-8eXRCm70,17108
291
+ sglang/srt/layers/attention/triton_ops/double_sparsity_attention.py,sha256=TGnhUIoTsrFmOAVspsGpG0F_ORB7EMahM4v7nl7tNoQ,31105
292
+ sglang/srt/layers/attention/triton_ops/extend_attention.py,sha256=KzkbTOStDiIb76i5F7yLRZL0ThuZdBzv290KB2FZDow,32920
266
293
  sglang/srt/layers/attention/triton_ops/merge_state.py,sha256=v9nD01a5eTnkwZxMwERtrrRfC5rs6GxkYOpErkAPcYI,2877
267
294
  sglang/srt/layers/attention/triton_ops/prefill_attention.py,sha256=waZsmpKIp8rTgFSoM4QMabJuLaB3yW6ltOzAKJksBoE,6260
268
295
  sglang/srt/layers/attention/triton_ops/rocm_mla_decode_rope.py,sha256=664WnAJ91EiCUZOcnVDfbTQf4uGJ4ZDZB1CbxpEUFZc,13866
269
296
  sglang/srt/layers/attention/wave_ops/decode_attention.py,sha256=oJNBG57cySgxtmJe1MSEsZKOIQOXnH0iVAcFO6DUWvY,4732
270
297
  sglang/srt/layers/attention/wave_ops/extend_attention.py,sha256=LyZQQIvFYfcIcObgy_tETK5JxRLgAkOYlF-KhGcGEoA,3877
271
298
  sglang/srt/layers/attention/wave_ops/prefill_attention.py,sha256=viTUit0rxjVV5UahuwmVAhmL66YRFJD4g1YhH_oRBu8,2344
299
+ sglang/srt/layers/deep_gemm_wrapper/__init__.py,sha256=esJMd0Yuj68t6QYOpmIFuiWP2J2dxTMC4bRBNH0Xk6I,26
300
+ sglang/srt/layers/deep_gemm_wrapper/compile_utils.py,sha256=tvoJ2PmYJWm6j_JfRpmBhg7mUZyH27f5JJeDZ4xcZhg,8067
301
+ sglang/srt/layers/deep_gemm_wrapper/configurer.py,sha256=vkMBNZx3RqukEtxMUAbTfKJii3MDXLBs83ZlsgtxNiU,559
302
+ sglang/srt/layers/deep_gemm_wrapper/entrypoint.py,sha256=5VTBfCU6wTBS2uMJc-luyqawh1478w3Jh1qk39qhjlI,3199
272
303
  sglang/srt/layers/moe/__init__.py,sha256=P8OC-pUE5yeEr80QUDqSPwF9a9BAYPuaK7GNlQovsJw,863
273
- sglang/srt/layers/moe/cutlass_moe.py,sha256=JKJED-4709ndP5AwhQ7Vi04GJjw5d9Xl_mWOsZPZ3U4,14298
304
+ sglang/srt/layers/moe/cutlass_moe.py,sha256=335MeGbcVPsAI9oaEQCVSMxzzQ9YV1qPiNxINXtvO48,14206
274
305
  sglang/srt/layers/moe/cutlass_moe_params.py,sha256=9NRCmgP_Ug3gGqCcpi-x-QRbLjCNpw8792gKXwZsbEU,6522
275
- sglang/srt/layers/moe/cutlass_w4a8_moe.py,sha256=psvH2RhUQkK4oyaSE7xe0EncCqLvNbd_NwR4XHxk79w,7017
276
- sglang/srt/layers/moe/flashinfer_cutedsl_moe.py,sha256=4TS3YLrmxn5dEHYUKeY7aohBXYeAsU8UCx846NXFTw8,6197
306
+ sglang/srt/layers/moe/cutlass_w4a8_moe.py,sha256=yTSlr_B9y1jiAmp6pX88LHb7hQ351Ensa8SR2fgW3v8,13898
307
+ sglang/srt/layers/moe/flashinfer_cutedsl_moe.py,sha256=ULLAdfRad_sG2ZYXE4qMCOutQX0eckQt0fwwhfcsckA,6186
277
308
  sglang/srt/layers/moe/fused_moe_native.py,sha256=XzJPM9Z6YQ4ejrMrBFt3l1i7guBcdQTXo9-gT5H8AIA,3479
278
- sglang/srt/layers/moe/rocm_moe_utils.py,sha256=07Z99bTV3B-b2Cbm-odhGpx2twxtnVpYvaDMBE1K3LM,4555
279
- sglang/srt/layers/moe/router.py,sha256=eUNu_Uz5VB2FOZzZyYuZo5pokCVBS17_fcjHQbmvDSE,12181
280
- sglang/srt/layers/moe/topk.py,sha256=HcvKwbew1W4NJ-IGCp2aietW3o3KQPRuC7siRrjavt4,32240
281
- sglang/srt/layers/moe/utils.py,sha256=HPRJy9cYYPAV5jU4dPYidIpVuSyk1HgaJrePQyD21Fo,6361
309
+ sglang/srt/layers/moe/rocm_moe_utils.py,sha256=SglTXIzpiWKFKVEf9gS8SEocJYcSOmeKUKjHznfC_nI,4527
310
+ sglang/srt/layers/moe/router.py,sha256=ouSNu8XU2w-BICyAYPpFq2zPb11LyTDalZElh0AXGus,13675
311
+ sglang/srt/layers/moe/topk.py,sha256=reUXYWZdHVfNJnrRxd8kXjGVLhdNu3AxRqOt5N7NyGg,32306
312
+ sglang/srt/layers/moe/utils.py,sha256=lP4WESNZBjCaY-dOnuJ6jkrrAXl2e3pR3MTMjyWQFic,6782
282
313
  sglang/srt/layers/moe/ep_moe/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
283
- sglang/srt/layers/moe/ep_moe/kernels.py,sha256=WfHn5Kt3NH6MzawvtycMSgo_WDqg1aJQXp1HuqgNAP4,46168
284
- sglang/srt/layers/moe/ep_moe/layer.py,sha256=7Aekn8YmGXThshcbMY7dk4fMVNLsTQ1_MnDLWwn5S6E,35667
314
+ sglang/srt/layers/moe/ep_moe/kernels.py,sha256=DjgEBHIS8-S1SO46xGbnREc2vQ8dO9dDKNRYKZuwMzM,32125
315
+ sglang/srt/layers/moe/ep_moe/layer.py,sha256=D8U42eegm1cwuS9zpwIOj_DV_LmiapMOh2hMWJOBWj8,26193
285
316
  sglang/srt/layers/moe/fused_moe_triton/__init__.py,sha256=tis0ZJmih7gKHCurbLtY_o-bY3K4MOzQLYLC3ftIOf0,977
286
317
  sglang/srt/layers/moe/fused_moe_triton/fused_moe.py,sha256=mKH6zTTuh_Z8Ceg6d1VWjGBI3iPBn1YfGO6udxIRAtU,23306
287
- sglang/srt/layers/moe/fused_moe_triton/fused_moe_triton_config.py,sha256=1iX5ox2KT5sgLHrN6l4svsgtn1-q_6514Q_F1v83-iY,7747
318
+ sglang/srt/layers/moe/fused_moe_triton/fused_moe_triton_config.py,sha256=0jTqnuw8v6uwr4g2IJ6bc3PRq77HF96mEYaSOBmpTAQ,7983
288
319
  sglang/srt/layers/moe/fused_moe_triton/fused_moe_triton_kernels.py,sha256=QOdl5uhZ8--aryXnKObdspKonGcF6Tc_U9o_lC_opo8,27760
289
- sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=1FGnf9QRSEPYdOZzvu-DFuz2DYDY0u7TaW0IuDYm-i0,39690
320
+ sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=E2qURbonpdnEOqEV2MmgLgUdecCSyfxyua3rmWb5kiI,39806
290
321
  sglang/srt/layers/moe/fused_moe_triton/moe_align_block_size.py,sha256=U93mxPPU2RP7d3QRSvoG3OCtUQIK8YhQfHf1ZGeREmY,3284
291
- sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py,sha256=Ai06BZ7uxMnk0nPWQelgvi1rV9Z72FetRo6p7E3rsYs,10986
322
+ sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py,sha256=8_LiuVJqeuMIsy0nBJExYH9RAftfyutCKh_2NWU10rg,10141
292
323
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_1_0/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json",sha256=iNGsE2ZeVnQEnN4A8UJ9Jv0d3hbRF2MJ9oBgjup5Szk,2737
293
324
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_1_0/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB.json",sha256=JJN0hryyLr5Zv3dSS7C8cPFhAwTT6XxUVnBGMZvV6JA,2752
294
325
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_1_0/E=1,N=1792,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json",sha256=ouRyZ5PEMPP2njPftCNhs-1g1y6wueWLmhI7G1SjV1k,4131
@@ -473,6 +504,7 @@ sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py,sha256=Ai06BZ7uxMnk
473
504
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=385,N=128,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=rgF-KSAUXmI7QGrhMUywPVfeTxz_j8_IP4N-6bkYdak,3260
474
505
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=385,N=128,device_name=NVIDIA_H200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=7aaoi0MI2xC5ZJkflkTZAH4tawTPdmUpmcBOgOInKxs,3268
475
506
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_3_1/E=8,N=7168,device_name=NVIDIA_H100_80GB_HBM3.json",sha256=a9XJZ0XudUTebAdN5guVq-3XSvZetHIRjatO1-_0xCk,3257
507
+ "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=128,N=192,device_name=NVIDIA_H200,dtype=fp8_w8a8.json",sha256=-MZaZ4R9r5Rk8a9OEa1eM_S6INlcsX68Bj5_pM4Aa0U,3257
476
508
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=128,N=352,device_name=NVIDIA_RTX_5880_Ada_Generation,dtype=fp8_w8a8.json",sha256=L7acUMDmYZOeA-riEds1-r9Wsq2KBWJlG7X7rilWjfA,3254
477
509
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=128,N=384,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=6JYGN4imwzIrQAEgboSO93wWYBuguzTgBjfTedq2c_Q,3250
478
510
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=129,N=352,device_name=NVIDIA_B200,dtype=fp8_w8a8.json",sha256=ClPogINm5AsnjDqx6Hz_rHrmnnCdUPid-jYIdIgjZxs,3250
@@ -480,6 +512,7 @@ sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py,sha256=Ai06BZ7uxMnk
480
512
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=129,N=704,device_name=NVIDIA_B200,dtype=fp8_w8a8.json",sha256=W8C1GtP4K43SK9128U52DD5WWofvPleAJE4us2Qju1k,3251
481
513
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=161,N=384,device_name=NVIDIA_RTX_PRO_6000_Blackwell_Max-Q_Workstation_Edition,dtype=fp8_w8a8.json",sha256=RMYwqtB7hYeaCyuZ1feVnRhBGlN4jMcmNQX2hqUqBlk,3254
482
514
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=256,N=256,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=T6kCtCUytCxiW8JOLfEF3YgdCD9_mKccJ85IqT0b8LU,3253
515
+ "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=256,N=256,device_name=NVIDIA_B200.json",sha256=NkLVci5u2GGeuFbC3d_6PicBS3mSuV77JICCSzU_8cc,3238
483
516
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=256,N=256,device_name=NVIDIA_H800,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=M3W1OQU6RgKAQL2EoYivAIidtz1cvgoK6_6ntNfn_lY,3265
484
517
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=256,N=512,device_name=NVIDIA_H20.json",sha256=bSe-KUwiVT3yM9jQuXlDmxe_KUft7FUn5zOby8bpSkc,3233
485
518
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=257,N=128,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=RbJYTRfjP_3-ytfj53W_w2jFpZ9xwMaqoKW52pkgP3c,3257
@@ -496,49 +529,52 @@ sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py,sha256=Ai06BZ7uxMnk
496
529
  "sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_4_0/E=512,N=64,device_name=NVIDIA_H200.json",sha256=phmhkQNz8DcLHPqN5tjmJqOgbX0BhQx9cP82fp_jyIQ,3236
497
530
  sglang/srt/layers/moe/moe_runner/__init__.py,sha256=Dc4PH6HfzQDjJWL7iuZ-0qh8oRu7OtnH6IEl675pYiU,172
498
531
  sglang/srt/layers/moe/moe_runner/base.py,sha256=GMdFI74BGO5HDjtel5QWI7W4CFix0BHkw_HrjVswhcw,8905
499
- sglang/srt/layers/moe/moe_runner/runner.py,sha256=7ZOqDu0r1GY-9ra1VICq4WmH1nJVSQoE5yBXuSUr2CI,2669
500
- sglang/srt/layers/moe/moe_runner/triton.py,sha256=YaPqGIX-5y25nxmjF54_ASYbr9Dw4RYze2cNV4cUg-Q,14433
501
- sglang/srt/layers/moe/token_dispatcher/__init__.py,sha256=I5I1ySCHbyAW5cFQy9mpuqkSWqLclLmi2AspCkoP8ig,993
502
- sglang/srt/layers/moe/token_dispatcher/base.py,sha256=BqqwuSETP47vTaHkUoQWTEeZcAkg0n_Dgka-PkFM4uc,4029
503
- sglang/srt/layers/moe/token_dispatcher/deepep.py,sha256=LtsaJ3bR-HBQL9ZWjgbw-HaP-hcAqAgrmpO-829PL94,26293
504
- sglang/srt/layers/moe/token_dispatcher/standard.py,sha256=_OSudEOHA5qHqR5TJqnylQxUYyk7ZnhRMGOf7sMCyt0,1526
505
- sglang/srt/layers/quantization/__init__.py,sha256=GmJvVSlkJXf2AmTfWBN6EBrOhhYlxPYNE_eAEXMZfjs,7813
506
- sglang/srt/layers/quantization/awq.py,sha256=YuAkweqSvQQGTGQvg4VpNXevSaJvT8CROpiNzmY_3tQ,26980
507
- sglang/srt/layers/quantization/awq_triton.py,sha256=4XwJbRNlFmlvjbMGtWF1Wvk26Kf96162vNEmuI5Kars,11737
508
- sglang/srt/layers/quantization/base_config.py,sha256=ql3kwwnjVzZGh8BUcimMt8K6kFxQtVbR5WgZHXqkOqA,7245
532
+ sglang/srt/layers/moe/moe_runner/deep_gemm.py,sha256=xhxZsQpD9U8OReNaA_qwXWA98hVUS6rvcbWukQcv8tc,9342
533
+ sglang/srt/layers/moe/moe_runner/runner.py,sha256=MCrPZQuuTxD4NGdnRaIkLc-xy8yOnXZW3ThJ2L-ymu4,2845
534
+ sglang/srt/layers/moe/moe_runner/triton.py,sha256=pYzFyJDocnBfNiF6kp1cnSZmKKTsLOYXpAUXFZYKOsI,14464
535
+ sglang/srt/layers/moe/token_dispatcher/__init__.py,sha256=0lIB1lkEcVYiW2iEL_hzAPk-AG85dFYAdyK9MBftHsw,1273
536
+ sglang/srt/layers/moe/token_dispatcher/base.py,sha256=ZisVo2ty9vx5Oj1V1_w570_v8e8zbIpcEeXl4UUeZVQ,4015
537
+ sglang/srt/layers/moe/token_dispatcher/deepep.py,sha256=lVBM2ZE4XgHX4eqVuFuoF5rPPrY54CKoiapa3txFvcc,26430
538
+ sglang/srt/layers/moe/token_dispatcher/mooncake.py,sha256=ZQpjlv-WvEvTgFE6R_zuzFZXOfbRwVvXFYpOnWuCBXk,11855
539
+ sglang/srt/layers/moe/token_dispatcher/standard.py,sha256=2il92nCW6HuuUrkT9MHumTQf0FZ-JhVBoWNzwaZ_Zwo,3461
540
+ sglang/srt/layers/quantization/__init__.py,sha256=f05hWlwXrtzH0Ugk4kY6xofrnMK4A63FbSyPj5GMi6w,6343
541
+ sglang/srt/layers/quantization/awq.py,sha256=jeGGkHIkmRsGHNWo27uNPB7B6M1uYSVmmjeCbhdIjew,33411
542
+ sglang/srt/layers/quantization/awq_triton.py,sha256=1QwpxPoqcfe3sDU8uRs3LXBRcDZvq-M9xQ7NE9RV0Mc,12658
543
+ sglang/srt/layers/quantization/base_config.py,sha256=v9apbnLDBUqQfm67kAYeky1Fe_RVyi1Upeua1w1ncK8,7895
509
544
  sglang/srt/layers/quantization/blockwise_int8.py,sha256=pqSLo4gwazZ4ajdVzyouwh_Z5oVDbWq9wo8RnrMdY8o,13998
510
- sglang/srt/layers/quantization/fp8.py,sha256=pMr42f5f4QDQcOYmo3g2VBv_Dh8li85KpnbKYa2oNyo,50739
511
- sglang/srt/layers/quantization/fp8_kernel.py,sha256=Mgigb6GmF66oCrgjS97IvDDSacNYb0u-VYAf4FChhqM,54849
512
- sglang/srt/layers/quantization/fp8_utils.py,sha256=sxsjlqL7sWXwbgsxwfzFSkojyN3w8KQh1R99JEWdBl0,29191
513
- sglang/srt/layers/quantization/fpgemm_fp8.py,sha256=dq7rJz-QB9LovmZZLBMK8YJEOr05wjVrtWLmSTkXjYw,7004
514
- sglang/srt/layers/quantization/gptq.py,sha256=Qe6XfBWd9aOW7jkLmQR61AjmJRe5MJi6FJvGno1HH4k,39433
515
- sglang/srt/layers/quantization/int8_kernel.py,sha256=GfRC9FOn9exNvK4QHbUeBj3Hhv32VcyGphapFPt5b84,12625
545
+ sglang/srt/layers/quantization/fp8.py,sha256=pyJxdl5jrXjzup27BI2hmIqKic_S9qI0siMR5qL_XeY,53442
546
+ sglang/srt/layers/quantization/fp8_kernel.py,sha256=noTju6oEzKQ4mOcgWF8s0sFL5g-PuxLrCivvSbKQJWI,56181
547
+ sglang/srt/layers/quantization/fp8_utils.py,sha256=enZUimrleDg7RJhoh7uxVLRYd1dSMKeCUhaXuwWAYyE,29831
548
+ sglang/srt/layers/quantization/fpgemm_fp8.py,sha256=OpDJAOBpy3PtAvDwG3ZIA4ItMFvrodxAHTkHQnT_cso,6967
549
+ sglang/srt/layers/quantization/gptq.py,sha256=oAlxR3qX06Pwc9-kkrzu7W4j0K-zWfi2JQL3yO0HHCI,39377
550
+ sglang/srt/layers/quantization/int8_kernel.py,sha256=nl3bmwcgvs8SCe3_jz0hC5f6HfdohhEMyeWM_t8Zx5Q,13124
516
551
  sglang/srt/layers/quantization/int8_utils.py,sha256=YK9CS-lb_n91kNCTKK5o5apYF31V2giDg5G5VKrpcUA,2356
517
552
  sglang/srt/layers/quantization/kv_cache.py,sha256=_9pF5rwvB7ta6Gdc5YKVVGbNzYwqmhIx4TrX1-xnodQ,3261
518
- sglang/srt/layers/quantization/marlin_utils.py,sha256=aM3GU7b7rHNZE-tZjRSrtOaPWzSaMcLxck4he8MlEVI,26344
553
+ sglang/srt/layers/quantization/marlin_utils.py,sha256=Zvasw0DpgMQKTNJm1ZNGLt3P1AKgDfYhTpePdI9BbQ4,26634
519
554
  sglang/srt/layers/quantization/marlin_utils_fp8.py,sha256=iSjq-ikPOTU5plrWNTW4MletKLySIrNl5NhQmY6FyAo,12508
520
- sglang/srt/layers/quantization/modelopt_quant.py,sha256=qDCoZxsZnZmi6RM3LbIw61Zzm3UM_vM9nRvIUOwcmCA,59352
555
+ sglang/srt/layers/quantization/modelopt_quant.py,sha256=yKs6xczPfjKV1UKB5S50nol4rRURMX4m7_7pYIYJZU4,60689
521
556
  sglang/srt/layers/quantization/moe_wna16.py,sha256=uoRhxJ8W_U_VFpbn03YEp0aCjbzqquWwonjuN7KBucw,19117
522
- sglang/srt/layers/quantization/mxfp4.py,sha256=mb_DeJgrmEBS2CREZ09WsQVetxLozq3a4HhxqMq2amY,32993
557
+ sglang/srt/layers/quantization/mxfp4.py,sha256=OpthUaglm7Yf9jojZenHqRSVLWLy3mFuGk6PvgPNsnQ,31829
523
558
  sglang/srt/layers/quantization/mxfp4_tensor.py,sha256=bGeCXlIOhmFZFGWp_lITkIRDEgGUaLpawDvMy1cTOmA,5389
524
- sglang/srt/layers/quantization/petit.py,sha256=74Jn0eICq23v_b4rEctDaYTINtbqkdM6IXycT-_FbbI,8954
559
+ sglang/srt/layers/quantization/petit.py,sha256=foRPfOfhq02h6yMt-8yHKofQB6l16Pz-bRCqUD3iiHU,8944
525
560
  sglang/srt/layers/quantization/petit_utils.py,sha256=-gy4zMhqNoIA1R0n7-5C0efV54jHonCUgPDUUFjGsyM,3245
526
561
  sglang/srt/layers/quantization/qoq.py,sha256=jM96uJfKz3vo1B6SSIrQXNT3vnD3UJrepK2eY-tSQU4,8139
527
562
  sglang/srt/layers/quantization/rocm_mxfp4_utils.py,sha256=Z4pYWl6ExOXq2qfTHorW16hVbJ-Rk4G8Wrxn_x8boHE,327
528
- sglang/srt/layers/quantization/unquant.py,sha256=T8w0mPvtBM1JhGhle6NoDY9C4xfmPWHU_VEJZWSnUNY,16079
529
- sglang/srt/layers/quantization/utils.py,sha256=d4eaS4-Z4q3GRgb4HDMr2EoWEdQCefrVdJufK6n_NQY,18509
530
- sglang/srt/layers/quantization/w4afp8.py,sha256=uSVtBXYIKPMa_Li1HHyZEifdaNzVCr-lTiEwRnIexD0,12148
563
+ sglang/srt/layers/quantization/unquant.py,sha256=T-KbIdvsYSqNdYfdnH7zSy9foSHMagPcFLfxkfF8e_g,15980
564
+ sglang/srt/layers/quantization/utils.py,sha256=yqgmoLvrrp5aRj-LTJZ6dI1hmP1UFgbpyjVWJJdomZQ,18472
565
+ sglang/srt/layers/quantization/w4afp8.py,sha256=yYvI7Tv4N3urK4m6QyO6cWa-SBz7bN6bZREnDqwX4wg,12969
531
566
  sglang/srt/layers/quantization/w8a8_fp8.py,sha256=ugLV4G4MDog-UuLqSnEasBqE3Hh6AqE5ZYI371ean90,10415
532
- sglang/srt/layers/quantization/w8a8_int8.py,sha256=e5mrRf7AWfit-5dOn3Ul9nTLt6OJth6SgrVpEdnVdE8,37076
533
- sglang/srt/layers/quantization/compressed_tensors/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
534
- sglang/srt/layers/quantization/compressed_tensors/compressed_tensors.py,sha256=Jfvvu0xL9WR075I2Qx8prTfGp77hKwkDH--V3R5pBpE,25928
535
- sglang/srt/layers/quantization/compressed_tensors/compressed_tensors_moe.py,sha256=tFw8PIF5r8yjdJFt2_3Ou72vUJvgLd3bXFOWdgsCeno,26732
567
+ sglang/srt/layers/quantization/w8a8_int8.py,sha256=WkhbRVnEamh78uyj9WyS9OfeSpZTsWh51kDCH4HICa4,37534
568
+ sglang/srt/layers/quantization/compressed_tensors/__init__.py,sha256=zMpLnf9GiRhV-jg1H2UiZ6OUMSKMcmLtrr2A4XjhuUs,217
569
+ sglang/srt/layers/quantization/compressed_tensors/compressed_tensors.py,sha256=P8RmY91K2a__xNQI69zqTuGFnFCBE41DGUlp9WutKJQ,24948
570
+ sglang/srt/layers/quantization/compressed_tensors/compressed_tensors_moe.py,sha256=yUITBLC024lXAkVh3qfvd6bX_U0prVMbX4me_gtqUWI,38895
536
571
  sglang/srt/layers/quantization/compressed_tensors/utils.py,sha256=mnUmKWFQUnY8bVoFHUuNVwqsfS-cefeR-ofyaihCXcY,7621
537
- sglang/srt/layers/quantization/compressed_tensors/schemes/__init__.py,sha256=ipQ5M4UkFHVsuAm2u4yZJd86NHtOenyeeahBtiLBLaM,448
572
+ sglang/srt/layers/quantization/compressed_tensors/schemes/__init__.py,sha256=qhx1YhMH6dzvnzLSSN1uQDE3wDHMoOA_HRkjn6lsvzU,589
538
573
  sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_scheme.py,sha256=tdKJC8c3SX8T3z8JL-1YCsg4ftcv55Wxt0vZrYftpX8,1635
539
- sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a16_fp8.py,sha256=VvqVpAr66AlS5IPVuIR5Nu0ESH0oAoKo545jNart6lI,5493
574
+ sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a16_fp8.py,sha256=kDkks4z5zCh3bBoAo0_I3Yyp0--a_sQBY2zNs2wzJ0w,4982
540
575
  sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a8_fp8.py,sha256=4cfB6pv7kt8Ek0e88vLyXymSW6VqbAUpIjNt_-KK9-M,6318
541
576
  sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a8_int8.py,sha256=6usNdpr8mL5QRlTK_pZQtGwgmSMNi0KdMfm57kq3lw0,6908
577
+ sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_wNa16.py,sha256=uG3dvlNuP5ZC3_NxIhjWWkrUVw4FQxlt5jobzaofAHM,12884
542
578
  "sglang/srt/layers/quantization/configs/N=1536,K=1536,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a8,block_shape=[128, 128].json",sha256=RdHQxWXwXqvio31192vsLaKjEr4f_DjpMPKlarY1IAk,3251
543
579
  "sglang/srt/layers/quantization/configs/N=1536,K=1536,device_name=NVIDIA_A800-SXM4-80GB,dtype=int8_w8a8,block_shape=[128, 128].json",sha256=0vLaJgo5B9ti-XMFKJuvSoMGjsZQ-RhHSx4cC8Xji-U,3254
544
580
  "sglang/srt/layers/quantization/configs/N=1536,K=1536,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=tkLjwLC_aVXhzuvo-2QHkojXZauPJsf3jNHFn1S7uRA,3244
@@ -691,325 +727,348 @@ sglang/srt/layers/quantization/compressed_tensors/schemes/compressed_tensors_w8a
691
727
  "sglang/srt/layers/quantization/configs/N=7168,K=256,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=PD4AJYCkHfy2ivv9baMouFXzBTy0eKMumbAfxfm91HI,3256
692
728
  "sglang/srt/layers/quantization/configs/N=7168,K=256,device_name=NVIDIA_H20,dtype=int8_w8a8,block_shape=[128, 128].json",sha256=FImA-TJ_tQDjqwoNWxS--sRDoKDXf9gamlME3tkxH58,3252
693
729
  "sglang/srt/layers/quantization/configs/N=7168,K=256,device_name=NVIDIA_H200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=FFBjSWlpKXMxfAUUYUqXbOK_Hd7qBeBsfbcaa9uB4qY,3249
694
- sglang/srt/layers/quantization/deep_gemm_wrapper/__init__.py,sha256=esJMd0Yuj68t6QYOpmIFuiWP2J2dxTMC4bRBNH0Xk6I,26
695
- sglang/srt/layers/quantization/deep_gemm_wrapper/compile_utils.py,sha256=PI9r3PHCMK9EgpoFuBgR4jvokA5sBz8zyC47ps3wet4,8164
696
- sglang/srt/layers/quantization/deep_gemm_wrapper/configurer.py,sha256=a1b2P8-5PRNwW1ykXR7jJF94aUF3u3t3P9ad_R1k2PI,549
697
- sglang/srt/layers/quantization/deep_gemm_wrapper/entrypoint.py,sha256=qiUuQn-InDLYVNDPFOxde2XB-qlE0fol0HPTkY5KN8g,3197
698
730
  sglang/srt/layers/quantization/quark/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
699
- sglang/srt/layers/quantization/quark/quark.py,sha256=EqQvWzAc6nd_yl6UIMIwmozKif4I8fRNfBum040UUEQ,14613
700
- sglang/srt/layers/quantization/quark/quark_moe.py,sha256=fWUAEvLoaiw_6oNC7TQW2pUuR2AeNI9AaGWNcUGDiSQ,7446
731
+ sglang/srt/layers/quantization/quark/quark.py,sha256=Xt8e8Ds7wKV2UyQ3rJq9cFUtSNmTSAnRLnC2OgTBLds,14687
732
+ sglang/srt/layers/quantization/quark/quark_moe.py,sha256=-XW9mKSisXmqs7Ep9exPAFlGgCfZ0-N3P35B9HZdamA,7371
701
733
  sglang/srt/layers/quantization/quark/utils.py,sha256=zZHRe9mjxGp16_OJ5Qy_UtnQgipl3ZRZUmruYvyEm_w,7445
702
734
  sglang/srt/layers/quantization/quark/schemes/__init__.py,sha256=z1LHBPqkxAS6Wp70DWwESOSixWpIhIQwz1IHcWDdURQ,167
703
735
  sglang/srt/layers/quantization/quark/schemes/quark_scheme.py,sha256=b8-Djo-UQAwgxSWViKDoEP5dOSesnEBPyozX-osB3WY,1478
704
- sglang/srt/layers/quantization/quark/schemes/quark_w4a4_mxfp4.py,sha256=sW57dU7HoxQGVbzUhyhRirGWA8oVpENB4NTzO7URGgU,4198
736
+ sglang/srt/layers/quantization/quark/schemes/quark_w4a4_mxfp4.py,sha256=aASlSjoLgmEmiSAULaehpNOCSGy1OYiAFazWLmJB970,3935
737
+ sglang/srt/lora/eviction_policy.py,sha256=IaG1tlchPeT2iYwuaMGdHuma91wraO1K9qRIFoV4yko,5378
705
738
  sglang/srt/lora/layers.py,sha256=0XlVcBTT1InMsBoLfiOO7yOnlDrnpXD_08wKo84T4B4,11852
706
739
  sglang/srt/lora/lora.py,sha256=FooB4hOW5uvZJrDrdqKwBExb-lX5Uw_Y1gjU9an8hzc,7669
707
740
  sglang/srt/lora/lora_config.py,sha256=qDgMTx_69jyJUl29O5FxLzYa0BMhqYVXWXfyyVOvGm0,1684
708
- sglang/srt/lora/lora_manager.py,sha256=F5kO3A6NFNFfu0hFZcn4Yr6Hum6si_kH6eE3Aw_Wxjk,19247
709
- sglang/srt/lora/lora_registry.py,sha256=osbau-sQZ7BuCeGGpBMFy4w40GO5FGqRgRwDyxxgNmg,8167
710
- sglang/srt/lora/mem_pool.py,sha256=qh-AA7HhJDKG_xF5-67WGhrV6ohMM4TQU5oY40LVulc,11485
741
+ sglang/srt/lora/lora_manager.py,sha256=WkSFWbyWtR2jkG7Erled9PBLTMqkB3keVjaN31Cluq8,19950
742
+ sglang/srt/lora/lora_registry.py,sha256=Ox1n6ZmGAWGThpDVd8WjQbJACejnA8n2lGNCVzKReaQ,8173
743
+ sglang/srt/lora/mem_pool.py,sha256=WQex5E9lQ2Arzkc9X52EHx3OLWzMwQfoepv3OdL7Fv0,12412
711
744
  sglang/srt/lora/utils.py,sha256=FeIb51m5EIcetP1Pgn8X17EfuE5tGipm5iurRg3RAZw,4424
712
745
  sglang/srt/lora/backend/base_backend.py,sha256=kfkr-OxdPyUwMzi0HgjTNfX9bZC4z_ljt3srzRPgMfI,6139
713
746
  sglang/srt/lora/backend/chunked_backend.py,sha256=x2VNkjLHmrOXwI67v_2LgjpCH8R5wuSmY5jdTWV4K7g,12701
714
- sglang/srt/lora/backend/triton_backend.py,sha256=bKH8DPo6fg7JVZt73iFV5BHc8amEJkr4FopbCnJer94,6072
747
+ sglang/srt/lora/backend/triton_backend.py,sha256=XrOaZLlwldwvGjE1h0OOVKIwYIS98Ph0aWQetub3udo,6026
715
748
  sglang/srt/lora/triton_ops/__init__.py,sha256=no7N7uWnmCvHHbNZ6PZEadXDujIjHGP2jp_3N9j6vHM,495
716
- sglang/srt/lora/triton_ops/chunked_sgmv_expand.py,sha256=sW7vsjOvyoI_00KJLZ5g0JwjTY7-AGzPTpKo3tuYC6U,6812
717
- sglang/srt/lora/triton_ops/chunked_sgmv_shrink.py,sha256=sF9PzxK7XN3-MVqiz-S0DyVU2u1ADDhgnvpBe3GTaGI,5411
749
+ sglang/srt/lora/triton_ops/chunked_sgmv_expand.py,sha256=rllqrhX3NQTmFNXnfxm0v7sY06-hggZkNWIjU9TRBc4,6844
750
+ sglang/srt/lora/triton_ops/chunked_sgmv_shrink.py,sha256=n5ANXoEciOFgXuQkRZzZcW1WmdV2qtFDH7Yx83GYHUA,5462
718
751
  sglang/srt/lora/triton_ops/gate_up_lora_b.py,sha256=QURCYxHNR8Ls4SQtt3dvdgjvdDVhywI9tOzsK8SV9m8,5779
719
752
  sglang/srt/lora/triton_ops/qkv_lora_b.py,sha256=z9BB84Xu_MjwCu5v9Yvji-FkIzfEjDySAFybc4WYv7A,6483
720
753
  sglang/srt/lora/triton_ops/sgemm_lora_a.py,sha256=Ksova04wgeGsFqGOXWqJtMYaHgyUYcx8VU42BZQOkVA,5129
721
754
  sglang/srt/lora/triton_ops/sgemm_lora_b.py,sha256=VqCAFvUtq_l-0RGIkx3W_fzD55QcW2FAcqpvSHOBFp4,5115
722
755
  sglang/srt/managers/async_dynamic_batch_tokenizer.py,sha256=btIWhI15a3QCLabdZZhrJVEWZ3zZTgldbv7pGjAPZqo,7236
723
- sglang/srt/managers/cache_controller.py,sha256=G-2292PKRRUQR6Co3sFt0oGs7zk6bqJ6RldEH0JQMGA,29300
756
+ sglang/srt/managers/cache_controller.py,sha256=Wy0ygZ5FAiXLrz1xzczeinfJATk7aPkH6yvXqOzH5_A,30478
724
757
  sglang/srt/managers/configure_logging.py,sha256=8sNXZ2z9pBWOwn-X3wyz013Ob8Nbm1zDxRkxoZjH-l4,1633
725
- sglang/srt/managers/data_parallel_controller.py,sha256=YalvihRIJwph7OdSHf24rBsWYvmLQzUnJiDL261fyMM,14880
726
- sglang/srt/managers/detokenizer_manager.py,sha256=QhJDFju95xTw7epUXvBH0t2DfwU-sR13v4i4ZAcFyQo,11815
758
+ sglang/srt/managers/data_parallel_controller.py,sha256=TAJErsNQUomHFnekrPceMZbN95PfFadticjSup3JiLY,19236
759
+ sglang/srt/managers/detokenizer_manager.py,sha256=K6TLeBtDb8geRVKvTlFqZJN-26saYJxxLlRspvEOFe8,13080
727
760
  sglang/srt/managers/disagg_service.py,sha256=7VyRva5oniAPs8G-DYg2fv-mdjSxk9cLZPzl_TmB_2Q,1588
728
- sglang/srt/managers/io_struct.py,sha256=ZkxZpLbdEJTl92GtmaGfG0TDuuNpcC6YrvOXG6X75hI,48748
729
- sglang/srt/managers/mm_utils.py,sha256=b6n39SlbaFP2XdUvJYOfRQL1Gch8fP--VxpOGsRJ8tc,30917
730
- sglang/srt/managers/multi_tokenizer_mixin.py,sha256=audn1iSNNVu3d0DamslN1e-KGvhRJ5d_pw68nucQOUU,21676
761
+ sglang/srt/managers/io_struct.py,sha256=BEx_N4PwZnLoTBdvMp_zHz29btJvUevTM7S5gqVeB5k,50778
762
+ sglang/srt/managers/mm_utils.py,sha256=xJ7Pbk1ZxIyodLyeNv_t0JeSKCqrP7u5hpMcC-0Rpzc,31283
763
+ sglang/srt/managers/multi_tokenizer_mixin.py,sha256=nz_G1sLW-bN8Aa7Vy4ZUM7voaCPf7oMTe_M76H7vhyE,21050
731
764
  sglang/srt/managers/multimodal_processor.py,sha256=0mLkwu6CGRQtt3G2T1tS3PSsh6dpyivV-vAfIHfcMbQ,1764
732
- sglang/srt/managers/overlap_utils.py,sha256=QHeF3rQPI_kgMngPfDpAO8m80ZKSXOxB2G6r4Znyi2U,1809
733
- sglang/srt/managers/schedule_batch.py,sha256=qQVFsvoJev5vgoOkFS4Zo_3tjv-5Vg0zxdxQlFYWS1Y,81929
734
- sglang/srt/managers/schedule_policy.py,sha256=tdb81t-_zILXSGe5E3zNqg7N0_pbLWa8lfV1V7lAGnY,28192
735
- sglang/srt/managers/scheduler.py,sha256=9hjS_FeM7Qfy1EYqvCmdrkuANFGFhNXvIXibDmGlZHE,119572
765
+ sglang/srt/managers/overlap_utils.py,sha256=dDz1zUBlJ9Ohw4TPHgOxnuh6LPCsN037c14XIw3E-J8,5050
766
+ sglang/srt/managers/schedule_batch.py,sha256=0oWPNVtdgoX2bFHOc1RN_1IYyoIE1yKwCImll65dAbQ,72622
767
+ sglang/srt/managers/schedule_policy.py,sha256=BFWoHG3m-lkeVvOkLGoMeEbRplq4vF4thsjv-P8MG84,28818
768
+ sglang/srt/managers/scheduler.py,sha256=BQ3_X5uG2a9La955Mw8OGTrhhlgKkhe3nDUE006YVnU,114768
736
769
  sglang/srt/managers/scheduler_input_blocker.py,sha256=SYZ91JNTHtqiBHUpkk_MboAiBFyl5U7ardLcYDAQ0OU,3689
737
- sglang/srt/managers/scheduler_metrics_mixin.py,sha256=tvDovTLhtf8svgqVXIyoAc1xuf4PrH0AuCb0SPMYrGg,13197
738
- sglang/srt/managers/scheduler_output_processor_mixin.py,sha256=-ObOi1TK7WBwbGOzB5usSKmnGYjAqMPsYXMP81hPC44,33753
739
- sglang/srt/managers/scheduler_profiler_mixin.py,sha256=62dv-rLS3acUncFNJd6S0P4jglJ5XY3CFIauB08xuJ4,11405
770
+ sglang/srt/managers/scheduler_metrics_mixin.py,sha256=duFJs6DlSFzV_1c7R2ESNGFEkGekxgDziJns4ttK-0Y,14962
771
+ sglang/srt/managers/scheduler_output_processor_mixin.py,sha256=n6zvLqu-TpTaZuWfYxz7ivCBPP3Z7okTOOshTq0d4CQ,42449
772
+ sglang/srt/managers/scheduler_pp_mixin.py,sha256=oUl5oxbFPd2gxqn4JXk-Bn-uLrmJZ6_Km5SMpSe9Gtk,16433
773
+ sglang/srt/managers/scheduler_profiler_mixin.py,sha256=LKgAaQ9kNdjK7J6xSwQQzo2q_pViWnlGIvTpe5_yLLQ,13505
740
774
  sglang/srt/managers/scheduler_recv_skipper.py,sha256=8rVQCBjn9f26Th4XbeUS3fEsvo1GI029Me28wMjcKRY,1103
741
- sglang/srt/managers/scheduler_update_weights_mixin.py,sha256=K9gCx16TaoeRah4fSYpIw_sOzRKuNUw2AJa6__dt5Bk,6194
775
+ sglang/srt/managers/scheduler_runtime_checker_mixin.py,sha256=54z5p36M2BgTQYrEz30aAtQVXWCBI9VHBjgzOf19QPo,8521
776
+ sglang/srt/managers/scheduler_update_weights_mixin.py,sha256=AuOKrV943inXe5s4cPb4_BQiNAFwkiQGlpaBS-aal-M,6957
742
777
  sglang/srt/managers/session_controller.py,sha256=FGADRGSkRmS76o_BQ2fivpgw0Q5Q-K0Ws3aezH41YSc,6041
743
778
  sglang/srt/managers/template_manager.py,sha256=M4EshVv1OhKxUAGQPP4OntRkSkUVvG93457xsYfWnQk,11968
744
- sglang/srt/managers/tokenizer_communicator_mixin.py,sha256=NshY8ibxS7EQQGSYEp1PAAli0UL0-J_XZFtpQr9BIS8,25048
745
- sglang/srt/managers/tokenizer_manager.py,sha256=YVCCbNP9g_56neSBcLnQCN1vtcmAp3apd7XLUq-NCig,77943
746
- sglang/srt/managers/tp_worker.py,sha256=Qprdf6QhbddbKiKtO6Huu6J9a6jpWB_BH5qXADHvkas,14145
747
- sglang/srt/managers/tp_worker_overlap_thread.py,sha256=9EoJ5ZbolfC8atvs6i6AFz9L9xHGj6OseaSLPezkVX8,11858
748
- sglang/srt/managers/utils.py,sha256=fE_RZl5q0sZl9EQZNLlX9VNOHINxh-TJLQoH26GW2Lo,4279
749
- sglang/srt/mem_cache/allocator.py,sha256=O-te5k_xLVB7o_GhBWCvperdm0_hJAlsxmw1QD3d9o4,18038
750
- sglang/srt/mem_cache/allocator_ascend.py,sha256=aGsh_VMI0eYoAy3uKCYbpAMFxyXVTyu4JmdeGDWLLbw,4997
751
- sglang/srt/mem_cache/base_prefix_cache.py,sha256=Bv84HD6e_yYdtmIQemK1m1OUViO0PnuAvOS9tDpQOJM,2795
752
- sglang/srt/mem_cache/chunk_cache.py,sha256=5_yPQMGDP6TGLSxrEhOrBcrpd_7Z15Qewh6DOC6WyA8,3487
753
- sglang/srt/mem_cache/evict_policy.py,sha256=yX8hFNQ_pdzuN4rMjYcByhQZLs-lRZdD0qDLkPe2ht0,627
779
+ sglang/srt/managers/tokenizer_communicator_mixin.py,sha256=CHry04ONVx3YMGNN5KtNJFaafxnw4LfXHceMR1q2Nwc,26088
780
+ sglang/srt/managers/tokenizer_manager.py,sha256=RcK-EvZJj1iNDlhD0WPK7FxxM1cAfKlidnZeJUkpSJ8,90837
781
+ sglang/srt/managers/tp_worker.py,sha256=qENe8zAagoTs50RJmCJi2il9JsQtuQqBHII6XBBPLJg,16212
782
+ sglang/srt/managers/utils.py,sha256=HRPecRiWLHTX6QbkyYRY-tjlpJEb9N1k0fSJsqBxJl8,7324
783
+ sglang/srt/mem_cache/allocator.py,sha256=TEAkK32vyYz7wow5bpZLlrzb3KHVXtw9h1KtGWg6kIo,18246
784
+ sglang/srt/mem_cache/allocator_ascend.py,sha256=GVI1HbNQRy_rIlUHEn-6oRe2WS_OBXfqmoco2Hxta_w,5017
785
+ sglang/srt/mem_cache/base_prefix_cache.py,sha256=Z6c9YKJjInVxvZAZpIh8KRAPlOyE0-aowncm4JMXE70,2813
786
+ sglang/srt/mem_cache/chunk_cache.py,sha256=u4EIGuWNonVoCItF2wrKnXzh2OtoDM04XhoffEK6ykE,3923
787
+ sglang/srt/mem_cache/common.py,sha256=PEFKzoawIIPRVboyInPKWG56qht-inp34vcj6q_fsfg,16283
788
+ sglang/srt/mem_cache/evict_policy.py,sha256=FVI4QsFJoRR1CaxE9jpX4OzBPt4w9ftfM2Ndu4BSfhA,1012
754
789
  sglang/srt/mem_cache/flush_cache.py,sha256=GYcxmNXh4hsMpFfNOuCTpKilW7guZwTtAg_usVeM3J0,979
755
- sglang/srt/mem_cache/hicache_storage.py,sha256=5L57L_vzqYyNk5PRdKikxyaaMj1LkCkWD38Sd93IAe8,7958
756
- sglang/srt/mem_cache/hiradix_cache.py,sha256=hSsz8k1foizh-wJUxDi9h0NQZNNmSQoH_YP4A4uLtms,35414
757
- sglang/srt/mem_cache/memory_pool.py,sha256=FiJzy8V39Jt7mIkyMiaq8OEhhnwP_GggOUm8nLiY3Ws,57038
758
- sglang/srt/mem_cache/memory_pool_host.py,sha256=T3lgq0dyjyvOGdx4nGSGZzm6fqkX9H0S0JzYaNGJJ7k,27659
759
- sglang/srt/mem_cache/multimodal_cache.py,sha256=zPnQLQhBZ6zsUpCQPSoNkrB9EEvpoDQS4mU7c3sRWjE,2171
760
- sglang/srt/mem_cache/radix_cache.py,sha256=1K1MvZZOLZVrbDti3pRrI1-pHJMlxxB3Scz9d9XNMo4,26390
761
- sglang/srt/mem_cache/radix_cache_cpp.py,sha256=0twLAAR2EYWyfRiUVsb__s01ITraNEF9bXBPZFvul1U,9454
762
- sglang/srt/mem_cache/swa_radix_cache.py,sha256=Kf5HAfnwJl1mr86pT7Y03o4RBKtUXfI6udbii9xAirs,40138
790
+ sglang/srt/mem_cache/hicache_storage.py,sha256=t1Dl7OLamm4sPa93sKNIIjSHtX1Rom3D8G9n9GXTipw,8073
791
+ sglang/srt/mem_cache/hiradix_cache.py,sha256=BK52hyQjPoXKzn_PDn_LRk_3a0AjWBie1Xk4yAO1B3s,35984
792
+ sglang/srt/mem_cache/mamba_radix_cache.py,sha256=mpKTxCzA1_u4eoHk0SvXPPNVVG_JivEAb44miY3aNuw,38678
793
+ sglang/srt/mem_cache/memory_pool.py,sha256=6zpF492cuG4sEXTC41liHi5wSN_dQnDt3sLulRDOPQA,64880
794
+ sglang/srt/mem_cache/memory_pool_host.py,sha256=IBUKHCmU_Fu8d22_V5ssYp4Ff97w3EaMSpyFZvPD0Go,27634
795
+ sglang/srt/mem_cache/multimodal_cache.py,sha256=23d34nWEDtgiOM6fqAhmkQ8-OHnrNR1-n8Ert0K0n3U,2147
796
+ sglang/srt/mem_cache/radix_cache.py,sha256=7NQHMUKjdKaAGMFdx1z0pCPBPvwux9KcqymFRxFUAY4,28181
797
+ sglang/srt/mem_cache/radix_cache_cpp.py,sha256=PIJenIaR_ouY-pAmyYuI84KY0tDaLg6VAPvKBaNttPM,9663
798
+ sglang/srt/mem_cache/swa_radix_cache.py,sha256=xYK1K6tgyUErhWvfTDfm_TWDRiAWbRNWM1Wd4LSzv4Q,43420
763
799
  sglang/srt/mem_cache/cpp_radix_tree/radix_tree.py,sha256=tQZpz-H6HxNAQe9mYqt6aX8mfDZyu_fbJTcCNK-Ns1M,7179
764
800
  sglang/srt/mem_cache/storage/__init__.py,sha256=HDzHFUVeOHlry7HlfL5tRd5HUA02N94p8uzA_Va8nlM,251
765
- sglang/srt/mem_cache/storage/backend_factory.py,sha256=rN8OfnkROk1rFQpJeCkiXMucuI--Ez35h4physV6Ys4,7822
766
- sglang/srt/mem_cache/storage/aibrix_kvcache/aibrix_kvcache_storage.py,sha256=kYqfXHdWwmL8WPZ9Z5RtwPzKgb0Vq-QOTE-6YXndd5U,5463
767
- sglang/srt/mem_cache/storage/aibrix_kvcache/unit_test.py,sha256=X7-GU8X5-t9adyVuD09obHQUo8d_Rfu--7R0C631p_g,3718
768
- sglang/srt/mem_cache/storage/eic/eic_storage.py,sha256=V2isvEuzCsEZd1XzYFlwIyLbOm0P6rs4QXVqCDjRcPs,28628
801
+ sglang/srt/mem_cache/storage/backend_factory.py,sha256=ItY0f0YY7fto-oW_yuRxE7lxsv0e6Y3qnWCjgtr2BWE,7859
802
+ sglang/srt/mem_cache/storage/aibrix_kvcache/aibrix_kvcache_storage.py,sha256=0n8jH9Rrcv73X-qcQnaM4ozkb35UMWdxkmeBGfl-O1A,5573
803
+ sglang/srt/mem_cache/storage/aibrix_kvcache/unit_test.py,sha256=asSKZdmlPYxrEzQOqsscfx7fpzV8ueqYwO0npE20otk,3420
804
+ sglang/srt/mem_cache/storage/eic/eic_storage.py,sha256=UVPr5gMfm8TxaxRY2eYf9CsB8JM9VKVO6pI6MrpCvH8,28534
769
805
  sglang/srt/mem_cache/storage/eic/test_unit.py,sha256=PfNPpL624t23tyVgtmS5F1pGiuWDMrC39ZD6ZbkN828,3607
770
- sglang/srt/mem_cache/storage/hf3fs/hf3fs_client.py,sha256=le_iTE5HZAbQNToa5E_dq_3U5ztu60ej-58tmzRtndM,5245
806
+ sglang/srt/mem_cache/storage/hf3fs/hf3fs_client.py,sha256=3xG0dV5JmnbIJ8kB1_lk8jAeqshOcU7tXES27ldyb8I,5228
771
807
  sglang/srt/mem_cache/storage/hf3fs/hf3fs_usrbio_client.py,sha256=6oH4v_WF_pKH4FMSr252v6QPhBCnRHztHqzuS8j6_QI,5323
772
808
  sglang/srt/mem_cache/storage/hf3fs/hf3fs_utils.cpp,sha256=dDYPtxmL6OFhEyv_GuTgzkTDpBjcD0EK8kphnn7eaGc,1133
773
809
  sglang/srt/mem_cache/storage/hf3fs/mini_3fs_metadata_server.py,sha256=lJ9Jp2kOgQQaUihxlO9l-W8fYfOMa1h1y0WAtzzFGLM,17850
774
- sglang/srt/mem_cache/storage/hf3fs/storage_hf3fs.py,sha256=IeEc09wmBI5iRnN3rUSyfBxlFeHc92hHcA96dGRgCgM,21351
810
+ sglang/srt/mem_cache/storage/hf3fs/storage_hf3fs.py,sha256=MI-x2979lvJL8d4aJluTCx6DofIe0tkLTNbrAJbV0FI,21514
775
811
  sglang/srt/mem_cache/storage/hf3fs/test_hf3fs_utils.py,sha256=g2h0Woa2CK39pRTigHCVR_hq095dTaC70lCIAIs9THM,1089
776
- sglang/srt/mem_cache/storage/lmcache/lmc_radix_cache.py,sha256=AdujdsJ_3ODf11O0LpA59X6yWWJLPQELelxE4hKU5-U,9925
812
+ sglang/srt/mem_cache/storage/lmcache/lmc_radix_cache.py,sha256=pd5NC37FORcF-yHmOjbARZGGPcpc-Xd3iu3KGjgYnc4,10009
777
813
  sglang/srt/mem_cache/storage/lmcache/unit_test.py,sha256=DCSZDMJAe-HehL9hWzsP759pck36Q-8ijxWZKfgXmA8,3590
778
- sglang/srt/mem_cache/storage/mooncake_store/mooncake_store.py,sha256=OWHraCjil547NYf6SjTrB6dteznqJL8kPoCFA1DCgwc,16885
814
+ sglang/srt/mem_cache/storage/mooncake_store/mooncake_store.py,sha256=j4KVka-45-RaTnBoGLS8BQnGTxnTLPDOaT-jrFriPKg,20216
779
815
  sglang/srt/mem_cache/storage/mooncake_store/test_mooncake_store.py,sha256=6TiqbzEIL71DC7wL1B-Q-SMMZRYsz08sg-dZYeMzmAc,4930
780
- sglang/srt/mem_cache/storage/nixl/hicache_nixl.py,sha256=bau9Jsp50lpEiy_osgb-dYzeoUkPWM03x7Q8z2BpKaU,9920
781
- sglang/srt/mem_cache/storage/nixl/nixl_utils.py,sha256=KXkwMrbWwIOUOASINnUo4HyheiMd-93smmwGLv0CacU,7463
782
- sglang/srt/mem_cache/storage/nixl/test_hicache_nixl_storage.py,sha256=vENVvGAd3PqcQEFA812wPoSBYhRemLr8Sfh1LQa0INU,9609
783
- sglang/srt/metrics/collector.py,sha256=s1BpU0cLgG1nHWYH5Y0PT0NbqRVHIs_IWql-UxOEEYY,34078
784
- sglang/srt/metrics/func_timer.py,sha256=6-PYCeItVhsET6lc0BcFQfd0Tc3_wvJ8VHdp3mlWz7Y,3306
816
+ sglang/srt/mem_cache/storage/nixl/hicache_nixl.py,sha256=kfGOqJPtq_kiLO2m_bDMFGID9iO79D8iBWadPIgsanY,10911
817
+ sglang/srt/mem_cache/storage/nixl/nixl_utils.py,sha256=3ouXVNJ17nilYF5gKDqphWux2sHqdqD5ztusCv4aP9w,7457
818
+ sglang/srt/mem_cache/storage/nixl/test_hicache_nixl_storage.py,sha256=Jj3o2zkPZBBUYzbQeHWV1ujjlC70GYHXmQL_SPStp7Q,10031
819
+ sglang/srt/metrics/collector.py,sha256=Qvwsn5POBDbxsaNRfjwssLszdACtxNeIojq0zfy8O4Q,35327
820
+ sglang/srt/metrics/func_timer.py,sha256=Om9o4svdyPfUpgcwMt6tL560qmbPBQvkDPhPzTwCmvE,3300
785
821
  sglang/srt/metrics/startup_func_log_and_timer.py,sha256=PRVg3Z2d5GBMFifZXR-VhzGcn9nmKTkqEU41VJKZmaI,4937
786
822
  sglang/srt/metrics/utils.py,sha256=MGb3quRI39n4tgJS1e0UHI5TBX3D0MwsgiZFMW2EsSQ,1903
787
823
  sglang/srt/model_executor/cpu_graph_runner.py,sha256=ypp5yIW2OhRX-Xmido5mWuzEFpd-ohlq2c2wEuSW71I,23415
788
- sglang/srt/model_executor/cuda_graph_runner.py,sha256=GcD2FkWG6CJRO3A23HY3Cu24ZE2c2MSpCD1NbtoLLgY,34348
789
- sglang/srt/model_executor/forward_batch_info.py,sha256=834WSjXwpIeHGTgldRaBJ0R-YIjr8bops4YMzTHi9t4,42236
790
- sglang/srt/model_executor/model_runner.py,sha256=sTRCfbndxVaUXFOaBUy9u6VPOoFFZHvm0_RBKuBF2Y8,89531
791
- sglang/srt/model_executor/npu_graph_runner.py,sha256=HstTsIQF2QHCPMQH_AxKOu1Ulykw8q8Cpx7Q-u9Kq8I,3673
792
- sglang/srt/model_loader/__init__.py,sha256=_1Y5sUZGxEEG_bmvLbSgYGa__qO60_d0blGB8sIdOgo,1020
793
- sglang/srt/model_loader/loader.py,sha256=MhrqysDMxBTAuwoLbYyCfLJOluk_KSZWPhgiD-rP2Cw,64789
824
+ sglang/srt/model_executor/cuda_graph_runner.py,sha256=hz7y3q5J7e8lnDhDPxiJIGvtGG7Ws0Og8ztbaZ_mqXw,35580
825
+ sglang/srt/model_executor/forward_batch_info.py,sha256=9SsVdDZfGIF-HFm3ulEACjhj95tHQhCzVfe3vzUqZV4,42612
826
+ sglang/srt/model_executor/model_runner.py,sha256=ocjmkK3yKz_z_EAd6sgOZ8xd8qzmpw9f8G1004Ew-L4,100592
827
+ sglang/srt/model_executor/npu_graph_runner.py,sha256=B1YQla4jW9PiciBBisKg-qoC-vmnldRr8ut_aSmUB-E,3664
828
+ sglang/srt/model_executor/piecewise_cuda_graph_runner.py,sha256=-Kb1XILyAxRTbHgT2SzV_BLW-L161eg7vgPiOF1Wrpw,21992
829
+ sglang/srt/model_loader/__init__.py,sha256=Y4gehllriF0JNjly4rGhQPSkUrA9u9Lr-WbfZfBIs6k,1034
830
+ sglang/srt/model_loader/loader.py,sha256=73Pd71im3E56u9SCZmrMgeq5ZJxadeb-ENIIQW4LW9I,80809
794
831
  sglang/srt/model_loader/remote_instance_weight_loader_utils.py,sha256=_HnQD1Ab-Wv9oATOmwJe6aQaQD_Gs_yG9EsDCGJQWfs,2881
795
- sglang/srt/model_loader/utils.py,sha256=KrOpyd_eefZC3zFnhnwxIKNTx9G-MmA6jIK3NQbTW0E,5002
796
- sglang/srt/model_loader/weight_utils.py,sha256=QbeiJY8VXIM1iLdG8X_JAjuy37mZzAUQzhBY_HHsxMw,44383
797
- sglang/srt/models/apertus.py,sha256=UL2Rd1TDDXPb2N4rWyymI3JThG7KlrGIyBuDIFCitPE,26002
798
- sglang/srt/models/arcee.py,sha256=Q6fujRESEnljzs8ls3XGsPtWxzfKfUa0QAvAekYzeBY,18981
832
+ sglang/srt/model_loader/utils.py,sha256=cfMXqVGRppD7CglcFqdMzwhCeB__FHWovYN0IBqkMuw,5001
833
+ sglang/srt/model_loader/weight_utils.py,sha256=O8cdxYdEjMyXgZT0Jz0PdagQGnIgPwnSvAWsyovOHsA,45019
834
+ sglang/srt/models/apertus.py,sha256=Wuz4H8EQUMlqlcCTM3Fe7E0lE0eodb-cX9us1avQxwI,25937
835
+ sglang/srt/models/arcee.py,sha256=O5yGtgAeIdcmYwZNLURWVE6Hu1O0k34gNiUEtux8ozU,18966
799
836
  sglang/srt/models/baichuan.py,sha256=HbvlErnkCSK4pRQYCSDxMcrn-1DQyfiNoeDcnRrJas8,15807
800
- sglang/srt/models/bailing_moe.py,sha256=IbG4BCgll0f5LUPkKZttizPU2wbtV5E9-dciUmjZ-EM,37726
801
- sglang/srt/models/bailing_moe_nextn.py,sha256=ntuaXP8PXc_X_oqmd4fp_FzpRmnajKoWQynXwjsEN5M,6000
802
- sglang/srt/models/bert.py,sha256=ODJe8YfNRP-hHsomFWk4_QpcuiSsNfjzGf256EDS0Pc,15802
837
+ sglang/srt/models/bailing_moe.py,sha256=Av6psy73-ZzsHnYLI4OTFshDVvjWtitGn_KQ_CY0fjQ,36313
838
+ sglang/srt/models/bailing_moe_nextn.py,sha256=rzHElrOiXJTV90khQUdx74u4RTXXu07_JUIY_zTRbaw,5930
839
+ sglang/srt/models/bert.py,sha256=2aUAVMT-43VGIbrI8keRBZZdCMOi5PzssykHO00zT94,15791
803
840
  sglang/srt/models/chatglm.py,sha256=cajLN9caBl09e0TwOFkiTTKDqwlbmHo_yS-NCjdeQW8,13957
804
841
  sglang/srt/models/clip.py,sha256=kOPSXnmgH_QKu2-ENn49HLDS9yf7Gm1HCOE_YvoNhlA,19858
805
842
  sglang/srt/models/commandr.py,sha256=5Y_b3K0QY7D37nFGkyiGgY38RleRui_GJUYcHSuHUZo,15315
806
843
  sglang/srt/models/dbrx.py,sha256=117gwrB_o8VlACwDH5YlXkPfuS7t2Mh-nyJvpNpIYxs,15903
807
844
  sglang/srt/models/deepseek.py,sha256=M7nyHcAbTIs8vc1g6u00oy22-pp704Xp4T3clBzu4xM,17460
808
845
  sglang/srt/models/deepseek_janus_pro.py,sha256=td8xGs6ARfJ8AQCYwUhMOZoWigrAs7m3trF5-kXCqik,70418
809
- sglang/srt/models/deepseek_nextn.py,sha256=QRcl5mWGDbYblV1dmo8MxPVeEUQQ_UhXumB5FEgj4M4,6255
810
- sglang/srt/models/deepseek_v2.py,sha256=K6QdBihJEF64gurObwIVfJJ2icJroO538D2LQvSmoBw,132581
846
+ sglang/srt/models/deepseek_nextn.py,sha256=B-Xk9mh7op-Gx42yJKV353yzWzL68iwwR08r6jbNZ6A,6710
847
+ sglang/srt/models/deepseek_ocr.py,sha256=WAPLXeg3S1UB3x3iP-tiandHk5AEnCUMeMs0ak302Gg,52416
848
+ sglang/srt/models/deepseek_v2.py,sha256=EzPUoRGCcBoJIbZ9s_XztIVikp7FSNsTv42qUBzHoNQ,139536
811
849
  sglang/srt/models/deepseek_vl2.py,sha256=7X3gI4DE7guUtNJvMLf06jO8MUHKa2Aan8evZg5hsXc,13061
812
- sglang/srt/models/dots_ocr.py,sha256=Dr9O-VBY1aSOFoIzEKcqs_QKRipjs8OQTfKrO5fJd-I,6792
813
- sglang/srt/models/dots_vlm.py,sha256=0tbeQHbJryUMVqEnWelawDabzhcdwSj3Bb9-nj4YOKs,7242
814
- sglang/srt/models/dots_vlm_vit.py,sha256=K6QzcHx38XAq9fmNRJ-iApScZ9FoV0lkn3JYkRsxplk,12044
850
+ sglang/srt/models/dots_ocr.py,sha256=sWkFsENjX5b_CecLCqXjepsr6iyyCbNTmjZbRfoB4ek,6683
851
+ sglang/srt/models/dots_vlm.py,sha256=3uLSXO7W8UPKU7a3ixkC_gwSVDGYecCHK0kZAoD6vNs,7192
852
+ sglang/srt/models/dots_vlm_vit.py,sha256=JhX2E0UmjhdelDvR46-_ns5GCYsfnEpeqyDb9NNKUh4,12058
815
853
  sglang/srt/models/ernie4.py,sha256=3z14KFdYLR8J-zsm9oO1uBUeLlWrlkHoFKEYvKKJLKM,16079
816
854
  sglang/srt/models/ernie4_eagle.py,sha256=E7f-ygCcY8pIoyTMKFyVC2uRcG59-_RaQTO4gd5_uWI,7223
817
855
  sglang/srt/models/exaone.py,sha256=TpO-rtCpEZ8Ua7hGFnS8l2oAYhY0Pij50grc9WQ2mvc,13576
818
- sglang/srt/models/falcon_h1.py,sha256=vtFgy-P6Jc6VoUibjpLNDi7633rcw61Fdyo8RDabiUE,20825
856
+ sglang/srt/models/falcon_h1.py,sha256=UQZ8454btjoZ1kbktaqtIjHY1xdvaUZ1ZRnZZ2APlg4,20759
819
857
  sglang/srt/models/gemma.py,sha256=2atKwFN5wCsJCmBRmURX9vaCcFjxlFirL7xsnG5KPlI,14180
820
858
  sglang/srt/models/gemma2.py,sha256=n2s3WLGVM3XDvOXwbi_h7tgeh5SDDv1VvifH680DmV0,16785
821
859
  sglang/srt/models/gemma2_reward.py,sha256=V8U3_ADUHWPdOwvEe1jhGW-oJmBgL8t1TY3-67Ksv2A,2618
822
860
  sglang/srt/models/gemma3_causal.py,sha256=o46BNbaiOeoOv2xVU6-lWZhrrjyGskdebve0_wviWfU,27338
823
- sglang/srt/models/gemma3_mm.py,sha256=r4r7OcYqKE-ZpDBuPZCF4TnLmG10MCwXupKRDR3E76w,17195
861
+ sglang/srt/models/gemma3_mm.py,sha256=9JpkNj_u-8Af9RJJQbUNGOxWmvW3TbXUceoI6omb8jc,18030
824
862
  sglang/srt/models/gemma3n_audio.py,sha256=isgKfjA5UieYawxU6medL2ssXlzYPqAbagDBnLcemC0,36405
825
863
  sglang/srt/models/gemma3n_causal.py,sha256=kBDlpSWAg6ZDmUPe08Q7sj5CbdVD_0h07zwJw8sKu7I,36335
826
- sglang/srt/models/gemma3n_mm.py,sha256=94QLW3FfAcqhz0E-gti8rTizTL9ci6CjMTxYOv2vHac,20371
864
+ sglang/srt/models/gemma3n_mm.py,sha256=Il5LHjZdbHEXueUVdBp5lpSJHt56W7fpfPHD0Y7RED4,20301
827
865
  sglang/srt/models/glm4.py,sha256=dijzVTTgg8zyJ3gga95MKY0WwqwnuAaf-VIV93OFAmc,11433
828
- sglang/srt/models/glm4_moe.py,sha256=_H_ldIZCuR22kQJ-5wZ3D-NW8rg7Mi8crSzWdBGO_RE,42037
829
- sglang/srt/models/glm4_moe_nextn.py,sha256=pE9G2xr_hLBu6PpvWlyTVZ1BP_Eax2bVqwFHLv2d7kY,5962
830
- sglang/srt/models/glm4v.py,sha256=gn2a4Sb_txTKOguYIzIgw_3DQX8IG1vhJMulh2gfvPs,23761
831
- sglang/srt/models/glm4v_moe.py,sha256=wXbO-C3Kx6CEKGbzcs7CfdgH5giLjgrDDjJ7Nq7_rpw,17396
866
+ sglang/srt/models/glm4_moe.py,sha256=plEh-b5C2az6MMNF5hotXIusJAEdXOZy7KTRd4EIRLg,41209
867
+ sglang/srt/models/glm4_moe_nextn.py,sha256=fWuDWY8nwnHBXpdEYkhyMcBkUByIrBZvEMdLEtsTVi8,5947
868
+ sglang/srt/models/glm4v.py,sha256=LwiFQxYm2ksmaePeO57i5d4YGQjiQX52e-Dsjyh_P7I,23834
869
+ sglang/srt/models/glm4v_moe.py,sha256=MxuF0pFf2frKPCp4A_2YmrXx_uvZzOFdA4hVJFbLY6E,17375
832
870
  sglang/srt/models/gpt2.py,sha256=kclhxEs8oJk1KCyhmAqo7rZqecVGGHYkc-a1WZi3aIk,9841
833
871
  sglang/srt/models/gpt_bigcode.py,sha256=1D6bi8Zu760gCRZkvdLHFcg8kCkY35ARwQYaMDtYhl4,10307
834
- sglang/srt/models/gpt_oss.py,sha256=7cjyN1v2cxP9vZNrMqeDorX20U9_I4YcSpz_b4x0zj8,43720
872
+ sglang/srt/models/gpt_oss.py,sha256=K9g2c9xTE2eM74isijM-KSvGPHt6Cjgjl8L8EzBTLmM,43711
835
873
  sglang/srt/models/granite.py,sha256=8q92shxVPAp_cJDohJATffSGd7Z0Oi-vF5jpY6DlK4s,19840
836
874
  sglang/srt/models/granitemoe.py,sha256=j1rgZ62CbBioECjUblDCw_NneDQgY_QJODsI0fqXVO8,13779
837
- sglang/srt/models/grok.py,sha256=8KCR13LtdnhswJrIwgb0sdFW0OxCA8GQ0fbN8gb856E,40518
838
- sglang/srt/models/hunyuan.py,sha256=RSZErx-Swt65kmfvSXJQJJ6KhjucuNY4UUVLWC8hWaA,31102
875
+ sglang/srt/models/grok.py,sha256=qEuuoVg5aaVGPyjuYvx_rTRcAiUToDNv0IQ8XbCXOr4,40021
876
+ sglang/srt/models/hunyuan.py,sha256=i4RUEDDwvflGV6hciBjTS46G10ew0DJcmaUpONkxlF4,30950
839
877
  sglang/srt/models/idefics2.py,sha256=U3khd3hbdawJeRNXsxmaKHdssOCT5TPOZ1D-2_zHoQo,12079
840
878
  sglang/srt/models/internlm2.py,sha256=F_iNY1gUqzAjAuUatcE47gnrcoTh5_08PY2Rw9tKr9M,13150
841
879
  sglang/srt/models/internlm2_reward.py,sha256=ndfGmyqYZbVZ7C7rJ-v9oK3wa-EpoBGybS8MlyKZi2E,2522
842
- sglang/srt/models/interns1.py,sha256=E4SyJWocXZ5rAuAV8kj569OHo57r04W4hmq1CF6oiFs,12516
880
+ sglang/srt/models/interns1.py,sha256=VZAGsvjkjPhdUvvLuSy9qV40KXsBTy0KdiXg00EeOnE,12450
843
881
  sglang/srt/models/internvl.py,sha256=iQm2wDtkcyjPYoV9oY_jQ3_7WvhP315eP_vZEiQX3uw,27062
844
- sglang/srt/models/kimi_vl.py,sha256=XulRiufQzOSWZe8-bUl2OEdznvsVU9OBsEYipaX3YkM,12877
845
- sglang/srt/models/kimi_vl_moonvit.py,sha256=0X07KnCsp9m8ZxVpdMSDSMH_yDZXkToIjwDtoyGX0Mo,23894
846
- sglang/srt/models/llama.py,sha256=ZQc5XgkAtgr4etZ8tVp1B_hTk0pz_IehkVlCoaI5BXo,28263
882
+ sglang/srt/models/kimi_vl.py,sha256=Tm0-cZXzD3FNW6YEoAFGqCX7ExW4hni-RGFsK3GOCcg,12707
883
+ sglang/srt/models/kimi_vl_moonvit.py,sha256=qtS8ANHYJ_VPrnzg7oSN30nGAnxfn6LA7xQ8GPH9uQM,23939
884
+ sglang/srt/models/llama.py,sha256=Et_i6a1A3TL0pS6ccD8NIOiBpqTxjmSMl1KUQsAXotE,28248
847
885
  sglang/srt/models/llama4.py,sha256=i4-Vo5FVE9zf_6Y80dyft5VjPOQ-a-xWYfEV8s-ltKQ,19872
848
886
  sglang/srt/models/llama_classification.py,sha256=4QWTFaUZIFKYZvEzs8bx8VkOZNIwdYCLrnwrdAw4QK0,3108
849
887
  sglang/srt/models/llama_eagle.py,sha256=Ubh_jmtfiOnriwvHgQT0ZGID7JvYvdSi_QGHOIkEgPE,5028
850
- sglang/srt/models/llama_eagle3.py,sha256=lutyS4UaPg5QussPu08En3iO5e1lhsSm4dBXTm4R_XI,9201
888
+ sglang/srt/models/llama_eagle3.py,sha256=yezjnua5fBjTwJT2lKmybn0uAE7dKOJtazN2fWxqY_k,9182
851
889
  sglang/srt/models/llama_embedding.py,sha256=zq-_lNu35VBFc7eemiam0zdkGIE8fzrgk5OWYfirZnA,3254
852
890
  sglang/srt/models/llama_reward.py,sha256=LF2nqMV5XOrljGjAwJg43mBv3z6Q040I2EYlgZeCp8k,4681
853
891
  sglang/srt/models/llava.py,sha256=xzYip_BAwpzSIdZre43LZiyTpFISa0ZCLdO6LUSbaCg,37702
854
892
  sglang/srt/models/llavavid.py,sha256=-CSk0RJ2MQeb81sh-RISeVJFaI-XWY6nR6_I594MkME,12818
855
- sglang/srt/models/longcat_flash.py,sha256=g_WX1UQgvkAtGGkw0Zk5NmDU9ew35zWKXn50CptKsh4,41016
856
- sglang/srt/models/longcat_flash_nextn.py,sha256=MdXz-KDjvNexD1rT3tSjVCgAe1p0G24HKkO613fIG2k,29605
857
- sglang/srt/models/mimo.py,sha256=Mp-iFp4YHuiuq-H8enUF5K5QbMnVcvEa6mURH6vM3yM,6140
858
- sglang/srt/models/mimo_mtp.py,sha256=jSmqJAXu7G3OO7jW1oa2suI4H_Yl7u5ZT7w4lHFbHhg,7292
893
+ sglang/srt/models/longcat_flash.py,sha256=CjlGMrV5IYZ98DoCByiN61rVn2CFtVKEEH7oWNp0OwY,40507
894
+ sglang/srt/models/longcat_flash_nextn.py,sha256=tbM7UYNs8iP_N2SN3tgP1GA3S9oEEq9KDkVPV-DF4hY,29353
895
+ sglang/srt/models/mimo.py,sha256=TdiflXteo_HLH7Q1Yf6xDAOXRzNrOpLR4kjVXMueltM,5662
896
+ sglang/srt/models/mimo_mtp.py,sha256=HbdSi0ZXW30YfQYhubnU6JmUI0zceJLvRjI2ptmqbVw,7251
859
897
  sglang/srt/models/minicpm.py,sha256=CzBJyZtfMpp8jvlEl29DHI7HLVq-CxuqP1UHwxIbaUI,14567
860
898
  sglang/srt/models/minicpm3.py,sha256=Cflu4Tb2hxpjapRBZ5n4kX8a1nnFwffK-M8uHPRUra4,19276
861
- sglang/srt/models/minicpmo.py,sha256=st8I13Ere5RkRHHQQN1LgZh1ybUA3_buxaaE4XlV8ag,76123
899
+ sglang/srt/models/minicpmo.py,sha256=1bNtbJM5wbMjV4ax8gesVsYVbMz4ozaIHAvvi8_d0iE,76175
862
900
  sglang/srt/models/minicpmv.py,sha256=_CnCR2y3RaYxhONAKFpBIuPQBrqn9Od4o7QnJw8CLR4,35884
863
901
  sglang/srt/models/mistral.py,sha256=ni7PppA_5X4ivTnIps3yoEaMEL-G6Gaf9b5hGC1vU5Q,3475
864
- sglang/srt/models/mixtral.py,sha256=ohZVFJ75QWuE2kBKD7Sd4fcx9YbbjA7JxnYAsOIfORU,17166
902
+ sglang/srt/models/mixtral.py,sha256=bZdsTw4A3B-MIHSR8U26mBv3sLYkawVM4V1VXEyBrmE,16992
865
903
  sglang/srt/models/mixtral_quant.py,sha256=UUIq7lpUonD9IoGePyl59oJYEcVwT9wUXvtVp5tjQ9Y,15406
866
- sglang/srt/models/mllama.py,sha256=OdX7brhyfGiMFPulxF77QOUi-Kcscg3Qo4ipyxzs9yA,39670
867
- sglang/srt/models/mllama4.py,sha256=ux93c-eLcG9LuL91f0euYHcMtYUt64VYmWXOo4JRzHQ,36255
904
+ sglang/srt/models/mllama.py,sha256=mMhDrLd1jJ-4lwMMHKRC5Uzcs3kWdzRJJzdjhQN4LOw,39671
905
+ sglang/srt/models/mllama4.py,sha256=z6YKfmHu0lJ-oyALZNlL9-EcHzFvNgkxWU_mURyS7z4,36694
906
+ sglang/srt/models/nemotron_h.py,sha256=clbTirOxve6yefRaf2eE0dT0IqhPDfknOtnsAEsnZOM,17904
868
907
  sglang/srt/models/nemotron_nas.py,sha256=CoSAKqlbej4Xe30uY4w76iASBqeuJf8-imisDK00zEU,15964
869
908
  sglang/srt/models/olmo.py,sha256=7-q_fA6XXdG7kPUjpUzYkzMUWJobuSjhqjYw9xSUs_c,12671
870
- sglang/srt/models/olmo2.py,sha256=azmljhJF4ivcQfUtfsAUxq3ducE4tRKTL6iwe0IKYMg,14327
909
+ sglang/srt/models/olmo2.py,sha256=zprucQEogxPV38E_IU0edcTYP-d-dqLVeTmt2kRLznA,15448
871
910
  sglang/srt/models/olmoe.py,sha256=zryYUQEhEdhd6xcR_HyLV7gHCcKt-HWHeEeIUqmhmcc,16100
872
- sglang/srt/models/opt.py,sha256=1fdsQU7yXSN9HEWb0ZVdiAF8wLzAunW4XomIrlHyu2o,23476
911
+ sglang/srt/models/opt.py,sha256=-nCg_g2I84JtJQ7Fhh2eyp1cko3TxxicheM7gGpX0A0,23415
873
912
  sglang/srt/models/persimmon.py,sha256=86Duo3HiZqDj9O2UzWbJgUEhQOXzGBUdhUofQhcs1VE,11244
874
- sglang/srt/models/phi.py,sha256=n6A1d47MvnR1lmSsZ3TuzXk5kT1Lntj_YQ5uNvR0s5o,10287
913
+ sglang/srt/models/phi.py,sha256=tnhdiD_zo7KeHMTI8UxDfJN5brpHSAaKPSN-2e2iGk0,10280
875
914
  sglang/srt/models/phi3_small.py,sha256=eJb8aS_3KLObrq3PNkoIyVHaQ6SZTAJe42rbpC54QKg,16012
876
- sglang/srt/models/phi4mm.py,sha256=TKOFM4k8o_JGwYM5mBb2hHbbOMLjbveu5izIHCbT7ug,20617
915
+ sglang/srt/models/phi4mm.py,sha256=Pe5IjZcu7N8w_UmEXO0Mb98-tihc50ih6y5cS7b6BIY,20597
877
916
  sglang/srt/models/phi4mm_audio.py,sha256=0ChekwoYudAnbY0-JyNwz_inzMlxM8FmULqR9mwkPhQ,48877
878
917
  sglang/srt/models/phi4mm_utils.py,sha256=bW3un4x3SHDvSkAOHQEFO286FGdOPeKhBpJCOmNlC9E,66956
879
- sglang/srt/models/phimoe.py,sha256=EGaKFi02MZP20qFrILA4o2SJ0wb1HoJagFTSqVUbJcQ,19223
880
- sglang/srt/models/pixtral.py,sha256=ZkZrV0mEfmbBdgRko2AvsMFZbAVskgp_5a5p1xCSRN0,16835
881
- sglang/srt/models/qwen.py,sha256=j0OU3JjznWi_TbayI09yYGM-Obov6mQzJO82Hs0qBGw,11868
918
+ sglang/srt/models/phimoe.py,sha256=cZQIGjEvArPDiJzC3uKYje-o48QZC699P8TTLwfVIas,19172
919
+ sglang/srt/models/pixtral.py,sha256=H378jvdhwjgdAuUszhCe5tmcEPYvw2YPhg_d8QrjLZE,16776
920
+ sglang/srt/models/points_v15_chat.py,sha256=HV_GRgLTcetKh0B2agJry02N_atcWI5NPjjQELarUGk,6415
921
+ sglang/srt/models/qwen.py,sha256=_X1mUt_MczEE2jFK7rfGyRRtpd4U93jdD1SVpCTNsns,11856
882
922
  sglang/srt/models/qwen2.py,sha256=kHNZCtT0jnQXC2aJN7Bp1DzaEzKWuhUAGL3hAmt8OU8,23598
883
- sglang/srt/models/qwen2_5_vl.py,sha256=rMmmoc1ba3GjIE5bfcaEBSh62hNuBZT0tlEpiY-9N8Y,25031
884
- sglang/srt/models/qwen2_audio.py,sha256=Q6zUfBdUTXDa7qx_aDVw6et7wonJsvBbrABmxLa_1YA,7782
923
+ sglang/srt/models/qwen2_5_vl.py,sha256=X7Hh-75gsoGqaK2iJg7eBUFR_8qwJRLhhkii3yxc-KA,25084
924
+ sglang/srt/models/qwen2_audio.py,sha256=Hr4j9W-q23XjQUX4kk1NxUGA-EQkj8AKDqKVK741TjI,7097
885
925
  sglang/srt/models/qwen2_classification.py,sha256=dGrMm4ebd30_lBhHOhaV57ig2iOTx3nqB4GEzsrRIM8,2747
886
926
  sglang/srt/models/qwen2_eagle.py,sha256=6spFg6JYQGeUXLv2Q5eMkVzZvnqGyvW6SdVBtFMxlTM,4806
887
- sglang/srt/models/qwen2_moe.py,sha256=LfqgHflkQFhiRVSuRnKBaCHW-zf4HKRN7q5ZGm6bGl8,30854
927
+ sglang/srt/models/qwen2_moe.py,sha256=-pkURmqiLazr7oq11-3hQCFKrdj1crx30Z7iK7DBs90,30920
888
928
  sglang/srt/models/qwen2_rm.py,sha256=-mQXDEv11p-I1HXgYLTtY6ROem6UYorO958WsDrzsgs,2837
889
- sglang/srt/models/qwen2_vl.py,sha256=HwNc08L3zgVfpD59QFcyrDefbems_dfLgapJpTBRhRw,21372
929
+ sglang/srt/models/qwen2_vl.py,sha256=xV8s6kgyjZ37SqLi9nF9J6n3gq9piUmlXOe2PVPQqjI,21488
890
930
  sglang/srt/models/qwen3.py,sha256=2OSKkk-AdIpg6ZnNcQ9tqZLlF-VH-QxncY1J_g8k-bc,19637
891
931
  sglang/srt/models/qwen3_classification.py,sha256=bdjAylXJCjXKjAho74nmtIMpEG0Af98N-aZQ-pKKMY0,3262
892
- sglang/srt/models/qwen3_moe.py,sha256=AcOGpft3b-p31LII8jA2sRDK497fIicxFNIDGQbKG28,34083
893
- sglang/srt/models/qwen3_next.py,sha256=nvQ2VVUNjHvU5cxXgx5Bh5EWMtkPMfHPYP9Ni45J3hI,37364
894
- sglang/srt/models/qwen3_next_mtp.py,sha256=F-NnFGer8KxijNKIZoKICDfp6iFwct-XV0-q0KxAApg,4465
895
- sglang/srt/models/qwen3_vl.py,sha256=2kFQAZ9yq9GNj7aVF9ktyghsTFtNOyHczBYLNF2X4UQ,29368
896
- sglang/srt/models/qwen3_vl_moe.py,sha256=Bvx7dqzg0XzipiYqioCtVkwqxGSh8Y1zyvbMQ6D7HL0,18625
932
+ sglang/srt/models/qwen3_moe.py,sha256=W27Yaut4mNOutT91D31MxaLfAPXJF9jItTmANkFArCM,33363
933
+ sglang/srt/models/qwen3_next.py,sha256=hbIiLXcPBNa41lRnqZqdXa7Q8FDYX9JlaviXIZN_BEk,37279
934
+ sglang/srt/models/qwen3_next_mtp.py,sha256=nua9MgSa0_2Dz2Zju0chk6VXGDndBqr-1xMQ-_OirTU,4387
935
+ sglang/srt/models/qwen3_omni_moe.py,sha256=X5dB2zB1LAAD6_baK84y6MGvEm5ArgcFDmarUyoaS9c,25444
936
+ sglang/srt/models/qwen3_vl.py,sha256=fNTKorRODMDFOkARN0vcC8sLrcwLZlLpNCf_JQJKohM,29489
937
+ sglang/srt/models/qwen3_vl_moe.py,sha256=rY87FpfVOpHw0PuYu7l5nt3sFdSIHrn964XLVQjLyLY,13708
897
938
  sglang/srt/models/registry.py,sha256=BpYy-E2m5jPmCNmue_o3G9lCQza1ge7ftmTJQ78pFGc,4276
898
- sglang/srt/models/roberta.py,sha256=3k53V2Gbezk3jU-D03thXx8csGn5DxFK01ZQ9WFiWPI,9828
899
- sglang/srt/models/sarashina2_vision.py,sha256=P71n-U3XqUcavrWNBAjpQ2V4P1fkZJOKMOqrIvfbNSg,10945
939
+ sglang/srt/models/roberta.py,sha256=h5lLKiLIjBxYEFgUORWXWdW6bJ8skKyFWNnEqVJXBt4,11907
940
+ sglang/srt/models/sarashina2_vision.py,sha256=tvH4Zb-U9pgcrxm_7Uurnmr5Xeo0xXcWYHuucIDseks,10913
900
941
  sglang/srt/models/siglip.py,sha256=DIVJRwdtpLD2QT1kVPIHw7Bn9BE40xJbkHujDNzkjgA,9892
901
942
  sglang/srt/models/solar.py,sha256=BM30Eyn5Ptc0PCA6Lx3Hn7LZ_fV05n0rVm0vY_ILv5Y,18347
902
943
  sglang/srt/models/stablelm.py,sha256=0x_31uIr3WcWwecdPAI3ek9KkyKBJS7VwknTk2y0gjY,12281
903
944
  sglang/srt/models/starcoder2.py,sha256=ts6LDIjQ2FVnyLk4s2K9COD01RRhewJDW-VlvoyAk24,12377
904
- sglang/srt/models/step3_vl.py,sha256=4j7drPJT2h-QwFH7tK7zR96xnuGvrxNbestuZsflCxg,35666
945
+ sglang/srt/models/step3_vl.py,sha256=QeU7RQ5YnU6FcAi4c-ICVABpM1PJ5E65w5XE3UJmIbE,35557
905
946
  sglang/srt/models/torch_native_llama.py,sha256=3xf6CzCiizJ8i94GIChpOLq9q64Xa519RtuEspPTZQk,18501
906
947
  sglang/srt/models/transformers.py,sha256=laA2h39MPeiAWKv4DEg0ydre-1pyXWFSRga-nwy1HUk,10244
907
- sglang/srt/models/utils.py,sha256=NNKR-N_BGXRxbO6hCSwcq9kF9gZXCOfFc_8PPyo_aFs,1748
948
+ sglang/srt/models/utils.py,sha256=yB1rHC9Xk6hTQ59Fy2ExdrtntuSn6vkm-idf3CFrYP4,2032
908
949
  sglang/srt/models/vila.py,sha256=3NiRHWOqXnCRjXmswAldsNtiE5zRILbScEsbhUzLZF4,9846
909
950
  sglang/srt/models/xverse.py,sha256=DsNVI9JpzN4jj0Ry6aTrj7r-xq5YLOoDX2kH4YLJA-I,14035
910
951
  sglang/srt/models/xverse_moe.py,sha256=nBtG_PAK8wcp1tW2l2Zby2oEOmtWAYzH5COH-_N5IAM,17072
911
952
  sglang/srt/models/yivl.py,sha256=oToK7-u5IGO7xwpJIQ7VtudlK6-zPqJX4bt6_wv0SH8,4850
912
953
  sglang/srt/multimodal/mm_utils.py,sha256=6bV1_a7Iet9W0y3qdd0E-hFM78zalIzNZCYbLzJX2y8,12640
913
- sglang/srt/multimodal/processors/base_processor.py,sha256=1u6ewRgHL-svE1JSZ95iJVDFZIslfvBZne_LDR8YMPc,24902
954
+ sglang/srt/multimodal/processors/base_processor.py,sha256=RAJYoUI8XGTa97rJKz72V0UzTMzfpKvU3206GjRJ0ZQ,25053
914
955
  sglang/srt/multimodal/processors/clip.py,sha256=5nXZuQYbyf-5mlqPwjhQrlWqxvswImWZQXivChsiHfQ,1057
915
- sglang/srt/multimodal/processors/deepseek_vl_v2.py,sha256=Pymag9f0U5L_bBOTFs2q94BbuPJ-VwqSixs3meO0nsM,2569
916
- sglang/srt/multimodal/processors/dots_vlm.py,sha256=1Lk8eE7y4g1Sdn_1CfR4EOI4deVHeJRlgHLmS7UUNBw,3533
956
+ sglang/srt/multimodal/processors/deepseek_ocr.py,sha256=ZuP-zHNjPV3-lb6NkmNIitwIiXtNopNIwOLPttLjBYI,1234
957
+ sglang/srt/multimodal/processors/deepseek_vl_v2.py,sha256=nKqWQ9PmtY66cMx0YhIHGPaGIW-VyPKt_KeRqFLU60c,2479
958
+ sglang/srt/multimodal/processors/dots_vlm.py,sha256=azazFc_lFj40NJKWf1X1MGgJ5FXgv2RlgVS-R6IhFdk,3521
917
959
  sglang/srt/multimodal/processors/gemma3.py,sha256=7aD6cR60iSC_MqjzdCDMAgtrb_cmy9YJyqLgVRClBT8,1986
918
960
  sglang/srt/multimodal/processors/gemma3n.py,sha256=mtmvBasOMxb3Y2NLZR02nMYX30RLUXhDYJ5uVOElr10,2776
919
- sglang/srt/multimodal/processors/glm4v.py,sha256=SQXatu6t-YgE8wNSavBRliN7J4DqiP57lmA47-zRlYQ,4953
920
- sglang/srt/multimodal/processors/internvl.py,sha256=Po3_Dv71vKJidyyTY-KJRzGtxU2mCYIsETtcg9GhDg0,9853
921
- sglang/srt/multimodal/processors/janus_pro.py,sha256=_4ltWmdtFjbh1VCMRbcgxW61eWIABIzHG-YgwHWaYq8,1471
961
+ sglang/srt/multimodal/processors/glm4v.py,sha256=EPPILSirXexpRkWZfIhxWGgWKZGk1q6eENZS5gWyfjw,4899
962
+ sglang/srt/multimodal/processors/internvl.py,sha256=vvOlWmJ4AzbXnDxHED1NkRgHQfOnZlmEaWMA3-1_2cQ,9765
963
+ sglang/srt/multimodal/processors/janus_pro.py,sha256=nd1v0--5733pOwWTpArnOHCfh4aHHVBUOJPOhk9rLd4,1395
922
964
  sglang/srt/multimodal/processors/kimi_vl.py,sha256=5i8KmGxnnDtQc7XqUBNyanAfGxhxj8iRFBFONHmpiFg,1565
923
965
  sglang/srt/multimodal/processors/llava.py,sha256=-YtDc_7TsMWmwKkD4KJZW2Y0jPFlZtbQ38K_N24hk0w,8231
924
966
  sglang/srt/multimodal/processors/minicpm.py,sha256=ysJlUaxcBcWjKliz5VmXKVv0ec4QWRHXZk4ga-hXVf0,5354
925
967
  sglang/srt/multimodal/processors/mlama.py,sha256=FgPm2JQzfPFDcGYDm0mqfDfO_eJKy-NiVgF-vId6w8Y,1233
926
- sglang/srt/multimodal/processors/mllama4.py,sha256=1YGETKSzMZIa7BOwq3T9cbsYjUcW5sopcpc9JNJ000g,1911
927
- sglang/srt/multimodal/processors/phi4mm.py,sha256=8GaUVpGucV4UKoa0XkxN0gDpMZax6UyCiRBX_QaJK78,3857
968
+ sglang/srt/multimodal/processors/mllama4.py,sha256=pYzqbuV9Hb5RMYNLRabTMIMTwL8C5SCToZdhSg403go,1653
969
+ sglang/srt/multimodal/processors/phi4mm.py,sha256=8Co-UPT8Am2P5dfW8bjZcy-pVAPqFXW7hbK8v23NMiA,3781
928
970
  sglang/srt/multimodal/processors/pixtral.py,sha256=Lx5Z-9NkovLDTHlRBznHxGn4r2XhDz8am2XpOskOVQY,3203
971
+ sglang/srt/multimodal/processors/points_v15_chat.py,sha256=n1lwAnAYk1xPhnZRpAtDDpyP8N7NlZGwX7Pdun9Kv50,1581
929
972
  sglang/srt/multimodal/processors/qwen_audio.py,sha256=xkIFrHepF8Ok6MB-1OwVz1BmzPmEPgUe8lIb0azO2Bc,2411
930
- sglang/srt/multimodal/processors/qwen_vl.py,sha256=3ZjxgINjukJ953Vj6c67v8_x0Kh_9xq-1jOgVO-mqa8,10983
973
+ sglang/srt/multimodal/processors/qwen_vl.py,sha256=h26WSDFJiXvyCmUxNwetjgDANxXoQGxocdd_uudC2Vw,13537
931
974
  sglang/srt/multimodal/processors/sarashina2_vision.py,sha256=E0KSOw_yzc7prHkQfMHS_DzOcYL1GZJ77NopVkd_V5M,3024
932
- sglang/srt/multimodal/processors/step3_vl.py,sha256=9OI6UW9ybGbAnYN_S-5jh7TN8BGM_bQkvh1AHBJKzAQ,18350
975
+ sglang/srt/multimodal/processors/step3_vl.py,sha256=2zNf1gT-fSrA88-cvkr6xJDE0sEWFKdBDUWsMiFx_uY,18330
933
976
  sglang/srt/multimodal/processors/vila.py,sha256=vWgV1lTdjiFiTR8w-7fC66-L_tpOOD59c-c9NljGelE,2192
934
977
  sglang/srt/parser/code_completion_parser.py,sha256=KFa95OU0TeVjJkOqIgS4xV3kaJ5dFWOmAAgISyc1oEc,3803
935
- sglang/srt/parser/conversation.py,sha256=cmVT4SCqRYxprYvmftUC_z_TkhXCqYC9B2rVZsmQe30,38869
978
+ sglang/srt/parser/conversation.py,sha256=r5Fp4BGNjGeuvBw7dAUt-aUl3ExsTSG00Gq8dS8_hj0,40089
936
979
  sglang/srt/parser/harmony_parser.py,sha256=YweG4azWm5jmzYGaAHEXSaORpgWctPpSGQk_jp5H-CE,23227
937
980
  sglang/srt/parser/jinja_template_utils.py,sha256=_rtLpriMmodo-tBD8B9ifu3BsZFdaQQCDPRUqF26pIg,8006
938
- sglang/srt/parser/reasoning_parser.py,sha256=3P5viZ4oCsz695rZULWnRKSYBJxouHjihdpZMBuY9yc,11159
939
- sglang/srt/sampling/custom_logit_processor.py,sha256=AwODYVJdRkcQ8PGtJrhzKsqAgn8XZLQbAmR9fGiQzmc,1608
940
- sglang/srt/sampling/sampling_batch_info.py,sha256=a-t8Al8D4x4DRqTnvmnTA4jHzOVp6JEFNJxUat7mDqE,15498
941
- sglang/srt/sampling/sampling_params.py,sha256=yRkiwoZz0OrmmdMn2v63O5qkbns3Gv9MonxKYvyYcKc,6690
981
+ sglang/srt/parser/reasoning_parser.py,sha256=Q5yC-Giug7fA0W5d1BarTKUWWFO5QUwtnonMeuDziOw,11149
982
+ sglang/srt/sampling/custom_logit_processor.py,sha256=phIOI0ttJHQ_yCZhnqD5qNs98QG0gdY9evbXkgS3544,4272
983
+ sglang/srt/sampling/sampling_batch_info.py,sha256=xlkEs3zgrwZCNBs69JHL3og9-jJnFbDD3_RLJJ-M36U,15544
984
+ sglang/srt/sampling/sampling_params.py,sha256=ULhZRhA9C1oK34T3cbwqaODV3iMX8HL1VOlo_gewzZw,9193
942
985
  sglang/srt/sampling/penaltylib/__init__.py,sha256=mtN8grFEcaBUhl4yBHmw8NNirt_i6uKO2cDNLHOpZQE,496
943
986
  sglang/srt/sampling/penaltylib/frequency_penalty.py,sha256=Loc3qjJTksNc5s-DV7QZHjgqoo5pxk7-nZzxwyhD2tQ,2144
944
987
  sglang/srt/sampling/penaltylib/min_new_tokens.py,sha256=rdU_D7RoIcrQPhysNQEzmr4TO2OoEi___p-i3QdwkgU,3331
945
988
  sglang/srt/sampling/penaltylib/orchestrator.py,sha256=Romk41ahToaVlNMnnd1Enko7_kRA4KdMGO94qnEbDHA,6061
946
989
  sglang/srt/sampling/penaltylib/presence_penalty.py,sha256=NRh10AJrrQlGJ6S-enGdRefrTrWpyqrSm-aNnyqQNQQ,2119
947
- sglang/srt/speculative/build_eagle_tree.py,sha256=O9LJNaBflgJdWT94D-rGH1gJFJ18nst2oOD8HnA2mZ4,12859
948
- sglang/srt/speculative/eagle_draft_cuda_graph_runner.py,sha256=7QpNIGrZE8GEqe_B1vuLhpWPCAV9jY0Kr67Imbirycs,14201
949
- sglang/srt/speculative/eagle_draft_extend_cuda_graph_runner.py,sha256=nqnlTLzqfz-zYJvIFALXzfgbCJdrtslIhfCnxEkvQ5I,15897
950
- sglang/srt/speculative/eagle_info.py,sha256=3JtRb60iCQzzi1JgreRhpGzC1aTs5Zbqv8XBDknnGHQ,29942
951
- sglang/srt/speculative/eagle_worker.py,sha256=bAvFoMs1Mc5YcwEQhfysuaKIPvZOLdb6QqUeqNSrrFA,46909
952
- sglang/srt/speculative/ngram_utils.py,sha256=U3a-c2bhNeIqZV4sKbzh3Hz_lAiqN1YFuFrbiaf0nsU,16600
953
- sglang/srt/speculative/ngram_worker.py,sha256=F4TDjVNiwzD-iQrqFArTybODtITdZLpFUYTtGdCPc2I,9727
954
- sglang/srt/speculative/spec_info.py,sha256=R3FK3ghFBUDSIUuNUYf41kFwEzP2fDBIlGdc45sRc4Y,2608
955
- sglang/srt/speculative/spec_utils.py,sha256=7l-jkBg-of_5NJJ1boH98GN4YyAbjxfs39gZzykfK_o,20072
956
- sglang/srt/speculative/standalone_worker.py,sha256=jcM_-7DMtRUMC9R0YeD6815kaWuftkFe8LIo7ThLVCc,4069
990
+ sglang/srt/speculative/base_spec_worker.py,sha256=M2hIHGmno1ew_gbgsU7rcIsNzR7pixDkN0UDJpZneEY,698
991
+ sglang/srt/speculative/draft_utils.py,sha256=E7u9u_-lrjOu82bBqmLB6zsbygRbWuLHO0Y1NwfbH4o,8261
992
+ sglang/srt/speculative/eagle_draft_cuda_graph_runner.py,sha256=LmqXLmMxLBuAFz8XiJpBQAsjpX77ZLrcDlv2hCXDRKs,14995
993
+ sglang/srt/speculative/eagle_draft_extend_cuda_graph_runner.py,sha256=AucQHsYM9hktPgmjtygPCxjMyQhFikJX_pc41APXR4M,16737
994
+ sglang/srt/speculative/eagle_info.py,sha256=ucS_hYCxoKlHA8pGtDN5mdk9i6z-NHYq4vAz1uLGcwk,31479
995
+ sglang/srt/speculative/eagle_info_v2.py,sha256=2PmbYzDrMkgNky0xeTIVaL04hDI15JaEqaE8pUlsu8c,16548
996
+ sglang/srt/speculative/eagle_utils.py,sha256=HA_h9dkO9RLOBXn4dFFQHY3yiSw4CwjuYewer5BchHI,4581
997
+ sglang/srt/speculative/eagle_worker.py,sha256=m40xi1IAWZQLX48D297BZy7ohlCWbptqkOszXmWC9JA,39344
998
+ sglang/srt/speculative/eagle_worker_v2.py,sha256=nzW7KQFBwU8F7F4CRlBGr7i_7_uCJzjcdMA5zCHqdB8,26315
999
+ sglang/srt/speculative/ngram_info.py,sha256=WEpR-I6dGbzKPvH915pPysONO5TodtyfrX0mN9LNBMU,16777
1000
+ sglang/srt/speculative/ngram_worker.py,sha256=t05lgkBATs-mo45eloiqvMalsJKdHI7fZ2BTYEpXoxg,9720
1001
+ sglang/srt/speculative/spec_info.py,sha256=1AkkpJwifuOtB1ZEjLctrzzjC46O1qtJIkoAdY2rmas,2669
1002
+ sglang/srt/speculative/spec_utils.py,sha256=hxm84b37ADwntrlpJ6JOxVGdZ22Ek4uBICnHUy82AxU,21345
1003
+ sglang/srt/speculative/standalone_worker.py,sha256=9PfG1-aXG3W4j43vLnSvBuaOqgqs-MsfWRH1e7nbkSg,3745
957
1004
  sglang/srt/speculative/cpp_ngram/ngram.cpp,sha256=j8D4xNaa8dv8CN9F5TG_yHxil-A79XiuMjyEE3ZUOSs,12962
958
1005
  sglang/srt/speculative/cpp_ngram/ngram.h,sha256=9OMOzO3KXEVbT5gEXjK-IRATI63in54LjeT_Xba5DSU,2492
959
1006
  sglang/srt/speculative/cpp_ngram/ngram_cache.py,sha256=Y22AM1CC0zOOarMWJzZQKz1-IMk3d4isSGkk-Uti74I,4383
960
1007
  sglang/srt/speculative/cpp_ngram/ngram_cache_binding.cpp,sha256=yrRXulpjivoSveCRL5ORfZ0hj2yXqjdVqc88APUJllg,1911
961
1008
  sglang/srt/speculative/cpp_ngram/param.h,sha256=tLSD_Ke1c2GjTY9tl3p1UgpbrBfaZqPRsHfw2YJ87hw,4375
962
1009
  sglang/srt/speculative/cpp_ngram/queue.h,sha256=m8OK4Nd6_yWnJkWxx-JRqUIOfzQwi3apy_3TvyxSY4Q,1288
963
- sglang/srt/tokenizer/tiktoken_tokenizer.py,sha256=KJwr6Xlc7AdHegMTnAVKJlPpW59Z7AE27GTzFL78GwI,6222
1010
+ sglang/srt/tokenizer/tiktoken_tokenizer.py,sha256=xIi7o38MB-pWPLC6sTdmGC9NN_kgRDvMStIo0nJZulw,6246
964
1011
  sglang/srt/tracing/trace.py,sha256=5SKy8XA4KLaTcBO6ZJvJSP_IYK5--2RJN0Q6O6Vg10g,16110
965
- sglang/srt/utils/__init__.py,sha256=M47TWjBX488QHsDCOTKHv-979SGOsnSu1wIWEqUaXnI,86
966
- sglang/srt/utils/common.py,sha256=gbj2-BL4ffLEkdQBqBs93NYU8QWwA3UN8qOEVZua2w0,108529
967
- sglang/srt/utils/hf_transformers_utils.py,sha256=7nUwqdrlkJMbi4aB5Ebvcf5NDVkLTzX4VVTNZav9Nps,17263
1012
+ sglang/srt/utils/__init__.py,sha256=zuoHoZnKrciwFy11a6p5Ua8mYU67QUI_09L0SfEjpeo,102
1013
+ sglang/srt/utils/aio_rwlock.py,sha256=6LYtOdeTUY3hkfa1dmYkgsaF2ttrwIF3hUWz2AZ2fqw,2970
1014
+ sglang/srt/utils/bench_utils.py,sha256=0xXUeDk61RynxbOV0P_okb-5rLPpc-ZqfCGx3W35K4I,4421
1015
+ sglang/srt/utils/common.py,sha256=uSu4JABt4oSwJiLFSaqLgkMkw8QDXn5ydrkslOUXb48,113357
1016
+ sglang/srt/utils/hf_transformers_utils.py,sha256=x5HyF75geb7vskOU9FaHarxK_u2MprUZm1SrmgMQX0E,17696
1017
+ sglang/srt/utils/host_shared_memory.py,sha256=0tO3qMlbmEIs11XvdI7BB0AtH4Z5hm9vWEkEyau4vlM,2264
1018
+ sglang/srt/utils/offloader.py,sha256=mKN1Vd0ftr2mjcVIXKCZnc51pcQ6bfYvhqFvdAUyRC4,18771
968
1019
  sglang/srt/utils/patch_torch.py,sha256=yaVs6YNm63rFYBw-v59usYR3cmb_qX6F69L5dMfQCxg,3307
969
1020
  sglang/srt/utils/poll_based_barrier.py,sha256=9vjn32ROlSueEk7EuZjWKUrrL7XVR9KJsSVliGTYB_4,937
1021
+ sglang/srt/utils/profile_merger.py,sha256=bvnz-yHMb7zHE1Bv09JKgCgYZY1n4h_UK7Wz2wNAmro,7202
970
1022
  sglang/srt/utils/rpd_utils.py,sha256=F8FWL_mT05xKQYLrzCJ8Q_5zfZJ86dHxX6LEqpwC7rw,20743
971
1023
  sglang/srt/utils/slow_rank_detector.py,sha256=81-KXp33wevk4jG2QuThsc17fLdmdeMouxwVfSXscic,2052
1024
+ sglang/srt/utils/torch_memory_saver_adapter.py,sha256=WFwPsOBvnWu6N2yTHmiOjLbDAYosslHwNSfyFHjz-7w,2511
972
1025
  sglang/srt/weight_sync/tensor_bucket.py,sha256=vp_LRrhULNnxiw9Tf56FcEckgUg07lifgv1lasG6y7o,3695
973
1026
  sglang/srt/weight_sync/utils.py,sha256=1FHM5kBav1GJUyYQLKHSJAh9MXwsuizDWxAVJMg1ZgE,4155
974
1027
  sglang/test/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
975
1028
  sglang/test/doc_patch.py,sha256=P9PYjBIVlZHvP9M34qS-8m1scmDP27ciNJNvZOdrUKE,1614
976
1029
  sglang/test/few_shot_gsm8k.py,sha256=zalplyHOYCnIwAnSQg-xlZl-Q-wGuMfjLdl9EJnUN7U,4333
977
- sglang/test/few_shot_gsm8k_engine.py,sha256=h88s3HzEStA1zjQkR-AgIEOQMwJMSnPHkX_wGBWXUYw,3907
1030
+ sglang/test/few_shot_gsm8k_engine.py,sha256=Vgs0SBguumrdlGOY1Hjjc8nTIdv5mxiTAmR4Isa4g4I,3793
978
1031
  sglang/test/get_logits_ut.py,sha256=XotfHBDbQDRuSrJLRErsrdIOA0WDflnrK9171E-2iWE,1822
979
- sglang/test/run_eval.py,sha256=1WaGfgsxCQWrvaIWS-m4lWjfTW-Y7IcASKvTG0Q-9gM,6420
980
- sglang/test/runners.py,sha256=Tn__rDchJRP7pAorTS6gAAtqdPIeexpoEvwOwohTsB8,34105
981
- sglang/test/send_one.py,sha256=XNZdfZs21tXDBwrDj2pq46WQd5smiKoYETY8U09c1Z8,5079
982
- sglang/test/simple_eval_common.py,sha256=Fm9PYFk6bYCb8RyMWr-ODfoNMUIftahTTOCBh84qiM0,12888
983
- sglang/test/simple_eval_gpqa.py,sha256=M6hpPs8l2Z4wUiyE7rCU1zyKoImXB4Z395Hgz43uvvQ,3293
984
- sglang/test/simple_eval_humaneval.py,sha256=s8YuKIBkNUEOBP4XKsTMRdXGv5aRhl0oJyl-89lGk1w,5687
1032
+ sglang/test/kit_matched_stop.py,sha256=60YESivdEqn6XXUa9oLu1UeLozp4ahteEEvWyOUVDx8,5382
1033
+ sglang/test/run_eval.py,sha256=88EUq7X9L1jN83IO9kijEoBXq9CS0DHgKaiX4QtgmUk,7829
1034
+ sglang/test/runners.py,sha256=dz4ZlbsF7BePTrS84BmlVt8LnxkoZhkyCPdjGg1hd04,34203
1035
+ sglang/test/send_one.py,sha256=sxdAVh6nxq8IgPf1behPiWF7ZVugwoOE4DjdJyY6qzo,6392
1036
+ sglang/test/simple_eval_common.py,sha256=06wMMTLf8kpbySBtImD9xdjmYCPuJSghhKcJ_D_KdB4,12976
1037
+ sglang/test/simple_eval_gpqa.py,sha256=Ui416_9Fh8TYU_51bClhEXi6wVCLEhLG28a7qPJfJYQ,3276
1038
+ sglang/test/simple_eval_humaneval.py,sha256=AhB-0dimur6_vSH9qHVyCRag_VZ8Jf3gH6PdmTkPHAU,5658
1039
+ sglang/test/simple_eval_longbench_v2.py,sha256=LLa3qAmF8PF1HGC-ubNcaB4jaz22NhZBY67rIzTH5Dk,12169
985
1040
  sglang/test/simple_eval_math.py,sha256=6kGKNwNbLN-Af3Wj8WTimWhH-Xp3enDmSvvSjsgWUpk,2550
986
1041
  sglang/test/simple_eval_mgsm.py,sha256=rd7TSUyxdKbrXaVoewo24V8lCo_6kO8zxPhhmvylpw8,10259
987
1042
  sglang/test/simple_eval_mmlu.py,sha256=FkwamjGMjueTixymkedF-YiPloSLiy4ftILFUrKZ9XI,4357
988
1043
  sglang/test/simple_eval_mmmu_vlm.py,sha256=XpADoB825LUX-n4hDFOR3wkuowdLPB6sMHJEvM2dah8,15195
989
1044
  sglang/test/test_activation.py,sha256=bDBFl4Y30siXj7Ifl66fc2HytOrcZdHFiP2i9K8TIsY,3140
990
- sglang/test/test_block_fp8.py,sha256=CNQE3CildtLO49ZegwhWBIN3QyvA0qI6p25xQeuUrWE,21824
991
- sglang/test/test_block_fp8_deep_gemm_blackwell.py,sha256=Hnhq4kkyINHb4ONedkp5Kf7Xx0MjOoOBYL8J7ETvOVA,8180
992
- sglang/test/test_block_fp8_ep.py,sha256=n4X6ZKwuUUbV5Ofjg64ptlaFGI1LbRXDfFiJW1ELHgY,10546
1045
+ sglang/test/test_block_fp8.py,sha256=z7cVJLy9jfD-xer3lALeBWkzRxhseqSboBAw75LZGgE,21828
1046
+ sglang/test/test_block_fp8_deep_gemm_blackwell.py,sha256=G6Yw6npnUO8OSuu4L2fOl-vP3mYCI7Mcrst6hc96t4s,8170
993
1047
  sglang/test/test_custom_ops.py,sha256=PenQ8zM1wj5xwiVEPVzD37pO-x90aOfFMpCRZenaKsY,5709
994
- sglang/test/test_cutlass_moe.py,sha256=WHCruIMzxzRzxQEeFEUtk0e0IefjiO0Kjfgnx42r0UI,10069
995
- sglang/test/test_cutlass_w4a8_moe.py,sha256=Ku9VCXEMJ3BwXtvb1A3FzY-zek-S-A4thWyX6m-1v-A,9219
1048
+ sglang/test/test_cutlass_moe.py,sha256=0kzalShZCSSbV1JLKv77mx8bXgK2wvskTuPGqK_qNnQ,10051
1049
+ sglang/test/test_cutlass_w4a8_moe.py,sha256=iQIZ1K43emzqI9WVKlb2fplLPcvlpm3D7qCNK-wJfa4,8924
996
1050
  sglang/test/test_deepep_utils.py,sha256=749ysTBGNzh6rYUCJhhZBtZpeD15eWTeNHYCytcvZtc,7448
997
- sglang/test/test_deterministic.py,sha256=3TW6QogzSrvARizRRwELesKy-_NM3NfQkLEGoAvpadI,10120
998
- sglang/test/test_disaggregation_utils.py,sha256=9LB6vCKr55iHhFN5saOwlKealG4ME20O3LTBbCCPbGI,2573
1051
+ sglang/test/test_deterministic.py,sha256=ISh_2dnEgRI1Ku7lxmDKs7mwNgLrBEhKnLnvW9Uei98,15689
1052
+ sglang/test/test_deterministic_utils.py,sha256=vVtwq_NjH9GzSkRUn4mep-IIvgAXtw-5l6iKjYDP8SA,2133
1053
+ sglang/test/test_disaggregation_utils.py,sha256=k_V_vw6qCEw3iZyUeujozMBkUgGRfCWxkLyCb9ktIbk,5588
999
1054
  sglang/test/test_dynamic_grad_mode.py,sha256=L76yUCuk_ymNpXD2CmO8r2GiGjIvD_gtTsuFDs2NolI,1638
1000
1055
  sglang/test/test_fp4_moe.py,sha256=wvHbGMH1UBr_XVWYgX57Y2bLy9h2DPQH10_Hmf2q6iw,22436
1001
1056
  sglang/test/test_layernorm.py,sha256=2GMWqqNDuGvSMSsEBF5eDCzwVSYA9E6hGhRo6s4ecKg,3764
1002
- sglang/test/test_marlin_moe.py,sha256=TOuYlVMx2Lv_IN3AMWsg5aGaxQF472E1B9ev_vvfU2Q,7971
1057
+ sglang/test/test_marlin_moe.py,sha256=d3LsMn9qT-r-DzHKhHikRTzSPSDWDtBNuIpz35AeM20,7958
1003
1058
  sglang/test/test_marlin_utils.py,sha256=kC7IzN364mJT9xw0nKUP1V1OK1hkw6fQTBvD4nRaOz4,5151
1004
1059
  sglang/test/test_programs.py,sha256=R-pzgNB-h_jjdJiW50hn83-nY7z5q5XcqPwugPnVF5Y,18916
1005
- sglang/test/test_utils.py,sha256=ED7Kktyg5tgaOv8UAFCg29XKMz0MLd7Zgl8ctQFwHOQ,54542
1060
+ sglang/test/test_utils.py,sha256=-i5Jh91gO7fDkr6PM1Lb7s7tyUqcI5v_qdhCKyDbgNg,56381
1006
1061
  sglang/test/attention/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
1007
- sglang/test/attention/test_flashattn_backend.py,sha256=_rTG849FwQdVTyGKkqhczaOqngBmRWXFmkl5NnuK1GM,13914
1008
- sglang/test/attention/test_flashattn_mla_backend.py,sha256=g4O50WblTpM7_Gq2b76k0i25_z01BOUBQ4i6PmyxpO4,10774
1009
- sglang/test/attention/test_prefix_chunk_info.py,sha256=hpoDe2wfSa6RlUbfyri_c0iyBTb35UXGL9I2Xh6jamM,7772
1010
- sglang/test/attention/test_trtllm_mla_backend.py,sha256=wp2_LSTwQ_vIdNPUCbEz7PA4doDU8sTWs6s6XVI0YnI,48874
1011
- sglang-0.5.3rc2.dist-info/licenses/LICENSE,sha256=FJXh51fvTQklojUFY89XVLsjxRcBqOxPs8XNy-2uZ0c,11346
1012
- sglang-0.5.3rc2.dist-info/METADATA,sha256=9jumtyFrtne6z3uEpBy23xFvdJ59YgHVrXclky7_43k,24609
1013
- sglang-0.5.3rc2.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
1014
- sglang-0.5.3rc2.dist-info/top_level.txt,sha256=yxhh3pYQkcnA7v3Bg889C2jZhvtJdEincysO7PEB09M,7
1015
- sglang-0.5.3rc2.dist-info/RECORD,,
1062
+ sglang/test/attention/test_flashattn_backend.py,sha256=Uh895KymXiRFH1pJ1NR9eSfoi6UI41YdPc4viLdUTBA,13904
1063
+ sglang/test/attention/test_flashattn_mla_backend.py,sha256=XW12ALYv2Ncs4t-Bz6omhYzNUQGe_P10K0gyqp9Y37U,10690
1064
+ sglang/test/attention/test_prefix_chunk_info.py,sha256=er0i3KGHMkw-4UZB1GCFd4oYwRcXfU5wpO1ORqpNGGA,7626
1065
+ sglang/test/attention/test_trtllm_mla_backend.py,sha256=UbtvkzTAqP-kHHEhhtPxVpuzG9QmyWBrFuJa0S7Z52g,54951
1066
+ sglang/test/longbench_v2/__init__.py,sha256=ZcOIPSyqbDI_tzB-qltXF67-4uMMPwCkkiWDVcDBDvQ,63
1067
+ sglang/test/longbench_v2/test_longbench_v2_eval.py,sha256=NI_Om4ODw5utUNsYjrj6nueebI4U5u4N2PKBtT5O27k,7352
1068
+ sglang/test/longbench_v2/validate_longbench_v2.py,sha256=mJa5Lh8XiSTXKrf5qopKuAfspSVbhoacnCkz6u4lYFQ,11635
1069
+ sglang/test/longbench_v2/validate_longbench_v2_standalone.py,sha256=gr0zif2c680hSyIHDVJ_NHYcrMquM3fpJ26mBtbm7zs,10909
1070
+ sglang-0.5.4.dist-info/licenses/LICENSE,sha256=FJXh51fvTQklojUFY89XVLsjxRcBqOxPs8XNy-2uZ0c,11346
1071
+ sglang-0.5.4.dist-info/METADATA,sha256=M8BtBa6y1fGn0YOx6BJttNdVgtLNOPMbLM3t58ZNCy0,25668
1072
+ sglang-0.5.4.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
1073
+ sglang-0.5.4.dist-info/top_level.txt,sha256=yxhh3pYQkcnA7v3Bg889C2jZhvtJdEincysO7PEB09M,7
1074
+ sglang-0.5.4.dist-info/RECORD,,