sglang 0.4.4__py3-none-any.whl → 0.4.4.post1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- sglang/srt/function_call_parser.py +33 -2
- sglang/srt/layers/dp_attention.py +30 -2
- sglang/srt/layers/elementwise.py +411 -0
- sglang/srt/layers/logits_processor.py +1 -0
- sglang/srt/layers/moe/router.py +342 -0
- sglang/srt/managers/cache_controller.py +2 -0
- sglang/srt/managers/data_parallel_controller.py +1 -1
- sglang/srt/managers/schedule_batch.py +1 -1
- sglang/srt/managers/scheduler.py +52 -18
- sglang/srt/managers/scheduler_output_processor_mixin.py +4 -1
- sglang/srt/mem_cache/hiradix_cache.py +9 -1
- sglang/srt/mem_cache/memory_pool.py +4 -1
- sglang/srt/model_executor/cuda_graph_runner.py +59 -16
- sglang/srt/model_executor/forward_batch_info.py +13 -4
- sglang/srt/models/deepseek_v2.py +180 -177
- sglang/srt/models/grok.py +374 -119
- sglang/srt/openai_api/adapter.py +22 -20
- sglang/srt/server_args.py +5 -5
- sglang/version.py +1 -1
- {sglang-0.4.4.dist-info → sglang-0.4.4.post1.dist-info}/METADATA +1 -1
- {sglang-0.4.4.dist-info → sglang-0.4.4.post1.dist-info}/RECORD +24 -22
- {sglang-0.4.4.dist-info → sglang-0.4.4.post1.dist-info}/LICENSE +0 -0
- {sglang-0.4.4.dist-info → sglang-0.4.4.post1.dist-info}/WHEEL +0 -0
- {sglang-0.4.4.dist-info → sglang-0.4.4.post1.dist-info}/top_level.txt +0 -0
sglang/srt/openai_api/adapter.py
CHANGED
@@ -1115,27 +1115,29 @@ def v1_chat_generate_response(
|
|
1115
1115
|
else:
|
1116
1116
|
reasoning_text = None
|
1117
1117
|
|
1118
|
-
if tool_choice != "none" and
|
1119
|
-
|
1120
|
-
|
1121
|
-
|
1122
|
-
|
1123
|
-
|
1124
|
-
|
1125
|
-
|
1126
|
-
|
1127
|
-
|
1128
|
-
|
1129
|
-
|
1118
|
+
if tool_choice != "none" and tools:
|
1119
|
+
parser = FunctionCallParser(tools, tool_call_parser)
|
1120
|
+
if parser.has_tool_call(text):
|
1121
|
+
if finish_reason["type"] == "stop":
|
1122
|
+
finish_reason["type"] = "tool_calls"
|
1123
|
+
finish_reason["matched"] = None
|
1124
|
+
try:
|
1125
|
+
full_normal_text, call_info_list = parser.parse_non_stream(text)
|
1126
|
+
tool_calls = [
|
1127
|
+
ToolCall(
|
1128
|
+
id=str(call_info.tool_index),
|
1129
|
+
function=FunctionResponse(
|
1130
|
+
name=call_info.name, arguments=call_info.parameters
|
1131
|
+
),
|
1132
|
+
)
|
1133
|
+
for call_info in call_info_list
|
1134
|
+
]
|
1135
|
+
except Exception as e:
|
1136
|
+
logger.error(f"Exception: {e}")
|
1137
|
+
return create_error_response(
|
1138
|
+
HTTPStatus.BAD_REQUEST,
|
1139
|
+
"Failed to parse fc related info to json format!",
|
1130
1140
|
)
|
1131
|
-
for call_info in call_info_list
|
1132
|
-
]
|
1133
|
-
except Exception as e:
|
1134
|
-
logger.error(f"Exception: {e}")
|
1135
|
-
return create_error_response(
|
1136
|
-
HTTPStatus.BAD_REQUEST,
|
1137
|
-
"Failed to parse fc related info to json format!",
|
1138
|
-
)
|
1139
1141
|
|
1140
1142
|
if to_file:
|
1141
1143
|
# to make the choice data json serializable
|
sglang/srt/server_args.py
CHANGED
@@ -262,14 +262,14 @@ class ServerArgs:
|
|
262
262
|
|
263
263
|
# Data parallelism attention
|
264
264
|
if self.enable_dp_attention:
|
265
|
-
self.dp_size = self.tp_size
|
266
|
-
assert self.tp_size % self.dp_size == 0
|
267
|
-
self.chunked_prefill_size = self.chunked_prefill_size // 2
|
268
265
|
self.schedule_conservativeness = self.schedule_conservativeness * 0.3
|
266
|
+
assert (
|
267
|
+
self.dp_size > 1
|
268
|
+
), "Please set a dp-size > 1. You can use 1 < dp-size <= tp-size "
|
269
|
+
assert self.tp_size % self.dp_size == 0
|
270
|
+
self.chunked_prefill_size = self.chunked_prefill_size // self.dp_size
|
269
271
|
logger.warning(
|
270
272
|
f"DP attention is enabled. The chunked prefill size is adjusted to {self.chunked_prefill_size} to avoid MoE kernel issues. "
|
271
|
-
f"The schedule conservativeness is adjusted to {self.schedule_conservativeness}. "
|
272
|
-
"Data parallel size is adjusted to be the same as tensor parallel size. "
|
273
273
|
)
|
274
274
|
|
275
275
|
# Speculative Decoding
|
sglang/version.py
CHANGED
@@ -1 +1 @@
|
|
1
|
-
__version__ = "0.4.4"
|
1
|
+
__version__ = "0.4.4.post1"
|
@@ -9,7 +9,7 @@ sglang/global_config.py,sha256=xzLdk8W53fneFblNh8iIjGF9C3-7mnzR1-LleD9Btxg,1495
|
|
9
9
|
sglang/launch_server.py,sha256=mDXfwha8LHpWQJekcCosR98QhCQsbmilsBlI5jAIgg0,420
|
10
10
|
sglang/llama3_eval.py,sha256=gWSboDchIGybIce88bJlrCG0yiLZ513mw4gcutJlzGM,10017
|
11
11
|
sglang/utils.py,sha256=jMMRaAChfWgU_F2BMbDF9G896shiemdzCnWxFocy4QM,15195
|
12
|
-
sglang/version.py,sha256=
|
12
|
+
sglang/version.py,sha256=4ZEzfisb7CBE8mZJHsVVkqSmecAalLdtwfQHDTnpWTw,28
|
13
13
|
sglang/lang/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
14
14
|
sglang/lang/chat_template.py,sha256=VKI5RNydfo1-qz6HT-aYm6ecBsa1RjkTZLZLCiBb5Ig,18269
|
15
15
|
sglang/lang/choices.py,sha256=-W1DVw9N9ZliVpvmWrzIXG4cswAah8eMQrHWzkS3D8o,6234
|
@@ -28,13 +28,13 @@ sglang/srt/_custom_ops.py,sha256=0zKNhmLhtUNTBE_WwuzkG_Y_Kaufai84VGe4fJ8v6-o,497
|
|
28
28
|
sglang/srt/aio_rwlock.py,sha256=6LYtOdeTUY3hkfa1dmYkgsaF2ttrwIF3hUWz2AZ2fqw,2970
|
29
29
|
sglang/srt/conversation.py,sha256=qiOAs42rftnIgjPq5c8Ce0DSCMsaRlvFxyUTpUXR_4M,24664
|
30
30
|
sglang/srt/custom_op.py,sha256=vhdofFbWtpdtaA4NG4tkanWwEsfvBnjh6OPKOxmxXdU,3426
|
31
|
-
sglang/srt/function_call_parser.py,sha256
|
31
|
+
sglang/srt/function_call_parser.py,sha256=k_L4Ex4Lc5TUNWiCO6BcSJjlv2TQmvphyGZIxHfl0e0,20835
|
32
32
|
sglang/srt/hf_transformers_utils.py,sha256=FPoOvGdEy-lwrOOqHaQnb_tJCGmCW3CpKUjleY7Cwj4,8221
|
33
33
|
sglang/srt/mm_utils.py,sha256=1ScBunw_x4W8ebM_AcJ62-1T2mfT8NlMJqdAhkF1lb0,12367
|
34
34
|
sglang/srt/model_parallel.py,sha256=eLXZhvJ4wG6dh0FontNCIdVZvHYdWgaeY-5cu7TD9tE,6078
|
35
35
|
sglang/srt/reasoning_parser.py,sha256=45xsU9RCPfyG4_Zx4y3-JPyNgAtrqwKI4j5R2NT4g1s,5594
|
36
36
|
sglang/srt/server.py,sha256=PrQb9r6L9syWHKlggbbiQYsKtpwSmECqozRbf8qnoV8,874
|
37
|
-
sglang/srt/server_args.py,sha256=
|
37
|
+
sglang/srt/server_args.py,sha256=ZKYb3tL6m8pVNH-3m9yRRRMkz2mlLkRhV0acME7dn0Q,44864
|
38
38
|
sglang/srt/torch_memory_saver_adapter.py,sha256=--FgbrcvJxTcRe856plD9ktqgrHGPTE18eZCJlE50hY,1255
|
39
39
|
sglang/srt/utils.py,sha256=Nh85Igdbmi5nN09s2rFsnnAIUcijk5jljmktiYByZp8,50163
|
40
40
|
sglang/srt/warmup.py,sha256=FmJiYfjRr3X_eAe7ojQaPoN17LvHpjDmRWRnO-k86AQ,1469
|
@@ -68,10 +68,11 @@ sglang/srt/entrypoints/engine.py,sha256=xZmo4F6OuwjOV2CXQwmUAjpoj5tZTV7sJIEEXTFh
|
|
68
68
|
sglang/srt/entrypoints/http_server.py,sha256=lb5sFSBKYiI7NZeFPeFeypjQkhMm5hkYqIwo9AsFDZQ,24724
|
69
69
|
sglang/srt/entrypoints/verl_engine.py,sha256=ICo0F860JvoCy3aKTTLpEHqKcDX4WIN5V85q6873IxA,5798
|
70
70
|
sglang/srt/layers/activation.py,sha256=f097ndEIQ-lQ5JLa4HrcjqLLBeRcZbjYmj2gmVknnkA,5993
|
71
|
-
sglang/srt/layers/dp_attention.py,sha256=
|
71
|
+
sglang/srt/layers/dp_attention.py,sha256=gaWG5c6Np2OJls4ldZ5Ea2etpY3T-0uyru7IKBuEtVM,7199
|
72
|
+
sglang/srt/layers/elementwise.py,sha256=y2mQqjbF2FmFtNYBk5ecTyaj3ELoZyz-rWPY8rrxCtk,13765
|
72
73
|
sglang/srt/layers/layernorm.py,sha256=DI2Ih34bLh5Ex_yd8-X8L7kNRcYStpc9XpIS4zIoM_U,3860
|
73
74
|
sglang/srt/layers/linear.py,sha256=8HyDjnpUu1ZxdqVRt9jiuO4GvTr2JsO42jwgtl10Qjs,51063
|
74
|
-
sglang/srt/layers/logits_processor.py,sha256=
|
75
|
+
sglang/srt/layers/logits_processor.py,sha256=RHvuPECoMpdU4Fpv1UrQ3yVz9qHKfbYxLS6k6bNRh0s,23243
|
75
76
|
sglang/srt/layers/parameter.py,sha256=-jaiI-dIhiSPigwcQGydBiKEMSVg7XuMcg8Bzb8BHMo,15162
|
76
77
|
sglang/srt/layers/pooler.py,sha256=rj2lygvleBnyLCBZ8I11HGMgpfIDsT0l3PIkshJwdu4,1606
|
77
78
|
sglang/srt/layers/radix_attention.py,sha256=UDL0y4Zasay_Rk-_XmIU4kaGbaF26ONvEHX5EQzLrqI,2260
|
@@ -93,6 +94,7 @@ sglang/srt/layers/attention/triton_ops/extend_attention.py,sha256=SZezMpXMr2AEEI
|
|
93
94
|
sglang/srt/layers/attention/triton_ops/prefill_attention.py,sha256=Y66gZ37u0GKMPtI8n5MbO6uOxRuGEmKIG0IPbJTOqAM,6213
|
94
95
|
sglang/srt/layers/attention/triton_ops/rocm_mla_decode_rope.py,sha256=664WnAJ91EiCUZOcnVDfbTQf4uGJ4ZDZB1CbxpEUFZc,13866
|
95
96
|
sglang/srt/layers/moe/fused_moe_native.py,sha256=domK1jDc5-zJcdwDso-YgBp_O136VHifnvFVlfFvKsY,4325
|
97
|
+
sglang/srt/layers/moe/router.py,sha256=gvyK7hXlujfCZCmAIFc3oxfgjuAjzlpPe3mp1Blc6Y0,10419
|
96
98
|
sglang/srt/layers/moe/topk.py,sha256=MOwBNBwxxW__mgmpX08RIqrh77aXLEgr0F5b5iF7hRI,7512
|
97
99
|
sglang/srt/layers/moe/ep_moe/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
98
100
|
sglang/srt/layers/moe/ep_moe/kernels.py,sha256=hG7E29bbj8HeXEkAd6N0HzJZPn7cwVx1VJptzpRWOv0,15376
|
@@ -394,17 +396,17 @@ sglang/srt/lora/triton_ops/gate_up_lora_b.py,sha256=qve4oNZHYUFk9ckmT2BVuDNMEvrN
|
|
394
396
|
sglang/srt/lora/triton_ops/qkv_lora_b.py,sha256=BmIcTZMnlSnie9rnMl4KvLpc4Njsk7_IppbUqitf9Xw,5738
|
395
397
|
sglang/srt/lora/triton_ops/sgemm_lora_a.py,sha256=kv-AvJ_Bi3yWjGvFnSwXvP66iJvY9n9pEnJzJ9-DWzo,3982
|
396
398
|
sglang/srt/lora/triton_ops/sgemm_lora_b.py,sha256=Ai5vPriT4OgACwK7xrpGgf5L1oaN9x0jwNKMChu3uI0,4299
|
397
|
-
sglang/srt/managers/cache_controller.py,sha256=
|
399
|
+
sglang/srt/managers/cache_controller.py,sha256=XB6UHFXVw5LAyKV2jK0iVzhAYT4fSzJVCNL42eKGUsk,18175
|
398
400
|
sglang/srt/managers/configure_logging.py,sha256=fOJaXAQ1n9m-8KPJndpsKvS885i69SMafoEADLIVfIM,1633
|
399
|
-
sglang/srt/managers/data_parallel_controller.py,sha256=
|
401
|
+
sglang/srt/managers/data_parallel_controller.py,sha256=px1SrFUUDDroXaHN4m9LcMNqGDt2vv9COiVNg1O-BqI,9561
|
400
402
|
sglang/srt/managers/detokenizer_manager.py,sha256=HTfpJWMF1EImhKOnLJ96xPmYXm71xzaisLMfxg3zpgs,10111
|
401
403
|
sglang/srt/managers/image_processor.py,sha256=o2ChZW3mWSw1I_4HFE8SV1ZsYtWp9G9w7Ij73BvugN4,1711
|
402
404
|
sglang/srt/managers/io_struct.py,sha256=XvXM6WRarwEtaNQWlzZpYKy2Zi4wCG3xnz_ojskYJjM,22791
|
403
405
|
sglang/srt/managers/multi_modality_padding.py,sha256=dkFKknxML8R3KrAZhKXO-A69u3pUUI1pRfOVMJfqHYw,5165
|
404
|
-
sglang/srt/managers/schedule_batch.py,sha256=
|
406
|
+
sglang/srt/managers/schedule_batch.py,sha256=NzT2ivSSKRqtFRiAr-d2MO6spH0z-cf0jANw3JyGrr8,55983
|
405
407
|
sglang/srt/managers/schedule_policy.py,sha256=E1qVq2G3jptKdX9nlqfayeRBUll9xB6bK8nBf3EW32E,19469
|
406
|
-
sglang/srt/managers/scheduler.py,sha256=
|
407
|
-
sglang/srt/managers/scheduler_output_processor_mixin.py,sha256=
|
408
|
+
sglang/srt/managers/scheduler.py,sha256=bL1HiKey5ZgyqcYFur6pfEZLbBPcKLF-peAreiNnfK8,69433
|
409
|
+
sglang/srt/managers/scheduler_output_processor_mixin.py,sha256=u2sj6MViFTov0lVZSysZ-wph2pEqRCtCjwA1UdttZ7I,26338
|
408
410
|
sglang/srt/managers/session_controller.py,sha256=YOv8cFcuVmdCE4OfQJ6aA5AosHRwtZF9WdUUfUXEp0I,5753
|
409
411
|
sglang/srt/managers/tokenizer_manager.py,sha256=_xIn-3BDgagqnmRKFhIQTkCg2jXk6jp607B7CeprNVw,44686
|
410
412
|
sglang/srt/managers/tp_worker.py,sha256=o9MY1a8x81nI3W0m64YvOXcAA4sCBvPPmnNU67vBXGs,8710
|
@@ -419,14 +421,14 @@ sglang/srt/managers/image_processors/qwen_vl.py,sha256=wJbbCW1DKPQp_RufQ4fz7Nd_h
|
|
419
421
|
sglang/srt/mem_cache/base_prefix_cache.py,sha256=NY62Zo0A0tLJ7ObRLOQqQcXCxoJUDZsK8f5U4dNQjKc,973
|
420
422
|
sglang/srt/mem_cache/chunk_cache.py,sha256=it5SfL1FwMbrdeOH-I-Eu_i-I9hFB1xL-z_brIUoCkk,1835
|
421
423
|
sglang/srt/mem_cache/flush_cache.py,sha256=GYcxmNXh4hsMpFfNOuCTpKilW7guZwTtAg_usVeM3J0,979
|
422
|
-
sglang/srt/mem_cache/hiradix_cache.py,sha256=
|
423
|
-
sglang/srt/mem_cache/memory_pool.py,sha256=
|
424
|
+
sglang/srt/mem_cache/hiradix_cache.py,sha256=UTdIqGosuU3PjGj27hmLuf2exPd9Rkg8GShVqi85FUA,15548
|
425
|
+
sglang/srt/mem_cache/memory_pool.py,sha256=xZc9pXgCwQyfv7rkgh4uoXDi2qPwueqTuw48poSV4OQ,22816
|
424
426
|
sglang/srt/mem_cache/paged_allocator.py,sha256=DRq7qZXLVeHKkCWRlEkoAmLP5IC_1ReHa_xL7-8Orzs,8594
|
425
427
|
sglang/srt/mem_cache/radix_cache.py,sha256=bLldgkFZvmFOVgc2xLI87an3UBYxIsOlRBsxenFEL7s,14912
|
426
428
|
sglang/srt/metrics/collector.py,sha256=0X40ZZ18182sx2t0eqeqoK7gspH36L343zNvSkgBvd0,9293
|
427
429
|
sglang/srt/metrics/func_timer.py,sha256=VFyNRrbnKVCwnQsrlLin1lITJfjQpf9m8sGPqL5LIsQ,3438
|
428
|
-
sglang/srt/model_executor/cuda_graph_runner.py,sha256
|
429
|
-
sglang/srt/model_executor/forward_batch_info.py,sha256=
|
430
|
+
sglang/srt/model_executor/cuda_graph_runner.py,sha256=EllAbxzJy6ULgJyboVYmqG1IFYhNM6zLAAmpWARsIRo,22197
|
431
|
+
sglang/srt/model_executor/forward_batch_info.py,sha256=wtByWmk7u4YUH2ZergdjT1tyl5Jhc75S1cVvd_GTEQI,17404
|
430
432
|
sglang/srt/model_executor/model_runner.py,sha256=zE3nWMBLI0eW2mDZHBvxj1bHW3VsAxtd-RP6uddyP5A,41581
|
431
433
|
sglang/srt/model_loader/__init__.py,sha256=zGZkOBz1zx-pkaIy47BasL3fjDlAcxAXUTjInOhXHAE,919
|
432
434
|
sglang/srt/model_loader/loader.py,sha256=bHsb3T9CGac32NgDeRt03cJXBy-t1WsyYOWcYkeMVLA,46813
|
@@ -439,7 +441,7 @@ sglang/srt/models/dbrx.py,sha256=0Vf4yhqe8YeQuKR3P-agvYJScmHwH3-tFbyU8kv5QJM,155
|
|
439
441
|
sglang/srt/models/deepseek.py,sha256=Le2MXij8m4hT7QYgD0bFMFmYhbgX7SMjoXZFB8BxgyA,16871
|
440
442
|
sglang/srt/models/deepseek_janus_pro.py,sha256=sduOYeAQrb2DFfoeJVzxMNOAgS7_CmTqaKWc8J3Ypeg,72528
|
441
443
|
sglang/srt/models/deepseek_nextn.py,sha256=8uR4k1qCBKL1JAcE8cCJz3HowrIgCgdMtbqQ4Xq8Tr4,13161
|
442
|
-
sglang/srt/models/deepseek_v2.py,sha256=
|
444
|
+
sglang/srt/models/deepseek_v2.py,sha256=oEREP6cErJxBuQRooXY6tZ7oMwLvWLTjDYZPAfXVAS8,48651
|
443
445
|
sglang/srt/models/exaone.py,sha256=5iibqQTjpgosuGRt2rj2lWR0ShK2XGhbdFSnOWpaQss,13386
|
444
446
|
sglang/srt/models/gemma.py,sha256=3XxMDOKz4xMP6VzWoW8f0hmMf8LP8fhzMw5prsYC4e8,12602
|
445
447
|
sglang/srt/models/gemma2.py,sha256=MDe_HNkSpEJpw426tbx3fp271GBlSVEuhIdGeOB_jYA,16356
|
@@ -447,7 +449,7 @@ sglang/srt/models/gemma2_reward.py,sha256=V8U3_ADUHWPdOwvEe1jhGW-oJmBgL8t1TY3-67
|
|
447
449
|
sglang/srt/models/gpt2.py,sha256=dAnfmsAL7JVHakryqrERR1jgL8mI1Op6nPHYfDCF7Ao,9802
|
448
450
|
sglang/srt/models/gpt_bigcode.py,sha256=EAN6xAXpa8m3DcBuH1D4rTPji2oG9NSozGXSNHtE2lw,10268
|
449
451
|
sglang/srt/models/granite.py,sha256=nu_Zl_PYn188gk1uYVZ76y4wwHZV7G0w7uanhqpSFUs,20813
|
450
|
-
sglang/srt/models/grok.py,sha256=
|
452
|
+
sglang/srt/models/grok.py,sha256=pQOXtpHOYVntwt5QQRLffYsnMHmMfPMmGyKMfR0k0Ic,27994
|
451
453
|
sglang/srt/models/internlm2.py,sha256=4eh9WVgK4yg13IsnH5qB2xUCWnixj_aLLz7qa_4m2_Q,13017
|
452
454
|
sglang/srt/models/internlm2_reward.py,sha256=ndfGmyqYZbVZ7C7rJ-v9oK3wa-EpoBGybS8MlyKZi2E,2522
|
453
455
|
sglang/srt/models/llama.py,sha256=FEtMrzjrbQLOOQvrqGFwslizjHPaU--9rEiXlr7MIiI,22958
|
@@ -481,7 +483,7 @@ sglang/srt/models/torch_native_llama.py,sha256=5tfFSMAXB3ScToqTALtCXa8Oo-qPCJh-K
|
|
481
483
|
sglang/srt/models/xverse.py,sha256=I7ivNsk6NRqPxlMUmdclpzDCvhAnWbv_GOj01MKHJrQ,13996
|
482
484
|
sglang/srt/models/xverse_moe.py,sha256=xLwn5pRwQrvj7zMmwl3o49m7xILb2ACRdWvm9hY8LDc,16743
|
483
485
|
sglang/srt/models/yivl.py,sha256=oToK7-u5IGO7xwpJIQ7VtudlK6-zPqJX4bt6_wv0SH8,4850
|
484
|
-
sglang/srt/openai_api/adapter.py,sha256=
|
486
|
+
sglang/srt/openai_api/adapter.py,sha256=GAAo_Vuf9aiKgUH0NPanDTB_eC1WqRRNnltVvAFeW4s,67412
|
485
487
|
sglang/srt/openai_api/protocol.py,sha256=6-vwYewe7JfmMMC56oRU13aRmmKUerZs50GPmiGeX7w,12490
|
486
488
|
sglang/srt/sampling/custom_logit_processor.py,sha256=tDvoLgLqn-sy1qcY6vSrpbnHCeqbdk0uhMOO-uy4p4E,1099
|
487
489
|
sglang/srt/sampling/sampling_batch_info.py,sha256=T4UJ_CRB6A0HnRwEsqmxy1CJQMwZaVdxbdlCeTK4BUI,11992
|
@@ -514,8 +516,8 @@ sglang/test/test_custom_ops.py,sha256=XBTWh3jEsoe9hZ93p3LAUtjEj5l0qNEaZM5Mto6pbJ
|
|
514
516
|
sglang/test/test_layernorm.py,sha256=IacByD5d-stXjzBz8Ypamc7povlcedpKPbb_4JLgo3c,3720
|
515
517
|
sglang/test/test_programs.py,sha256=VZ3vXtUDBnXz0M7gFdDH8hXg9Wa0j_qI8CVqjEgRN_E,18877
|
516
518
|
sglang/test/test_utils.py,sha256=UBBk-F4A5hEtmRdu7vEttlnSmPVPJLQgtNZxMn1Tdo4,29188
|
517
|
-
sglang-0.4.4.dist-info/LICENSE,sha256=FJXh51fvTQklojUFY89XVLsjxRcBqOxPs8XNy-2uZ0c,11346
|
518
|
-
sglang-0.4.4.dist-info/METADATA,sha256=
|
519
|
-
sglang-0.4.4.dist-info/WHEEL,sha256=52BFRY2Up02UkjOa29eZOS2VxUrpPORXg1pkohGGUS8,91
|
520
|
-
sglang-0.4.4.dist-info/top_level.txt,sha256=yxhh3pYQkcnA7v3Bg889C2jZhvtJdEincysO7PEB09M,7
|
521
|
-
sglang-0.4.4.dist-info/RECORD,,
|
519
|
+
sglang-0.4.4.post1.dist-info/LICENSE,sha256=FJXh51fvTQklojUFY89XVLsjxRcBqOxPs8XNy-2uZ0c,11346
|
520
|
+
sglang-0.4.4.post1.dist-info/METADATA,sha256=P0EmlGnVHDnvAojlrFQw_2CrPN2qERG6VIUoR6kG4vo,24311
|
521
|
+
sglang-0.4.4.post1.dist-info/WHEEL,sha256=52BFRY2Up02UkjOa29eZOS2VxUrpPORXg1pkohGGUS8,91
|
522
|
+
sglang-0.4.4.post1.dist-info/top_level.txt,sha256=yxhh3pYQkcnA7v3Bg889C2jZhvtJdEincysO7PEB09M,7
|
523
|
+
sglang-0.4.4.post1.dist-info/RECORD,,
|
File without changes
|
File without changes
|
File without changes
|