sglang 0.4.9.post4__py3-none-any.whl → 0.4.9.post5__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- sglang/lang/chat_template.py +21 -0
- sglang/srt/configs/internvl.py +3 -0
- sglang/srt/configs/model_config.py +4 -0
- sglang/srt/constrained/base_grammar_backend.py +10 -2
- sglang/srt/constrained/xgrammar_backend.py +7 -5
- sglang/srt/conversation.py +16 -1
- sglang/srt/debug_utils/__init__.py +0 -0
- sglang/srt/debug_utils/dump_comparator.py +131 -0
- sglang/srt/debug_utils/dumper.py +108 -0
- sglang/srt/debug_utils/text_comparator.py +172 -0
- sglang/srt/disaggregation/decode_schedule_batch_mixin.py +13 -1
- sglang/srt/disaggregation/mooncake/conn.py +16 -0
- sglang/srt/disaggregation/prefill.py +13 -1
- sglang/srt/entrypoints/engine.py +4 -2
- sglang/srt/entrypoints/openai/serving_chat.py +132 -79
- sglang/srt/function_call/ebnf_composer.py +10 -3
- sglang/srt/function_call/function_call_parser.py +2 -0
- sglang/srt/function_call/glm4_moe_detector.py +164 -0
- sglang/srt/function_call/qwen3_coder_detector.py +1 -0
- sglang/srt/layers/attention/hybrid_attn_backend.py +100 -0
- sglang/srt/layers/attention/vision.py +56 -8
- sglang/srt/layers/layernorm.py +26 -1
- sglang/srt/layers/logits_processor.py +14 -3
- sglang/srt/layers/moe/ep_moe/layer.py +172 -206
- sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_2_0/E=160,N=320,device_name=NVIDIA_A800-SXM4-80GB,dtype=int8_w8a8.json +146 -0
- sglang/srt/layers/moe/fused_moe_triton/layer.py +38 -48
- sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py +11 -8
- sglang/srt/layers/moe/topk.py +84 -22
- sglang/srt/layers/multimodal.py +11 -8
- sglang/srt/layers/quantization/fp8.py +25 -247
- sglang/srt/layers/quantization/fp8_kernel.py +78 -48
- sglang/srt/layers/quantization/modelopt_quant.py +25 -10
- sglang/srt/layers/quantization/unquant.py +24 -76
- sglang/srt/layers/quantization/w4afp8.py +68 -17
- sglang/srt/lora/lora_registry.py +93 -29
- sglang/srt/managers/cache_controller.py +9 -7
- sglang/srt/managers/mm_utils.py +154 -35
- sglang/srt/managers/multimodal_processor.py +3 -14
- sglang/srt/managers/schedule_batch.py +14 -8
- sglang/srt/managers/scheduler.py +35 -1
- sglang/srt/managers/tokenizer_manager.py +37 -6
- sglang/srt/managers/tp_worker.py +3 -0
- sglang/srt/mem_cache/hiradix_cache.py +5 -2
- sglang/srt/model_executor/model_runner.py +68 -14
- sglang/srt/models/deepseek_v2.py +62 -28
- sglang/srt/models/glm4_moe.py +1035 -0
- sglang/srt/models/glm4_moe_nextn.py +167 -0
- sglang/srt/models/interns1.py +328 -0
- sglang/srt/models/internvl.py +143 -47
- sglang/srt/models/llava.py +9 -5
- sglang/srt/models/minicpmo.py +4 -1
- sglang/srt/models/qwen2_moe.py +2 -2
- sglang/srt/models/qwen3_moe.py +5 -2
- sglang/srt/multimodal/processors/base_processor.py +20 -6
- sglang/srt/multimodal/processors/clip.py +2 -2
- sglang/srt/multimodal/processors/deepseek_vl_v2.py +2 -2
- sglang/srt/multimodal/processors/gemma3.py +2 -2
- sglang/srt/multimodal/processors/gemma3n.py +2 -2
- sglang/srt/multimodal/processors/internvl.py +21 -8
- sglang/srt/multimodal/processors/janus_pro.py +2 -2
- sglang/srt/multimodal/processors/kimi_vl.py +2 -2
- sglang/srt/multimodal/processors/llava.py +4 -4
- sglang/srt/multimodal/processors/minicpm.py +2 -3
- sglang/srt/multimodal/processors/mlama.py +2 -2
- sglang/srt/multimodal/processors/mllama4.py +18 -111
- sglang/srt/multimodal/processors/phi4mm.py +2 -2
- sglang/srt/multimodal/processors/pixtral.py +2 -2
- sglang/srt/multimodal/processors/qwen_audio.py +2 -2
- sglang/srt/multimodal/processors/qwen_vl.py +2 -2
- sglang/srt/multimodal/processors/vila.py +3 -1
- sglang/srt/reasoning_parser.py +2 -1
- sglang/srt/server_args.py +57 -6
- sglang/srt/utils.py +96 -1
- sglang/srt/weight_sync/utils.py +119 -0
- sglang/test/runners.py +4 -0
- sglang/test/test_utils.py +65 -5
- sglang/utils.py +19 -0
- sglang/version.py +1 -1
- {sglang-0.4.9.post4.dist-info → sglang-0.4.9.post5.dist-info}/METADATA +4 -4
- {sglang-0.4.9.post4.dist-info → sglang-0.4.9.post5.dist-info}/RECORD +83 -73
- sglang/srt/debug_utils.py +0 -74
- {sglang-0.4.9.post4.dist-info → sglang-0.4.9.post5.dist-info}/WHEEL +0 -0
- {sglang-0.4.9.post4.dist-info → sglang-0.4.9.post5.dist-info}/licenses/LICENSE +0 -0
- {sglang-0.4.9.post4.dist-info → sglang-0.4.9.post5.dist-info}/top_level.txt +0 -0
sglang/test/test_utils.py
CHANGED
@@ -1,6 +1,7 @@
|
|
1
1
|
"""Common utilities for testing and benchmarking"""
|
2
2
|
|
3
3
|
import argparse
|
4
|
+
import asyncio
|
4
5
|
import copy
|
5
6
|
import json
|
6
7
|
import logging
|
@@ -14,8 +15,9 @@ import unittest
|
|
14
15
|
from concurrent.futures import ThreadPoolExecutor
|
15
16
|
from dataclasses import dataclass
|
16
17
|
from functools import partial
|
18
|
+
from pathlib import Path
|
17
19
|
from types import SimpleNamespace
|
18
|
-
from typing import Callable, List, Optional, Tuple
|
20
|
+
from typing import Awaitable, Callable, List, Optional, Tuple
|
19
21
|
|
20
22
|
import numpy as np
|
21
23
|
import requests
|
@@ -26,6 +28,7 @@ from sglang.bench_serving import run_benchmark
|
|
26
28
|
from sglang.global_config import global_config
|
27
29
|
from sglang.lang.backend.openai import OpenAI
|
28
30
|
from sglang.lang.backend.runtime_endpoint import RuntimeEndpoint
|
31
|
+
from sglang.lang.interpreter import ProgramState
|
29
32
|
from sglang.srt.utils import (
|
30
33
|
get_bool_env_var,
|
31
34
|
get_device,
|
@@ -347,6 +350,7 @@ def add_common_sglang_args_and_parse(parser: argparse.ArgumentParser):
|
|
347
350
|
help="Device type (auto/cuda/rocm/cpu). Auto will detect available platforms",
|
348
351
|
)
|
349
352
|
parser.add_argument("--result-file", type=str, default="result.jsonl")
|
353
|
+
parser.add_argument("--raw-result-file", type=str)
|
350
354
|
args = parser.parse_args()
|
351
355
|
|
352
356
|
return args
|
@@ -714,6 +718,7 @@ def get_benchmark_args(
|
|
714
718
|
seed: int = 0,
|
715
719
|
device="auto",
|
716
720
|
pd_separated: bool = False,
|
721
|
+
lora_name=None,
|
717
722
|
):
|
718
723
|
return SimpleNamespace(
|
719
724
|
backend="sglang",
|
@@ -741,7 +746,7 @@ def get_benchmark_args(
|
|
741
746
|
extra_request_body=None,
|
742
747
|
apply_chat_template=False,
|
743
748
|
profile=None,
|
744
|
-
lora_name=
|
749
|
+
lora_name=lora_name,
|
745
750
|
prompt_suffix="",
|
746
751
|
device=device,
|
747
752
|
pd_separated=pd_separated,
|
@@ -764,6 +769,8 @@ def run_bench_serving(
|
|
764
769
|
need_warmup=False,
|
765
770
|
seed: int = 0,
|
766
771
|
device="auto",
|
772
|
+
background_task: Optional[Callable[[str, asyncio.Event], Awaitable[None]]] = None,
|
773
|
+
lora_name: Optional[str] = None,
|
767
774
|
):
|
768
775
|
if device == "auto":
|
769
776
|
device = auto_config_device()
|
@@ -791,14 +798,35 @@ def run_bench_serving(
|
|
791
798
|
disable_ignore_eos=disable_ignore_eos,
|
792
799
|
seed=seed,
|
793
800
|
device=device,
|
801
|
+
lora_name=lora_name,
|
794
802
|
)
|
795
803
|
|
796
|
-
|
804
|
+
async def _run():
|
797
805
|
if need_warmup:
|
798
806
|
warmup_args = copy.deepcopy(args)
|
799
807
|
warmup_args.num_prompts = 16
|
800
|
-
run_benchmark
|
801
|
-
|
808
|
+
await asyncio.to_thread(run_benchmark, warmup_args)
|
809
|
+
|
810
|
+
start_event = asyncio.Event()
|
811
|
+
stop_event = asyncio.Event()
|
812
|
+
task_handle = (
|
813
|
+
asyncio.create_task(background_task(base_url, start_event, stop_event))
|
814
|
+
if background_task
|
815
|
+
else None
|
816
|
+
)
|
817
|
+
|
818
|
+
try:
|
819
|
+
start_event.set()
|
820
|
+
result = await asyncio.to_thread(run_benchmark, args)
|
821
|
+
finally:
|
822
|
+
if task_handle:
|
823
|
+
stop_event.set()
|
824
|
+
await task_handle
|
825
|
+
|
826
|
+
return result
|
827
|
+
|
828
|
+
try:
|
829
|
+
res = asyncio.run(_run())
|
802
830
|
finally:
|
803
831
|
kill_process_tree(process.pid)
|
804
832
|
|
@@ -1284,3 +1312,35 @@ class CustomTestCase(unittest.TestCase):
|
|
1284
1312
|
lambda: super(CustomTestCase, self)._callTestMethod(method),
|
1285
1313
|
max_retry=max_retry,
|
1286
1314
|
)
|
1315
|
+
|
1316
|
+
|
1317
|
+
def dump_bench_raw_result(
|
1318
|
+
path: str,
|
1319
|
+
states,
|
1320
|
+
preds,
|
1321
|
+
labels,
|
1322
|
+
):
|
1323
|
+
if not path:
|
1324
|
+
return
|
1325
|
+
|
1326
|
+
rows = []
|
1327
|
+
for i in range(len(states)):
|
1328
|
+
state = states[i]
|
1329
|
+
output = state["answer"]
|
1330
|
+
prompt = _ensure_remove_suffix(state.text(), output)
|
1331
|
+
rows.append(
|
1332
|
+
dict(
|
1333
|
+
prompt_id=i,
|
1334
|
+
prompt=prompt,
|
1335
|
+
output=output,
|
1336
|
+
correct=bool(preds[i] == labels[i]),
|
1337
|
+
)
|
1338
|
+
)
|
1339
|
+
|
1340
|
+
print(f"BenchRawResultDumper save results to {path}")
|
1341
|
+
Path(path).write_text("\n".join(json.dumps(row) for row in rows))
|
1342
|
+
|
1343
|
+
|
1344
|
+
def _ensure_remove_suffix(text: str, suffix: str):
|
1345
|
+
assert text.endswith(suffix)
|
1346
|
+
return text.removesuffix(suffix)
|
sglang/utils.py
CHANGED
@@ -14,6 +14,7 @@ import traceback
|
|
14
14
|
import urllib.request
|
15
15
|
import weakref
|
16
16
|
from concurrent.futures import ThreadPoolExecutor
|
17
|
+
from functools import wraps
|
17
18
|
from io import BytesIO
|
18
19
|
from json import dumps
|
19
20
|
from typing import Any, Callable, List, Optional, Tuple, Type, Union
|
@@ -28,6 +29,24 @@ from tqdm import tqdm
|
|
28
29
|
logger = logging.getLogger(__name__)
|
29
30
|
|
30
31
|
|
32
|
+
def execute_once(func):
|
33
|
+
has_run = None
|
34
|
+
|
35
|
+
@wraps(func)
|
36
|
+
def wrapper(*args, **kwargs):
|
37
|
+
nonlocal has_run
|
38
|
+
if not has_run:
|
39
|
+
func(*args, **kwargs)
|
40
|
+
has_run = True
|
41
|
+
|
42
|
+
return wrapper
|
43
|
+
|
44
|
+
|
45
|
+
@execute_once
|
46
|
+
def info_once(message: str):
|
47
|
+
logger.info(message)
|
48
|
+
|
49
|
+
|
31
50
|
def convert_json_schema_to_str(json_schema: Union[dict, str, Type[BaseModel]]) -> str:
|
32
51
|
"""Convert a JSON schema to a string.
|
33
52
|
Parameters
|
sglang/version.py
CHANGED
@@ -1 +1 @@
|
|
1
|
-
__version__ = "0.4.9.post4"
|
1
|
+
__version__ = "0.4.9.post5"
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: sglang
|
3
|
-
Version: 0.4.9.post4
|
3
|
+
Version: 0.4.9.post5
|
4
4
|
Summary: SGLang is yet another fast serving framework for large language models and vision language models.
|
5
5
|
License: Apache License
|
6
6
|
Version 2.0, January 2004
|
@@ -246,7 +246,7 @@ Requires-Dist: sentencepiece; extra == "runtime-common"
|
|
246
246
|
Requires-Dist: soundfile==0.13.1; extra == "runtime-common"
|
247
247
|
Requires-Dist: scipy; extra == "runtime-common"
|
248
248
|
Requires-Dist: torchao==0.9.0; extra == "runtime-common"
|
249
|
-
Requires-Dist: transformers==4.
|
249
|
+
Requires-Dist: transformers==4.54.0; extra == "runtime-common"
|
250
250
|
Requires-Dist: timm==1.0.16; extra == "runtime-common"
|
251
251
|
Requires-Dist: uvicorn; extra == "runtime-common"
|
252
252
|
Requires-Dist: uvloop; extra == "runtime-common"
|
@@ -259,7 +259,7 @@ Requires-Dist: torchaudio==2.7.1; extra == "srt"
|
|
259
259
|
Requires-Dist: torchvision==0.22.1; extra == "srt"
|
260
260
|
Requires-Dist: cuda-python; extra == "srt"
|
261
261
|
Requires-Dist: einops; extra == "srt"
|
262
|
-
Requires-Dist: flashinfer_python==0.2.
|
262
|
+
Requires-Dist: flashinfer_python==0.2.9rc2; extra == "srt"
|
263
263
|
Provides-Extra: blackwell
|
264
264
|
Requires-Dist: sglang[runtime_common]; extra == "blackwell"
|
265
265
|
Requires-Dist: sgl-kernel; extra == "blackwell"
|
@@ -268,7 +268,7 @@ Requires-Dist: torchaudio==2.7.1; extra == "blackwell"
|
|
268
268
|
Requires-Dist: torchvision==0.22.1; extra == "blackwell"
|
269
269
|
Requires-Dist: cuda-python; extra == "blackwell"
|
270
270
|
Requires-Dist: einops; extra == "blackwell"
|
271
|
-
Requires-Dist: flashinfer_python==0.2.
|
271
|
+
Requires-Dist: flashinfer_python==0.2.9rc2; extra == "blackwell"
|
272
272
|
Provides-Extra: srt-hip
|
273
273
|
Requires-Dist: sglang[runtime_common]; extra == "srt-hip"
|
274
274
|
Requires-Dist: torch; extra == "srt-hip"
|
@@ -9,11 +9,11 @@ sglang/compile_deep_gemm.py,sha256=H118s76CKdpZr-cDeFfBCePe7--c_teEBNVIzchYVSo,6
|
|
9
9
|
sglang/global_config.py,sha256=xzLdk8W53fneFblNh8iIjGF9C3-7mnzR1-LleD9Btxg,1495
|
10
10
|
sglang/launch_server.py,sha256=mDXfwha8LHpWQJekcCosR98QhCQsbmilsBlI5jAIgg0,420
|
11
11
|
sglang/profiler.py,sha256=tEHzHerXC-ymk4OrkoUcMbgcGHmb8VESthsNSP2Yx9w,4417
|
12
|
-
sglang/utils.py,sha256=
|
13
|
-
sglang/version.py,sha256=
|
12
|
+
sglang/utils.py,sha256=DSMD5Ch-gmkIO6Dh4JAmBMtRAu4JZ7uYO0NUMprGVO4,16770
|
13
|
+
sglang/version.py,sha256=GBi71Z9Lv3isXS33OtWCtTjl5apAGantvWQRrye9bj0,28
|
14
14
|
sglang/eval/llama3_eval.py,sha256=gWSboDchIGybIce88bJlrCG0yiLZ513mw4gcutJlzGM,10017
|
15
15
|
sglang/eval/loogle_eval.py,sha256=-CC2s2kh5qUoDrHRkQVkC_jNvBgNojXbf456ny5s78s,4557
|
16
|
-
sglang/lang/chat_template.py,sha256=
|
16
|
+
sglang/lang/chat_template.py,sha256=ZNcuDvDZE9781tQqfKpptck_zJVK0aggq7IxrNHltao,21934
|
17
17
|
sglang/lang/choices.py,sha256=-W1DVw9N9ZliVpvmWrzIXG4cswAah8eMQrHWzkS3D8o,6234
|
18
18
|
sglang/lang/compiler.py,sha256=MAuzoOOpb98njJ7Io2SDmFkhTroDYiq0te0ZpfHkMY4,7597
|
19
19
|
sglang/lang/interpreter.py,sha256=JneG-Yw-XyOTBZCIoxTiQluQjAlSz1YswnV0l6pqVPo,34811
|
@@ -30,20 +30,19 @@ sglang/srt/_custom_ops.py,sha256=9GPNUyqnybgvUnzdQ8n5_NgluHmQNw0Gptos0iLPfrY,534
|
|
30
30
|
sglang/srt/aio_rwlock.py,sha256=6LYtOdeTUY3hkfa1dmYkgsaF2ttrwIF3hUWz2AZ2fqw,2970
|
31
31
|
sglang/srt/code_completion_parser.py,sha256=KFa95OU0TeVjJkOqIgS4xV3kaJ5dFWOmAAgISyc1oEc,3803
|
32
32
|
sglang/srt/constants.py,sha256=0i-tEwG2BSYNDy96MxnGHV5HnBELkYcnsVGsE-R18o0,93
|
33
|
-
sglang/srt/conversation.py,sha256=
|
33
|
+
sglang/srt/conversation.py,sha256=ocpOVHIKV2C0Unp3ALwtW71HZo3tgaCzadXp62Omqdw,41604
|
34
34
|
sglang/srt/custom_op.py,sha256=7OPQAZe3PqDXk-xM0Wxl7pm9cazilNJfkNiYIWztWgI,3198
|
35
|
-
sglang/srt/debug_utils.py,sha256=slaFOY4BYDBFatkfu8FZlzai-u4LFS-5GUzdr-t50zE,2241
|
36
35
|
sglang/srt/hf_transformers_utils.py,sha256=UiGjp70ZpTaZDJ99Roc-2DTkxV3gR-2oJjjaNY9Ekh4,12391
|
37
36
|
sglang/srt/jinja_template_utils.py,sha256=0c6nQjkGukmyXsqQ9r85R5QK9CafnjqXyrXF4K3aFhE,7177
|
38
37
|
sglang/srt/model_parallel.py,sha256=eLXZhvJ4wG6dh0FontNCIdVZvHYdWgaeY-5cu7TD9tE,6078
|
39
38
|
sglang/srt/operations.py,sha256=ddQ8KO63L73OciaR8MZ9h2h83gKVY4-WuWgeEGowPJA,5346
|
40
39
|
sglang/srt/operations_strategy.py,sha256=Pwd2sKeRtKh9WJXgzlNr2tU9y6YMcI3MDLbatHqlMws,7145
|
41
40
|
sglang/srt/patch_torch.py,sha256=OUPCGQSQz3MVZB1zZ_Eq8lXiw0uIKJ_HWjqQolI8FsM,3088
|
42
|
-
sglang/srt/reasoning_parser.py,sha256=
|
43
|
-
sglang/srt/server_args.py,sha256=
|
41
|
+
sglang/srt/reasoning_parser.py,sha256=6lkrkR8Q25EU3VAE0jjSq__361e3CkX0gJIieSfjsZk,9247
|
42
|
+
sglang/srt/server_args.py,sha256=hfPgshfRHHq-_wI4jjMAjMGeXqmr3ZSBB_3ZVW7c8Bo,85937
|
44
43
|
sglang/srt/torch_memory_saver_adapter.py,sha256=K_eTx0UU84MHSTXI3iqYLdHV4IWtJMJ2FKdGFJR8v1E,2417
|
45
44
|
sglang/srt/two_batch_overlap.py,sha256=Lx4bIXJb3hd9vzuJbmp3Crf4I8_NrT9fUbs-4LRzQXk,28711
|
46
|
-
sglang/srt/utils.py,sha256=
|
45
|
+
sglang/srt/utils.py,sha256=6YkLoFlKyLpCNlk6zzaM5ys5_dMRTMOWNoLH09oEsOs,93321
|
47
46
|
sglang/srt/warmup.py,sha256=zldxhMlXpclRAJXmfBjJNUJd1eDizVdysibBvQyTVuA,1782
|
48
47
|
sglang/srt/configs/__init__.py,sha256=8EcVRP95epZ49DxBa6LgKWt7eO3Qe7Hrr3V1c6HkMnY,553
|
49
48
|
sglang/srt/configs/chatglm.py,sha256=j-b0YkdYUmQm2y1kNmMJtKeACxWKmBbvNNkDWbs6kbI,2907
|
@@ -51,12 +50,12 @@ sglang/srt/configs/dbrx.py,sha256=tdhIkXAQl1yr0MxqFmsDG1E0e2puRTTKm6UTyANBLac,11
|
|
51
50
|
sglang/srt/configs/deepseekvl2.py,sha256=sYMmoy5_LlDXht7MTi4QGYOaiE8iMGUO44bnuOu4i8I,23683
|
52
51
|
sglang/srt/configs/device_config.py,sha256=kdwFrk5myAURxdp4rSr8ANpBpSJfuBDoT-kuCyuscRs,442
|
53
52
|
sglang/srt/configs/exaone.py,sha256=Duxd4yQoKy8GWEzZD_kCY_OzmN_67CTJL_Kgn0eXk3g,10731
|
54
|
-
sglang/srt/configs/internvl.py,sha256=
|
53
|
+
sglang/srt/configs/internvl.py,sha256=meLG4M2s27bPI-yTleRimPdAuOH1DjiVwUf2U6vXzno,27844
|
55
54
|
sglang/srt/configs/janus_pro.py,sha256=yI2c_aWBIKiTcK6RZxK6hq8CIxyYRH_NN8uaSNKsrKI,19156
|
56
55
|
sglang/srt/configs/kimi_vl.py,sha256=4W7VQI3pr888ZsFA2SqCQo4mI0seXTOrGQ-x3oTvWew,1358
|
57
56
|
sglang/srt/configs/kimi_vl_moonvit.py,sha256=hx2Rt4JSFbvy2HUTeLjBpge87m8M6ITAhqsgdNf_Jd4,1163
|
58
57
|
sglang/srt/configs/load_config.py,sha256=qs-AxuplouBx2tsv9KGBOLZPbwzuVA4vbktbGP_cRp8,3309
|
59
|
-
sglang/srt/configs/model_config.py,sha256=
|
58
|
+
sglang/srt/configs/model_config.py,sha256=X7xirRQx1M0OhM7L-cOPJqHfBFIOfiZiiov3E847nqY,28613
|
60
59
|
sglang/srt/configs/update_config.py,sha256=D-myV9Ombwp6wTF0RX9qUO6m5rxFiUcyse32FQADG28,4787
|
61
60
|
sglang/srt/configs/utils.py,sha256=3nHUfisMs_Ltuhv8OZTNCJp63YJKJVF43h1QZB1zqx8,670
|
62
61
|
sglang/srt/connector/__init__.py,sha256=czLX5JOxuMhH-T9eSJzoc1qv1B4z9chyffDRL5I6wo4,1247
|
@@ -67,19 +66,23 @@ sglang/srt/connector/utils.py,sha256=isTvxauz1_8no5MW6p8Bwj2H9mQkweaRO_RSwAPA7R8
|
|
67
66
|
sglang/srt/connector/serde/__init__.py,sha256=MvBJ7FBJtnou-AD-EdsCdAIDCcA8kWvUNuRViILVJ-0,718
|
68
67
|
sglang/srt/connector/serde/safe_serde.py,sha256=Iv_mFsDvk-cXuw0WTykBZ2yGxW0jb82DwVqC7r3RmAU,750
|
69
68
|
sglang/srt/connector/serde/serde.py,sha256=n59I2MXLa7WCyN_8pEd8L-scJk7lMhmEX-GOUIhF0ZA,1004
|
70
|
-
sglang/srt/constrained/base_grammar_backend.py,sha256=
|
69
|
+
sglang/srt/constrained/base_grammar_backend.py,sha256=ATWX1LKp3GjUDVkauEaSc3MnS8Bt6hOiHUgeYDZtgNo,7059
|
71
70
|
sglang/srt/constrained/llguidance_backend.py,sha256=Au8G8x4EB39w7k9-GFLP2hOPETyeAPw53RRZYdLimpA,6191
|
72
71
|
sglang/srt/constrained/outlines_backend.py,sha256=4Er45scnqHuJQ14kggsVX3RoHlaUD9t0ALIoWDQEmFg,6913
|
73
72
|
sglang/srt/constrained/outlines_jump_forward.py,sha256=Gyubp-FVetxd6wP4FA_kD6cCXIRfr8k_ZDviJyte048,6824
|
74
73
|
sglang/srt/constrained/reasoner_grammar_backend.py,sha256=YFxWuOTTo4e6cGhxnaBwuwli6f8FTUJtszib8dBq_8I,3207
|
75
|
-
sglang/srt/constrained/xgrammar_backend.py,sha256=
|
74
|
+
sglang/srt/constrained/xgrammar_backend.py,sha256=y_pmPUHEkqLM1BCHcakRYC99j2_hzrsivd5uJIKeuJE,8149
|
76
75
|
sglang/srt/constrained/triton_ops/bitmask_ops.py,sha256=WjTen9iuuFWLzkE1mAHQZB9_7aIy5QH8Wjf-lB-Fams,4614
|
76
|
+
sglang/srt/debug_utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
77
|
+
sglang/srt/debug_utils/dump_comparator.py,sha256=8ZPwP0zojfRHvPiSKgpESYFcC3tR-sBjIej5SotOmpg,3947
|
78
|
+
sglang/srt/debug_utils/dumper.py,sha256=eyrg5lmwyYF88kn8b06kpu1__aGnWb6CLM8fxywtooI,3158
|
79
|
+
sglang/srt/debug_utils/text_comparator.py,sha256=pg58q3fzsnd3rJKRgZTdcOviOtAv8pSYZdwf-TLffMM,5522
|
77
80
|
sglang/srt/disaggregation/decode.py,sha256=P-0OyFjjDfthEVhlJugdscWST_uoOVmHZlSlx9NYLmE,34242
|
78
|
-
sglang/srt/disaggregation/decode_schedule_batch_mixin.py,sha256=
|
81
|
+
sglang/srt/disaggregation/decode_schedule_batch_mixin.py,sha256=sUXmqiJGwuYoJvZjRCgTMVEN7bLefnEUlCTJpVA6ecI,6416
|
79
82
|
sglang/srt/disaggregation/kv_events.py,sha256=yFbtwOeblcCmOXTjg00TopxnyjkmCBQIVz46KB8jetY,13555
|
80
83
|
sglang/srt/disaggregation/launch_lb.py,sha256=mcbAztN4gnHevw_T5R2_nWsymsDEY9vHkm7OJ1vr6cc,4211
|
81
84
|
sglang/srt/disaggregation/mini_lb.py,sha256=bpnz6d90nv7vAoiPxmxFKlM1Gjct0R4IPkF9SwwBk9I,14504
|
82
|
-
sglang/srt/disaggregation/prefill.py,sha256=
|
85
|
+
sglang/srt/disaggregation/prefill.py,sha256=u8eKfWPuXiHDqFCWmhqlYhco3wy7nt5DjSmekwJTkhQ,24286
|
83
86
|
sglang/srt/disaggregation/utils.py,sha256=ql5p9yjBCRcR0YMgcgRK6tH0kPGvLNTUgeXBr_BUcoI,12198
|
84
87
|
sglang/srt/disaggregation/ascend/__init__.py,sha256=-lxnica6fZYmYNpKwmE8yESUpQ5Sxf2DiZoBHzboKc8,146
|
85
88
|
sglang/srt/disaggregation/ascend/conn.py,sha256=FOYrGtEhj58iTjhYT1eP96DpyxBLFFR87icqYCzWmCY,1215
|
@@ -92,7 +95,7 @@ sglang/srt/disaggregation/common/utils.py,sha256=SxRhAWisNK8seGhb5BXBJ5u53DF7yeK
|
|
92
95
|
sglang/srt/disaggregation/fake/__init__.py,sha256=jJGWdXwaQiGIoR6atKqkQfkJmVyQ09l55VUN2WjwaeY,77
|
93
96
|
sglang/srt/disaggregation/fake/conn.py,sha256=oD1DArn1yDFZCu-X6p93uSLlAXEkt9lYxERICMznxGw,2286
|
94
97
|
sglang/srt/disaggregation/mooncake/__init__.py,sha256=0TgqkAdQI1YynbHY6c0QISvVoOSk-0SwCIq5rjPSmgE,156
|
95
|
-
sglang/srt/disaggregation/mooncake/conn.py,sha256=
|
98
|
+
sglang/srt/disaggregation/mooncake/conn.py,sha256=4TnmzcCDDm15j3XFFw_n_awq958-ljVahy8nC3CuFdc,61842
|
96
99
|
sglang/srt/disaggregation/mooncake/transfer_engine.py,sha256=-ulLhz6DBDsmEjwNjjH5Pj8ngZKISgwBc_zL3ViGDN0,4761
|
97
100
|
sglang/srt/disaggregation/nixl/__init__.py,sha256=qODVPIGWUXKXq4zsRIcMYoAoAeg6nBIN9vdQOlVMANE,136
|
98
101
|
sglang/srt/disaggregation/nixl/conn.py,sha256=eSof87fG21Dd4COszfnbeXIxne3TWvw0mSvCOkjsBZc,20323
|
@@ -112,13 +115,13 @@ sglang/srt/distributed/device_communicators/quick_all_reduce.py,sha256=4j1_E4azo
|
|
112
115
|
sglang/srt/distributed/device_communicators/shm_broadcast.py,sha256=IrSrnpZnii0EJTS1CYRwEwE7gyHxJBVgI2QuJS3AKW0,20906
|
113
116
|
sglang/srt/distributed/device_communicators/xpu_communicator.py,sha256=ajW6132BvA6jkeipEIgN27TFycI0U06Ih2Z8WNjlA4s,1593
|
114
117
|
sglang/srt/entrypoints/EngineBase.py,sha256=yKN76witT2jz1zhmLHmPNLGMpK2UiOTaKQ2KPD8l99U,2594
|
115
|
-
sglang/srt/entrypoints/engine.py,sha256=
|
118
|
+
sglang/srt/entrypoints/engine.py,sha256=dGazuzKYxQSfXjea1aeSqaZubvLER0EVZzD7CvpHq9A,31595
|
116
119
|
sglang/srt/entrypoints/http_server.py,sha256=-unKM0lCK7Scd3LLTxLl-3vhit6lMb-wWfjLywelRy0,37214
|
117
120
|
sglang/srt/entrypoints/http_server_engine.py,sha256=_--j4U04OeJLlnnv1f0XmCd_Ry0z1FlhkrbePX8rYV0,4938
|
118
121
|
sglang/srt/entrypoints/openai/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
119
122
|
sglang/srt/entrypoints/openai/protocol.py,sha256=UUc5oJ7E60fYoUqMb53H85i7HHhDfmYLIFZidhNrP0s,19147
|
120
123
|
sglang/srt/entrypoints/openai/serving_base.py,sha256=5NJ2S_6B2NFSwn4nLp6eaeJ5iC3IcQzMEY9lW_gPcdA,5246
|
121
|
-
sglang/srt/entrypoints/openai/serving_chat.py,sha256=
|
124
|
+
sglang/srt/entrypoints/openai/serving_chat.py,sha256=MbLFLLFhvCTpJ_j7t03seXHHoFjlXCZtzVjSg_L7iz8,39841
|
122
125
|
sglang/srt/entrypoints/openai/serving_completions.py,sha256=emIutVmnJgOgGRuAqdB80-kVHUfQbE67n1VS-76o4QY,16690
|
123
126
|
sglang/srt/entrypoints/openai/serving_embedding.py,sha256=hqPt2ELpT1yQ8sBXo801aLJ3sExoPXs_K5ZQtC2vpAs,6274
|
124
127
|
sglang/srt/entrypoints/openai/serving_rerank.py,sha256=8n6y5kC6UhRpWrDtzH0eIp0dznW12FT60MLCR4bvD2U,3333
|
@@ -139,14 +142,15 @@ sglang/srt/eplb/eplb_simulator/reader.py,sha256=OlsWqsuXqVQY7PfvvrP-vsl2Ww2Kg4vD
|
|
139
142
|
sglang/srt/function_call/base_format_detector.py,sha256=FKBzsGFHfNl3Wvccsdvv9ftjbCZIyyjOLj2kHgKvX9g,15901
|
140
143
|
sglang/srt/function_call/core_types.py,sha256=wLUsW8mUA-i-ISz5QUDL7Ejq72W-K1HIhFa9Wm-_oA8,786
|
141
144
|
sglang/srt/function_call/deepseekv3_detector.py,sha256=WzJbwCe8DoOi8guX9pdVMd70CViVrwoaxi8PZwIC9pg,9712
|
142
|
-
sglang/srt/function_call/ebnf_composer.py,sha256=
|
143
|
-
sglang/srt/function_call/function_call_parser.py,sha256=
|
145
|
+
sglang/srt/function_call/ebnf_composer.py,sha256=HvLTgfNnBNKFKW-L36DKh07yRLbdTYjSfbTcLRUxZUc,14948
|
146
|
+
sglang/srt/function_call/function_call_parser.py,sha256=YTFGRA0rJf18ox2veLzmSBEm85QiZsPMNvNwiq8-iyo,8009
|
147
|
+
sglang/srt/function_call/glm4_moe_detector.py,sha256=TD67qS7T-9iR4-P5fhrUbqqYWEYVTb30dDNd7lGj4Rk,6934
|
144
148
|
sglang/srt/function_call/kimik2_detector.py,sha256=7unW_GwH7I6jrh2BZbw22mWRZzQ0OMTYDz_xVX5abPU,10116
|
145
149
|
sglang/srt/function_call/llama32_detector.py,sha256=trZja7IXc2IWUko5PRj7p4pRU6XCVjtxr-7qJNr0EWo,3647
|
146
150
|
sglang/srt/function_call/mistral_detector.py,sha256=Ts2HrJdu5r2lCCMVKPZfnCds9pt1K5H1EaOQrF_HD60,4686
|
147
151
|
sglang/srt/function_call/pythonic_detector.py,sha256=yAatItKtVDf9uhlB78wPWKP3fbefLJDNGGzFV5ey-YA,8756
|
148
152
|
sglang/srt/function_call/qwen25_detector.py,sha256=nv83_sipZMU6Vie3J4HeNiZVCSRU5ei7601j50779HA,5181
|
149
|
-
sglang/srt/function_call/qwen3_coder_detector.py,sha256=
|
153
|
+
sglang/srt/function_call/qwen3_coder_detector.py,sha256=3QAoK9W3YFPrx_j3xIsDpmQSnbX0BixMAlJ6BoNJo8o,5517
|
150
154
|
sglang/srt/function_call/utils.py,sha256=__ImDF2kNyoLWsYO5RYoryvy1mmgEjnjXlCvLv-uLCM,1695
|
151
155
|
sglang/srt/layers/activation.py,sha256=uhfhh10N5iLoLEBCvFPRjCfDxu5jXe1ehHJb3ISIjig,7840
|
152
156
|
sglang/srt/layers/amx_utils.py,sha256=1mENgHK2B8mgaD1oMtgbZ15Jmy_Uu1QueBmo09Ff2iA,2865
|
@@ -154,10 +158,10 @@ sglang/srt/layers/communicator.py,sha256=c5pJObNyP_7JsIWgLau_E-1ovtPCpAcge254fjo
|
|
154
158
|
sglang/srt/layers/dp_attention.py,sha256=tOre7il5Cppu930-tzM6d4AgjHuIJMCMlg9hJkuBcjA,11382
|
155
159
|
sglang/srt/layers/elementwise.py,sha256=MyQUflyKEfPZ-BggW1Kd4hB53RFD6FXGc2S5LXjx_do,16026
|
156
160
|
sglang/srt/layers/flashinfer_comm_fusion.py,sha256=fkTcAB7qYwSWi95qI3Rqq0JUyDpJdcYkd4TYkWO01HI,5891
|
157
|
-
sglang/srt/layers/layernorm.py,sha256=
|
161
|
+
sglang/srt/layers/layernorm.py,sha256=Qkx4Jzb3KWOt2okAVM6Is4FDClpUIJShcPGoElUSnEQ,9598
|
158
162
|
sglang/srt/layers/linear.py,sha256=NzjLqZrZNYcc3z2KtA9-n6pnSdBHHwU6NF_BbcAWp48,52471
|
159
|
-
sglang/srt/layers/logits_processor.py,sha256=
|
160
|
-
sglang/srt/layers/multimodal.py,sha256=
|
163
|
+
sglang/srt/layers/logits_processor.py,sha256=uduvaN1pFHX3imlx8FbmIG6aJMniOoPmoP0AGimQn5s,26630
|
164
|
+
sglang/srt/layers/multimodal.py,sha256=wVo5-OLz-J4k8fM0ld1ZKMtzOsSue4aa-uILak-I8Bk,2398
|
161
165
|
sglang/srt/layers/parameter.py,sha256=jCg0G-12GZqTa9gGOqEtVCsnnuBGnYg0VmF6pc6oCFg,17455
|
162
166
|
sglang/srt/layers/pooler.py,sha256=uZ6WX1FLMEafZwusyZdm6KuVlIwSjbKrdwk2qzgqNGk,3812
|
163
167
|
sglang/srt/layers/radix_attention.py,sha256=vtzCPfEiWYunglcLfqO9dcATb-LXzU4sFBwIWsWHbiY,3513
|
@@ -175,13 +179,14 @@ sglang/srt/layers/attention/flashattention_backend.py,sha256=rYsBAsFS1qNNe-3CVIa
|
|
175
179
|
sglang/srt/layers/attention/flashinfer_backend.py,sha256=HQp14R29hQVXYjATKPoGaHY9LJ9e1cw2k-RhBEmFxt8,51505
|
176
180
|
sglang/srt/layers/attention/flashinfer_mla_backend.py,sha256=NirRlNFxD0S2EncvvmrerIxNfuTnYpvemZV3MR5_FnU,34040
|
177
181
|
sglang/srt/layers/attention/flashmla_backend.py,sha256=5iSic5ho-lkXNas9mR3uLbXbEl-do31gc8gjR7-a79k,20711
|
182
|
+
sglang/srt/layers/attention/hybrid_attn_backend.py,sha256=ZIzBeR5r0SMkNLekEWPUCas_TCNOmzZ725YaueYVUlM,3196
|
178
183
|
sglang/srt/layers/attention/intel_amx_backend.py,sha256=hH9lxXs_o66_IVs58oPhRCOXGUrHbXSz82FKtHr9GO8,4092
|
179
184
|
sglang/srt/layers/attention/merge_state.py,sha256=OnWmNV6LYTUj0y8SCy_IK7A9q6v9bZwR4_XiLOIvbrk,1423
|
180
185
|
sglang/srt/layers/attention/tbo_backend.py,sha256=CBnSDUmDvT-Tbhi9NHNo1LLkgUAcIsWMJgKa-sAIKW8,9318
|
181
186
|
sglang/srt/layers/attention/torch_native_backend.py,sha256=RsI4lYiQJAj-Xy0vKkzbyKOWHAVPOD9b0n0dEehwlos,9496
|
182
187
|
sglang/srt/layers/attention/triton_backend.py,sha256=AryrPc4kzioxkiucPkApMA__0HoQTKOHNpwN0GEgm98,36923
|
183
188
|
sglang/srt/layers/attention/utils.py,sha256=KiRSIHaGBhErUhPWCSD3Uiaqb0pSEF0NJFwTTQXoMks,2887
|
184
|
-
sglang/srt/layers/attention/vision.py,sha256
|
189
|
+
sglang/srt/layers/attention/vision.py,sha256=zI1Pq2Tx4SwOzYhIarxNtlTiZeVMWxVf8j-Pf7xhzCA,18111
|
185
190
|
sglang/srt/layers/attention/triton_ops/decode_attention.py,sha256=eN0Lqpu5h27lMPuRnisX4jrU0WR061pCFSrh3vLlSD0,18936
|
186
191
|
sglang/srt/layers/attention/triton_ops/double_sparsity_attention.py,sha256=FbgrPO5GvEGEvojV7Ss0jX7384e9vuzX2goDCQuP1Zk,31124
|
187
192
|
sglang/srt/layers/attention/triton_ops/extend_attention.py,sha256=ImpCuxszoeVdr6wzaLR3OGW3-50P9EAEvsRCdUVIrxE,14261
|
@@ -193,15 +198,15 @@ sglang/srt/layers/moe/cutlass_moe_params.py,sha256=9NRCmgP_Ug3gGqCcpi-x-QRbLjCNp
|
|
193
198
|
sglang/srt/layers/moe/cutlass_w4a8_moe.py,sha256=bc8s5Oc36pCF0VozxZuqFOOU2fov-4wGPlyduye3Imk,7296
|
194
199
|
sglang/srt/layers/moe/fused_moe_native.py,sha256=SkOFgU23aZfHmLhnkVhdUWGx0-2wbo6uu9ohKBp2yOI,3486
|
195
200
|
sglang/srt/layers/moe/router.py,sha256=UrPieRvemN7Ew48gtG7DA2xhNDBRSnZxzugTEBI-0_E,12006
|
196
|
-
sglang/srt/layers/moe/topk.py,sha256=
|
201
|
+
sglang/srt/layers/moe/topk.py,sha256=dOyJcpjIQYlgk8i_JsJyJzxaZZgmAcSMr9OgceG0arQ,26851
|
197
202
|
sglang/srt/layers/moe/ep_moe/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
198
203
|
sglang/srt/layers/moe/ep_moe/kernels.py,sha256=UFH-XacP3aBjAcn6_SeC641jGzjSrY0fz50IB9URix4,42706
|
199
|
-
sglang/srt/layers/moe/ep_moe/layer.py,sha256=
|
204
|
+
sglang/srt/layers/moe/ep_moe/layer.py,sha256=6fspJli5_89rItBZDua_gNMP8eAq9ZgFOv029aoIIwg,45701
|
200
205
|
sglang/srt/layers/moe/ep_moe/token_dispatcher.py,sha256=aiBE3mjvWV3eBrFGH9J44tuJncQwOjRS_XeyBNCEtqM,24379
|
201
206
|
sglang/srt/layers/moe/fused_moe_triton/__init__.py,sha256=4NXZHbCw-G-uSnNUj4up0yh3xBDPnT-x0pdoIr0lku8,831
|
202
207
|
sglang/srt/layers/moe/fused_moe_triton/fused_moe.py,sha256=6NcY-6UHQUSVP4qzc8jis4h-W9BEV4lnGmrJMx2S6eA,57164
|
203
|
-
sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=
|
204
|
-
sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py,sha256=
|
208
|
+
sglang/srt/layers/moe/fused_moe_triton/layer.py,sha256=U3Qaffyj-aGFc6TvlB057eCbiv9oHbPDdwPVHsM7FJs,23278
|
209
|
+
sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py,sha256=HOEJJyehKTUIjkcsTc29aEXHqVLgDlv_jQL5fjvuUxU,5856
|
205
210
|
"sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_1_0/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json",sha256=iNGsE2ZeVnQEnN4A8UJ9Jv0d3hbRF2MJ9oBgjup5Szk,2737
|
206
211
|
"sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_1_0/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB.json",sha256=JJN0hryyLr5Zv3dSS7C8cPFhAwTT6XxUVnBGMZvV6JA,2752
|
207
212
|
"sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_1_0/E=1,N=1792,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json",sha256=ouRyZ5PEMPP2njPftCNhs-1g1y6wueWLmhI7G1SjV1k,4131
|
@@ -346,6 +351,7 @@ sglang/srt/layers/moe/fused_moe_triton/triton_kernels_moe.py,sha256=hoWVdf8ry8ID
|
|
346
351
|
"sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_2_0/E=128,N=768,device_name=NVIDIA_H200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=pdQ1RvXvdWDn8Y8-8MAX3vn-T-wbtkZvHV9GZZvNjnc,3266
|
347
352
|
"sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_2_0/E=128,N=768,device_name=NVIDIA_H200.json",sha256=JraM-Nvbg5V_TJkSl6UPFYZN1zHHoIbr2pAcksenoTY,3248
|
348
353
|
"sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_2_0/E=128,N=96,device_name=NVIDIA_H20.json",sha256=JtcHRlPz8xQEAqJ9EWI63oYvdmjQFG6VTHqtt85VOSA,3221
|
354
|
+
"sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_2_0/E=160,N=320,device_name=NVIDIA_A800-SXM4-80GB,dtype=int8_w8a8.json",sha256=ZRON2XIRRZrvJ3tbPuQ7-0HqGZ_FkPpRN3yj1isGmpg,3255
|
349
355
|
"sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_2_0/E=257,N=128,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=ttFuL1rKnEpShItmlGyClOfpUwLi5cZYFaVgo7CAxnA,3268
|
350
356
|
"sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_2_0/E=257,N=128,device_name=NVIDIA_H20,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=Pc2ri-qDByslfD8LgJtRB9QDWjI-KqMeA5ftltiwy8k,3262
|
351
357
|
"sglang/srt/layers/moe/fused_moe_triton/configs/triton_3_2_0/E=257,N=256,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128, 128].json",sha256=uuua9V6-1H38ASMPQ60t7UOtV0IQLZWBCl13MwQ25Ss,3264
|
@@ -375,23 +381,23 @@ sglang/srt/layers/quantization/awq.py,sha256=gLEOx6QoGQ0McBEURXPVidKGsdNUjqc9sJw
|
|
375
381
|
sglang/srt/layers/quantization/awq_triton.py,sha256=4XwJbRNlFmlvjbMGtWF1Wvk26Kf96162vNEmuI5Kars,11737
|
376
382
|
sglang/srt/layers/quantization/base_config.py,sha256=CiSxG5iuOa-12V9kIOh0Fu8Y7knZxfFbbNGTo6nEaRE,7173
|
377
383
|
sglang/srt/layers/quantization/blockwise_int8.py,sha256=3avetVUBjCiuYWBJQbElbVXWpx0SgsFsDc5F9F_zHgA,13879
|
378
|
-
sglang/srt/layers/quantization/fp8.py,sha256=
|
379
|
-
sglang/srt/layers/quantization/fp8_kernel.py,sha256=
|
384
|
+
sglang/srt/layers/quantization/fp8.py,sha256=sIA-PCDDu2-AtcwvPcvzitxjCtrvEx_dig_AoocCfhY,47100
|
385
|
+
sglang/srt/layers/quantization/fp8_kernel.py,sha256=8alryD9sEROh9Dh4cdPrGIpuOPbT6Hx6PNSe8fJc9zM,40856
|
380
386
|
sglang/srt/layers/quantization/fp8_utils.py,sha256=6FVR6_Y8akP4ihCaGG_bLYurcC_PShPtiPgiEvGN5bE,25605
|
381
387
|
sglang/srt/layers/quantization/gptq.py,sha256=3q9xfq5sJJHcrVr9C8-l9JdcLFvwKAAfWJEfZW6CzLs,39145
|
382
388
|
sglang/srt/layers/quantization/int8_kernel.py,sha256=GfRC9FOn9exNvK4QHbUeBj3Hhv32VcyGphapFPt5b84,12625
|
383
389
|
sglang/srt/layers/quantization/int8_utils.py,sha256=YK9CS-lb_n91kNCTKK5o5apYF31V2giDg5G5VKrpcUA,2356
|
384
390
|
sglang/srt/layers/quantization/kv_cache.py,sha256=_9pF5rwvB7ta6Gdc5YKVVGbNzYwqmhIx4TrX1-xnodQ,3261
|
385
391
|
sglang/srt/layers/quantization/marlin_utils.py,sha256=ShsoxcVTYo1Es3XKp9mlQNw-TsRF_o4mHIO5MfAP5HA,25906
|
386
|
-
sglang/srt/layers/quantization/modelopt_quant.py,sha256=
|
392
|
+
sglang/srt/layers/quantization/modelopt_quant.py,sha256=pJDavvIiy6oY__GoknDgeq1o8jVF99CzYgWy7i6Cz9E,38288
|
387
393
|
sglang/srt/layers/quantization/moe_wna16.py,sha256=NGcFjiMXwfOX10dkHAY3EgZHxox2k7I402Bvwj3jW1Q,19105
|
388
394
|
sglang/srt/layers/quantization/petit.py,sha256=74Jn0eICq23v_b4rEctDaYTINtbqkdM6IXycT-_FbbI,8954
|
389
395
|
sglang/srt/layers/quantization/petit_utils.py,sha256=-gy4zMhqNoIA1R0n7-5C0efV54jHonCUgPDUUFjGsyM,3245
|
390
396
|
sglang/srt/layers/quantization/qoq.py,sha256=jM96uJfKz3vo1B6SSIrQXNT3vnD3UJrepK2eY-tSQU4,8139
|
391
397
|
sglang/srt/layers/quantization/scalar_type.py,sha256=nBk4THjeRWMGW3hKWRdrjfQ0gwpuBxmYqapDBaRpnr4,12395
|
392
|
-
sglang/srt/layers/quantization/unquant.py,sha256=
|
398
|
+
sglang/srt/layers/quantization/unquant.py,sha256=zmxzCg46IOjIILRPFaZ4FPxodVT83X5nrFAKlkYUiVI,12330
|
393
399
|
sglang/srt/layers/quantization/utils.py,sha256=9ZmfS0MMqueQ6zIxMIFoQy2OFBQ5vHjOHBgVvUn7ews,16213
|
394
|
-
sglang/srt/layers/quantization/w4afp8.py,sha256=
|
400
|
+
sglang/srt/layers/quantization/w4afp8.py,sha256=cYLUuDARPP6NsiYSihDnJYZwLakDL-RGYokTIJ-v_2I,11074
|
395
401
|
sglang/srt/layers/quantization/w8a8_fp8.py,sha256=I_W9A4Pnluaf-SaT8zq-tAJTt1acpxfE_kG5mqdc5cE,10250
|
396
402
|
sglang/srt/layers/quantization/w8a8_int8.py,sha256=VGrVELArNuyw4FEtUefaeK8ayuX7cpXj1OOqCmOCzm4,34902
|
397
403
|
sglang/srt/layers/quantization/compressed_tensors/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
@@ -562,7 +568,7 @@ sglang/srt/lora/layers.py,sha256=FaTYf0w3zbKKKAT1nJdAzGRtxvySB6FpNKXvEi5RHH0,129
|
|
562
568
|
sglang/srt/lora/lora.py,sha256=sRoU7BdlTV4cnBv1-u3QjisVR9XQrrqAsmhxdNtd8dU,9433
|
563
569
|
sglang/srt/lora/lora_config.py,sha256=qDgMTx_69jyJUl29O5FxLzYa0BMhqYVXWXfyyVOvGm0,1684
|
564
570
|
sglang/srt/lora/lora_manager.py,sha256=ABuqg1IhY9LNXgJd_v3Yx_VHS52t4SapHmhLiH1thdc,20147
|
565
|
-
sglang/srt/lora/lora_registry.py,sha256=
|
571
|
+
sglang/srt/lora/lora_registry.py,sha256=z3Ib7nlr1gajeSwJjC7sL8eMiaLiZo7dOB3WZnlyBVM,7676
|
566
572
|
sglang/srt/lora/mem_pool.py,sha256=UYvTgEPvBoVsaX5rEnipebOAlo75pML6_NO9GfCFzl8,12148
|
567
573
|
sglang/srt/lora/utils.py,sha256=5G0KiDEn-Zg4OgIOjWnU2ZdQGNstZswoAog9xU4GVDA,5660
|
568
574
|
sglang/srt/lora/backend/base_backend.py,sha256=EIz8I-GIrdmK4fISw3ENhbJVVITaxKfyLxHXGPU4fPs,5044
|
@@ -573,21 +579,21 @@ sglang/srt/lora/triton_ops/gate_up_lora_b.py,sha256=QURCYxHNR8Ls4SQtt3dvdgjvdDVh
|
|
573
579
|
sglang/srt/lora/triton_ops/qkv_lora_b.py,sha256=iz5scFNo2YFTeiM8beWg9Z1oZI-6AM_T1wBMCQ6qp2Q,6485
|
574
580
|
sglang/srt/lora/triton_ops/sgemm_lora_a.py,sha256=Ksova04wgeGsFqGOXWqJtMYaHgyUYcx8VU42BZQOkVA,5129
|
575
581
|
sglang/srt/lora/triton_ops/sgemm_lora_b.py,sha256=VqCAFvUtq_l-0RGIkx3W_fzD55QcW2FAcqpvSHOBFp4,5115
|
576
|
-
sglang/srt/managers/cache_controller.py,sha256
|
582
|
+
sglang/srt/managers/cache_controller.py,sha256=HoI6_os2h8rrvyEJ6Kk4ibUF3aKH-9Z8K5pksc6BECQ,24603
|
577
583
|
sglang/srt/managers/configure_logging.py,sha256=8sNXZ2z9pBWOwn-X3wyz013Ob8Nbm1zDxRkxoZjH-l4,1633
|
578
584
|
sglang/srt/managers/data_parallel_controller.py,sha256=PZ-wOcAFn3PQqMB6I2vjIsFmplf0nlNl5hqTDKTHTG8,12112
|
579
585
|
sglang/srt/managers/detokenizer_manager.py,sha256=SpLxTsSPKBZfD-ZMhJ5zpPPGuUb8PmcYgFSL9CsurU4,10696
|
580
586
|
sglang/srt/managers/io_struct.py,sha256=LNLG7utMidF63eYWlWYxQ3G2GzOqaQzQc-9ld2yaycI,37859
|
581
|
-
sglang/srt/managers/mm_utils.py,sha256=
|
582
|
-
sglang/srt/managers/multimodal_processor.py,sha256=
|
583
|
-
sglang/srt/managers/schedule_batch.py,sha256=
|
587
|
+
sglang/srt/managers/mm_utils.py,sha256=VrJiv0k_zDa83BsfVv8rmckgXKsvF0Wz88bCAb6R1as,29601
|
588
|
+
sglang/srt/managers/multimodal_processor.py,sha256=mLnGcUHIvjruwoVhqiz4j7RMYMsZnvQMH8JnKCITDlY,1805
|
589
|
+
sglang/srt/managers/schedule_batch.py,sha256=xmWSPAsllmPaWtKNrf-P8IX6fuQMTD-vZuk1y01vUjA,76289
|
584
590
|
sglang/srt/managers/schedule_policy.py,sha256=BFYItMXtrsO5157tpFhYwLpZ8NSlzR4_gNZC1iE10D4,22400
|
585
|
-
sglang/srt/managers/scheduler.py,sha256=
|
591
|
+
sglang/srt/managers/scheduler.py,sha256=rwI-qSIeVkzxkmVXPPtbK0mkQ5WY3myU3lV_AImFJ-Y,122502
|
586
592
|
sglang/srt/managers/scheduler_output_processor_mixin.py,sha256=Ei-9lyfrSQAlL9_ULuJLAhA7qpvUzjsBDzBBTDdnt4Q,31394
|
587
593
|
sglang/srt/managers/session_controller.py,sha256=dzlMNZlo20FTSl64QqK7y7pElsdCy8ICOWWBPTBVwgs,6040
|
588
594
|
sglang/srt/managers/template_manager.py,sha256=RrwRA2oqId_PMQ98qJQGwIxMroOxiorl2sGC9ARou_0,8543
|
589
|
-
sglang/srt/managers/tokenizer_manager.py,sha256=
|
590
|
-
sglang/srt/managers/tp_worker.py,sha256=
|
595
|
+
sglang/srt/managers/tokenizer_manager.py,sha256=yAgnR5eYeiid8gwJSBNQ1tkrYd5dq0RHXWn8nO_UdvY,76284
|
596
|
+
sglang/srt/managers/tp_worker.py,sha256=D_NoiX69ry8cKRUYjX4nhtlPLdz1dipJEJekTouNG70,11363
|
591
597
|
sglang/srt/managers/tp_worker_overlap_thread.py,sha256=kK0pn8mz-XgLGvVlJK6LvDVp4lnFk5vJH-Cs9NQ5Un4,10959
|
592
598
|
sglang/srt/managers/utils.py,sha256=9_VGE48EK0PXVJ26aYvbRJ6n7gIZALvCcf6uZCccCgM,1369
|
593
599
|
sglang/srt/mem_cache/allocator.py,sha256=id4riucsG9d-P1ikj3-DLJbzhM8-MuJfvDmB8H4g9-o,23364
|
@@ -595,7 +601,7 @@ sglang/srt/mem_cache/base_prefix_cache.py,sha256=hLS2ncTMAz7Kpdk5pNwn5c6g8b61_K9
|
|
595
601
|
sglang/srt/mem_cache/chunk_cache.py,sha256=FU_fq8e_dodgU8EkRqE4Jr0sKwCXQnKmapO88k6_JfU,3207
|
596
602
|
sglang/srt/mem_cache/flush_cache.py,sha256=GYcxmNXh4hsMpFfNOuCTpKilW7guZwTtAg_usVeM3J0,979
|
597
603
|
sglang/srt/mem_cache/hicache_storage.py,sha256=pvNeooVmCZBeZFgSHWNGPZzqtHI_qJ5BpTy_A4i6gg8,5539
|
598
|
-
sglang/srt/mem_cache/hiradix_cache.py,sha256=
|
604
|
+
sglang/srt/mem_cache/hiradix_cache.py,sha256=3BXlIZUyQk2dkwuwsMvSUSXd8fCDLPvcTLOp9FnzxBY,24779
|
599
605
|
sglang/srt/mem_cache/memory_pool.py,sha256=jQdWgOr6hpMLbGaEJc4immBgZG_MZbx8LyOv029ASVw,40932
|
600
606
|
sglang/srt/mem_cache/memory_pool_host.py,sha256=xcjYyC94FOH_NguWbLUG4vF_CSBcxA_msuRsBasYCPo,10387
|
601
607
|
sglang/srt/mem_cache/multimodal_cache.py,sha256=wZl2KeEl3xeoEsYdH33UoM-FO8kqfLo_XUgereJVvoM,1348
|
@@ -605,7 +611,7 @@ sglang/srt/metrics/collector.py,sha256=FH6Wil2lMK7d7q74CfxfdULCaHKDXeAoo8UBZqqde
|
|
605
611
|
sglang/srt/metrics/func_timer.py,sha256=VFyNRrbnKVCwnQsrlLin1lITJfjQpf9m8sGPqL5LIsQ,3438
|
606
612
|
sglang/srt/model_executor/cuda_graph_runner.py,sha256=6njRGysrhBDi2bAt5DyjGnyrexYvuEVsAJwQBBW8Ut0,31886
|
607
613
|
sglang/srt/model_executor/forward_batch_info.py,sha256=NvUhReevoy6UfO4991P_5MPQyfefC3BOoTwTqUwMbYk,38430
|
608
|
-
sglang/srt/model_executor/model_runner.py,sha256=
|
614
|
+
sglang/srt/model_executor/model_runner.py,sha256=UkI7i73Noaar9__sYVDGA-xEQHYSllZPUxRIbLwduWU,72373
|
609
615
|
sglang/srt/model_loader/__init__.py,sha256=zGZkOBz1zx-pkaIy47BasL3fjDlAcxAXUTjInOhXHAE,919
|
610
616
|
sglang/srt/model_loader/loader.py,sha256=wxSUYrqv23w9yHYy9Lm0ozWggs9pf6Co4yqe1UO8PZk,59799
|
611
617
|
sglang/srt/model_loader/utils.py,sha256=svSrPQxViBz_-0_sByu4coCYrzJ51-4FCi_bFqa6rDo,4474
|
@@ -619,7 +625,7 @@ sglang/srt/models/dbrx.py,sha256=4pn_fdoATg01VEqNnIAxNEsKV5XU7gwHyd289eydq1s,155
|
|
619
625
|
sglang/srt/models/deepseek.py,sha256=sqobTr9a9c5pNLNJZE-WrJIE_qBq0lC5gCGv9NpGU_Q,17364
|
620
626
|
sglang/srt/models/deepseek_janus_pro.py,sha256=td8xGs6ARfJ8AQCYwUhMOZoWigrAs7m3trF5-kXCqik,70418
|
621
627
|
sglang/srt/models/deepseek_nextn.py,sha256=47fehxRdiOizr0rdLg5f1fzQEx6gGAOcDcWKtblloyk,5928
|
622
|
-
sglang/srt/models/deepseek_v2.py,sha256=
|
628
|
+
sglang/srt/models/deepseek_v2.py,sha256=d6itbiEH_Zj0DdvH10dbxwTN7kK4g7rQYJVQ6A2-B70,105428
|
623
629
|
sglang/srt/models/deepseek_vl2.py,sha256=7X3gI4DE7guUtNJvMLf06jO8MUHKa2Aan8evZg5hsXc,13061
|
624
630
|
sglang/srt/models/exaone.py,sha256=TpO-rtCpEZ8Ua7hGFnS8l2oAYhY0Pij50grc9WQ2mvc,13576
|
625
631
|
sglang/srt/models/gemma.py,sha256=2atKwFN5wCsJCmBRmURX9vaCcFjxlFirL7xsnG5KPlI,14180
|
@@ -631,6 +637,8 @@ sglang/srt/models/gemma3n_audio.py,sha256=isgKfjA5UieYawxU6medL2ssXlzYPqAbagDBnL
|
|
631
637
|
sglang/srt/models/gemma3n_causal.py,sha256=kBDlpSWAg6ZDmUPe08Q7sj5CbdVD_0h07zwJw8sKu7I,36335
|
632
638
|
sglang/srt/models/gemma3n_mm.py,sha256=pL_fvnkz9fKaC2Afms5KG3Me3u5sp1C2-mAUhqPGrQ4,18701
|
633
639
|
sglang/srt/models/glm4.py,sha256=2VQzUqFkQTy_2nfkxP9SF6_9kKLTZUExGRjge7r99Es,11265
|
640
|
+
sglang/srt/models/glm4_moe.py,sha256=vNJfab2DVhMEU-9RsPd7zyLofkX7SqYHRY97vFcYkDA,39864
|
641
|
+
sglang/srt/models/glm4_moe_nextn.py,sha256=cWB6o3w7xBvgi2ouGKsqZ3iovKH65QiRQul42wcgzMk,5897
|
634
642
|
sglang/srt/models/gpt2.py,sha256=kclhxEs8oJk1KCyhmAqo7rZqecVGGHYkc-a1WZi3aIk,9841
|
635
643
|
sglang/srt/models/gpt_bigcode.py,sha256=1D6bi8Zu760gCRZkvdLHFcg8kCkY35ARwQYaMDtYhl4,10307
|
636
644
|
sglang/srt/models/granite.py,sha256=5WOJyNYAlt5RNHSexNfPNihhSxIMd7wPzju1cTixKig,20852
|
@@ -640,7 +648,8 @@ sglang/srt/models/hunyuan.py,sha256=GVDeMKgcqW6HMFWPUukznL5JoDW4CpOpS5Q_PXlbHw8,
|
|
640
648
|
sglang/srt/models/idefics2.py,sha256=U3khd3hbdawJeRNXsxmaKHdssOCT5TPOZ1D-2_zHoQo,12079
|
641
649
|
sglang/srt/models/internlm2.py,sha256=F_iNY1gUqzAjAuUatcE47gnrcoTh5_08PY2Rw9tKr9M,13150
|
642
650
|
sglang/srt/models/internlm2_reward.py,sha256=ndfGmyqYZbVZ7C7rJ-v9oK3wa-EpoBGybS8MlyKZi2E,2522
|
643
|
-
sglang/srt/models/
|
651
|
+
sglang/srt/models/interns1.py,sha256=nResXUzfcHZoJie1gHuYwyVir7Ys2fWp3hjzTs6Utvk,14182
|
652
|
+
sglang/srt/models/internvl.py,sha256=o6XSAvnMYK5tTPbln9RI9BfRfAQZBE8_xmGPffrznnQ,27838
|
644
653
|
sglang/srt/models/kimi_vl.py,sha256=XulRiufQzOSWZe8-bUl2OEdznvsVU9OBsEYipaX3YkM,12877
|
645
654
|
sglang/srt/models/kimi_vl_moonvit.py,sha256=M5L7AJOJ2Zh2pqLZAq8aRqhbTSlipr8XOoD3ix6o2sU,23908
|
646
655
|
sglang/srt/models/llama.py,sha256=Nsxv2s1sOmLnZsTHkwbTh53cUFEQ2fnKDQi5BFbFcsk,28994
|
@@ -650,13 +659,13 @@ sglang/srt/models/llama_eagle.py,sha256=Ubh_jmtfiOnriwvHgQT0ZGID7JvYvdSi_QGHOIkE
|
|
650
659
|
sglang/srt/models/llama_eagle3.py,sha256=715soylDE3kOMWskbPy_70BFxaSc5ptaHCS1v3-ViA0,8579
|
651
660
|
sglang/srt/models/llama_embedding.py,sha256=zq-_lNu35VBFc7eemiam0zdkGIE8fzrgk5OWYfirZnA,3254
|
652
661
|
sglang/srt/models/llama_reward.py,sha256=LF2nqMV5XOrljGjAwJg43mBv3z6Q040I2EYlgZeCp8k,4681
|
653
|
-
sglang/srt/models/llava.py,sha256=
|
662
|
+
sglang/srt/models/llava.py,sha256=xzYip_BAwpzSIdZre43LZiyTpFISa0ZCLdO6LUSbaCg,37702
|
654
663
|
sglang/srt/models/llavavid.py,sha256=-CSk0RJ2MQeb81sh-RISeVJFaI-XWY6nR6_I594MkME,12818
|
655
664
|
sglang/srt/models/mimo.py,sha256=Mp-iFp4YHuiuq-H8enUF5K5QbMnVcvEa6mURH6vM3yM,6140
|
656
665
|
sglang/srt/models/mimo_mtp.py,sha256=jSmqJAXu7G3OO7jW1oa2suI4H_Yl7u5ZT7w4lHFbHhg,7292
|
657
666
|
sglang/srt/models/minicpm.py,sha256=CzBJyZtfMpp8jvlEl29DHI7HLVq-CxuqP1UHwxIbaUI,14567
|
658
667
|
sglang/srt/models/minicpm3.py,sha256=6-gfHSfXwyB5zw7AIj-c5TzjpEKR6CM0H67MrD8LVUE,19347
|
659
|
-
sglang/srt/models/minicpmo.py,sha256=
|
668
|
+
sglang/srt/models/minicpmo.py,sha256=st8I13Ere5RkRHHQQN1LgZh1ybUA3_buxaaE4XlV8ag,76123
|
660
669
|
sglang/srt/models/minicpmv.py,sha256=g4aAOG8PVGkZqGmlneVaScAtNpSLqSVbZGRAikyrBy8,30394
|
661
670
|
sglang/srt/models/mistral.py,sha256=ni7PppA_5X4ivTnIps3yoEaMEL-G6Gaf9b5hGC1vU5Q,3475
|
662
671
|
sglang/srt/models/mixtral.py,sha256=j2whKt4GdQqtpKL5iN0Vb4TO4el1E2qEpUCI57E_47Q,17222
|
@@ -680,11 +689,11 @@ sglang/srt/models/qwen2_5_vl.py,sha256=vOuIyK_NLuGgz9LlAdyM7cSQUU93VnBCYXUr_n4iO
|
|
680
689
|
sglang/srt/models/qwen2_audio.py,sha256=lVeYmC29eVZIR9I6ZjFe4xvC0wSXR0NtGCli6fSXtms,7870
|
681
690
|
sglang/srt/models/qwen2_classification.py,sha256=dGrMm4ebd30_lBhHOhaV57ig2iOTx3nqB4GEzsrRIM8,2747
|
682
691
|
sglang/srt/models/qwen2_eagle.py,sha256=6spFg6JYQGeUXLv2Q5eMkVzZvnqGyvW6SdVBtFMxlTM,4806
|
683
|
-
sglang/srt/models/qwen2_moe.py,sha256=
|
692
|
+
sglang/srt/models/qwen2_moe.py,sha256=drTwlJlP0PLDl-Rl2h4GaOmOxexV1SMjMP97izhVpLk,25822
|
684
693
|
sglang/srt/models/qwen2_rm.py,sha256=-mQXDEv11p-I1HXgYLTtY6ROem6UYorO958WsDrzsgs,2837
|
685
694
|
sglang/srt/models/qwen2_vl.py,sha256=ZRAL32Ymt4ZCBqB0JorXAm4ZBrECZ9EbaXKaTSikkQM,21366
|
686
695
|
sglang/srt/models/qwen3.py,sha256=COSC1TsCQNTq3E1QoVJYj1yTn-CFEVEX7keRwrrBXLs,20121
|
687
|
-
sglang/srt/models/qwen3_moe.py,sha256=
|
696
|
+
sglang/srt/models/qwen3_moe.py,sha256=Vcdt77gDniDoZiAgsdhcWHtw1GiH-3Pk8GpiUxpjXWc,34019
|
688
697
|
sglang/srt/models/registry.py,sha256=bH9H0OiNV0Cn7FRBM30Oh6dxICTs9mJscdLtHYPJvxc,3783
|
689
698
|
sglang/srt/models/roberta.py,sha256=3k53V2Gbezk3jU-D03thXx8csGn5DxFK01ZQ9WFiWPI,9828
|
690
699
|
sglang/srt/models/siglip.py,sha256=DIVJRwdtpLD2QT1kVPIHw7Bn9BE40xJbkHujDNzkjgA,9892
|
@@ -696,23 +705,23 @@ sglang/srt/models/xverse.py,sha256=DsNVI9JpzN4jj0Ry6aTrj7r-xq5YLOoDX2kH4YLJA-I,1
|
|
696
705
|
sglang/srt/models/xverse_moe.py,sha256=7KCM2-j12towDMNvXkuuYiBOmNauH6NG4Ip40x0khqA,16782
|
697
706
|
sglang/srt/models/yivl.py,sha256=oToK7-u5IGO7xwpJIQ7VtudlK6-zPqJX4bt6_wv0SH8,4850
|
698
707
|
sglang/srt/multimodal/mm_utils.py,sha256=6bV1_a7Iet9W0y3qdd0E-hFM78zalIzNZCYbLzJX2y8,12640
|
699
|
-
sglang/srt/multimodal/processors/base_processor.py,sha256=
|
700
|
-
sglang/srt/multimodal/processors/clip.py,sha256=
|
701
|
-
sglang/srt/multimodal/processors/deepseek_vl_v2.py,sha256=
|
702
|
-
sglang/srt/multimodal/processors/gemma3.py,sha256=
|
703
|
-
sglang/srt/multimodal/processors/gemma3n.py,sha256=
|
704
|
-
sglang/srt/multimodal/processors/internvl.py,sha256=
|
705
|
-
sglang/srt/multimodal/processors/janus_pro.py,sha256=
|
706
|
-
sglang/srt/multimodal/processors/kimi_vl.py,sha256=
|
707
|
-
sglang/srt/multimodal/processors/llava.py,sha256=
|
708
|
-
sglang/srt/multimodal/processors/minicpm.py,sha256=
|
709
|
-
sglang/srt/multimodal/processors/mlama.py,sha256=
|
710
|
-
sglang/srt/multimodal/processors/mllama4.py,sha256=
|
711
|
-
sglang/srt/multimodal/processors/phi4mm.py,sha256=
|
712
|
-
sglang/srt/multimodal/processors/pixtral.py,sha256=
|
713
|
-
sglang/srt/multimodal/processors/qwen_audio.py,sha256=
|
714
|
-
sglang/srt/multimodal/processors/qwen_vl.py,sha256=
|
715
|
-
sglang/srt/multimodal/processors/vila.py,sha256=
|
708
|
+
sglang/srt/multimodal/processors/base_processor.py,sha256=duDeCOOeXRt8lYi34fCe40Gezz0-Ao-rN9Zenx8p4c8,24430
|
709
|
+
sglang/srt/multimodal/processors/clip.py,sha256=5nXZuQYbyf-5mlqPwjhQrlWqxvswImWZQXivChsiHfQ,1057
|
710
|
+
sglang/srt/multimodal/processors/deepseek_vl_v2.py,sha256=Pymag9f0U5L_bBOTFs2q94BbuPJ-VwqSixs3meO0nsM,2569
|
711
|
+
sglang/srt/multimodal/processors/gemma3.py,sha256=7aD6cR60iSC_MqjzdCDMAgtrb_cmy9YJyqLgVRClBT8,1986
|
712
|
+
sglang/srt/multimodal/processors/gemma3n.py,sha256=zml4ovgDzgFZxupnsTfmGtT69ymY_eY0Zp3hR6TkBY0,3056
|
713
|
+
sglang/srt/multimodal/processors/internvl.py,sha256=p8dba1LBEceGObJvPdq3auDhlMKQIXyp_fXM5VMd4BI,9771
|
714
|
+
sglang/srt/multimodal/processors/janus_pro.py,sha256=_4ltWmdtFjbh1VCMRbcgxW61eWIABIzHG-YgwHWaYq8,1471
|
715
|
+
sglang/srt/multimodal/processors/kimi_vl.py,sha256=5i8KmGxnnDtQc7XqUBNyanAfGxhxj8iRFBFONHmpiFg,1565
|
716
|
+
sglang/srt/multimodal/processors/llava.py,sha256=1pb47tlbgH8IUgxTb2YFsK87-x16xmC6BZFHc5r2x9g,8097
|
717
|
+
sglang/srt/multimodal/processors/minicpm.py,sha256=ysJlUaxcBcWjKliz5VmXKVv0ec4QWRHXZk4ga-hXVf0,5354
|
718
|
+
sglang/srt/multimodal/processors/mlama.py,sha256=FgPm2JQzfPFDcGYDm0mqfDfO_eJKy-NiVgF-vId6w8Y,1233
|
719
|
+
sglang/srt/multimodal/processors/mllama4.py,sha256=1YGETKSzMZIa7BOwq3T9cbsYjUcW5sopcpc9JNJ000g,1911
|
720
|
+
sglang/srt/multimodal/processors/phi4mm.py,sha256=8GaUVpGucV4UKoa0XkxN0gDpMZax6UyCiRBX_QaJK78,3857
|
721
|
+
sglang/srt/multimodal/processors/pixtral.py,sha256=Lx5Z-9NkovLDTHlRBznHxGn4r2XhDz8am2XpOskOVQY,3203
|
722
|
+
sglang/srt/multimodal/processors/qwen_audio.py,sha256=jxtArfNuBH4q9LQVEydMDsj85avqBGNl-v1ZZTjC9E0,2367
|
723
|
+
sglang/srt/multimodal/processors/qwen_vl.py,sha256=tZOpz8dabyNvjS4hn0UxLf-EaEZH8kmHjyZaYRm9EZ8,10498
|
724
|
+
sglang/srt/multimodal/processors/vila.py,sha256=vWgV1lTdjiFiTR8w-7fC66-L_tpOOD59c-c9NljGelE,2192
|
716
725
|
sglang/srt/sampling/custom_logit_processor.py,sha256=AwODYVJdRkcQ8PGtJrhzKsqAgn8XZLQbAmR9fGiQzmc,1608
|
717
726
|
sglang/srt/sampling/sampling_batch_info.py,sha256=Duk4Fp99QZyOFld3i4AGwkW9FlULY86CNKv6v0_kA4w,14683
|
718
727
|
sglang/srt/sampling/sampling_params.py,sha256=HbVcCeSXgPW19MRB-v0FTG1D-zHDAY6-toxyndSl-zI,6462
|
@@ -727,11 +736,12 @@ sglang/srt/speculative/eagle_draft_extend_cuda_graph_runner.py,sha256=hLjaD66K3Z
|
|
727
736
|
sglang/srt/speculative/eagle_utils.py,sha256=x5MKA2GkecNAXE58KKhPJRy5KxCLhRkD-C_kVSZIyzc,46433
|
728
737
|
sglang/srt/speculative/eagle_worker.py,sha256=8yPQZxpBvcr--Ooo4nov3LqzkLRL-GOLJlwu91wMAmQ,38650
|
729
738
|
sglang/srt/speculative/spec_info.py,sha256=rhaKG0TzyF9XZYHEWp1jccwTBohSNsUDvxHFtAoOl18,709
|
739
|
+
sglang/srt/weight_sync/utils.py,sha256=jpmfXtiCvUYpwWh4bMgQgv0JSulPi8TwIz4aTsxi0XU,4148
|
730
740
|
sglang/test/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
731
741
|
sglang/test/few_shot_gsm8k.py,sha256=qnEejCyPHGEMBEiNc7T4-t9lvoo2DNN72RXw-ei_TnY,4300
|
732
742
|
sglang/test/few_shot_gsm8k_engine.py,sha256=Yf1Dg0Tk-tY4v1oj_UTxJ7950CWn6kRMbQKDjT2Orgo,3902
|
733
743
|
sglang/test/run_eval.py,sha256=K4Z3OdMPvLeuGJhWWTBD0F-MOUFeBYLvsPnDQ44bd18,4036
|
734
|
-
sglang/test/runners.py,sha256=
|
744
|
+
sglang/test/runners.py,sha256=q01InkXESqxZe19NeH5SzK11HuQG13gFEfm3N7XAIpU,33714
|
735
745
|
sglang/test/send_one.py,sha256=XNZdfZs21tXDBwrDj2pq46WQd5smiKoYETY8U09c1Z8,5079
|
736
746
|
sglang/test/simple_eval_common.py,sha256=OW4Z7O33QqDySRFuHIC4Ouidfup4eaOEuR9i7xJzkDY,12379
|
737
747
|
sglang/test/simple_eval_gpqa.py,sha256=8Xt9Bw05c7SZTYrCZgB68OZUqUbLo69ywiyx0bTvSUk,3220
|
@@ -753,13 +763,13 @@ sglang/test/test_layernorm.py,sha256=2GMWqqNDuGvSMSsEBF5eDCzwVSYA9E6hGhRo6s4ecKg
|
|
753
763
|
sglang/test/test_marlin_moe.py,sha256=PITMGcGF4ci2csXJejdLSNuxpURnFmcflsipAZsGakU,7991
|
754
764
|
sglang/test/test_marlin_utils.py,sha256=gFMJwxbfEEJDeHI-HU5FDF9FFqqcM-yahK0TWyVIVgQ,5171
|
755
765
|
sglang/test/test_programs.py,sha256=DJIbTChloPwaDiEWHQoSTuKv3BGx0-K8Y5e1mDDTACM,18910
|
756
|
-
sglang/test/test_utils.py,sha256=
|
766
|
+
sglang/test/test_utils.py,sha256=hnT1lvTERIpmTapJKttFPfZCqHjNsTqiWNqpn5r-6CU,39454
|
757
767
|
sglang/test/attention/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
758
768
|
sglang/test/attention/test_flashattn_backend.py,sha256=_rTG849FwQdVTyGKkqhczaOqngBmRWXFmkl5NnuK1GM,13914
|
759
769
|
sglang/test/attention/test_flashattn_mla_backend.py,sha256=g4O50WblTpM7_Gq2b76k0i25_z01BOUBQ4i6PmyxpO4,10774
|
760
770
|
sglang/test/attention/test_prefix_chunk_info.py,sha256=hpoDe2wfSa6RlUbfyri_c0iyBTb35UXGL9I2Xh6jamM,7772
|
761
|
-
sglang-0.4.9.
|
762
|
-
sglang-0.4.9.
|
763
|
-
sglang-0.4.9.
|
764
|
-
sglang-0.4.9.
|
765
|
-
sglang-0.4.9.
|
771
|
+
sglang-0.4.9.post5.dist-info/licenses/LICENSE,sha256=FJXh51fvTQklojUFY89XVLsjxRcBqOxPs8XNy-2uZ0c,11346
|
772
|
+
sglang-0.4.9.post5.dist-info/METADATA,sha256=jv_hoxV9ahzQ3tRZRibHpMxmYK6-lCJUDCd09LK4dPU,27348
|
773
|
+
sglang-0.4.9.post5.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
774
|
+
sglang-0.4.9.post5.dist-info/top_level.txt,sha256=yxhh3pYQkcnA7v3Bg889C2jZhvtJdEincysO7PEB09M,7
|
775
|
+
sglang-0.4.9.post5.dist-info/RECORD,,
|