guidellm 0.3.0rc20250418__tar.gz → 0.3.0rc20250421__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of guidellm might be problematic. Click here for more details.
- {guidellm-0.3.0rc20250418/src/guidellm.egg-info → guidellm-0.3.0rc20250421}/PKG-INFO +2 -2
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/README.md +1 -1
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/pyproject.toml +1 -1
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/backend/openai.py +8 -1
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/config.py +3 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/dataset/file.py +9 -7
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/request/loader.py +4 -1
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421/src/guidellm.egg-info}/PKG-INFO +2 -2
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/LICENSE +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/MANIFEST.in +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/setup.cfg +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/__init__.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/__main__.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/backend/__init__.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/backend/backend.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/backend/response.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/benchmark/__init__.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/benchmark/aggregator.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/benchmark/benchmark.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/benchmark/benchmarker.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/benchmark/entrypoints.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/benchmark/output.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/benchmark/profile.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/benchmark/progress.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/data/__init__.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/data/prideandprejudice.txt.gz +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/dataset/__init__.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/dataset/creator.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/dataset/entrypoints.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/dataset/hf_datasets.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/dataset/in_memory.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/dataset/synthetic.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/logger.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/objects/__init__.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/objects/pydantic.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/objects/statistics.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/request/__init__.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/request/request.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/scheduler/__init__.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/scheduler/result.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/scheduler/scheduler.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/scheduler/strategy.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/scheduler/types.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/scheduler/worker.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/utils/__init__.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/utils/colors.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/utils/hf_transformers.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/utils/random.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/utils/text.py +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm.egg-info/SOURCES.txt +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm.egg-info/dependency_links.txt +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm.egg-info/entry_points.txt +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm.egg-info/requires.txt +0 -0
- {guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm.egg-info/top_level.txt +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: guidellm
|
|
3
|
-
Version: 0.3.0rc20250418
|
|
3
|
+
Version: 0.3.0rc20250421
|
|
4
4
|
Summary: Guidance platform for deploying and managing large language models.
|
|
5
5
|
Author: Neuralmagic, Inc.
|
|
6
6
|
License: Apache License
|
|
@@ -259,7 +259,7 @@ Dynamic: license-file
|
|
|
259
259
|
Scale Efficiently: Evaluate and Optimize Your LLM Deployments for Real-World Inference
|
|
260
260
|
</h3>
|
|
261
261
|
|
|
262
|
-
[](https://github.com/neuralmagic/guidellm/releases) [](https://github.com/neuralmagic/guidellm/tree/main/docs) [](https://github.com/neuralmagic/guidellm/blob/main/LICENSE) [](https://pypi.python.org/pypi/guidellm) [](https://github.com/neuralmagic/guidellm/releases) [](https://github.com/neuralmagic/guidellm/tree/main/docs) [](https://github.com/neuralmagic/guidellm/blob/main/LICENSE) [](https://pypi.python.org/pypi/guidellm) [](https://pypi.python.org/pypi/guidellm) [](https://github.com/neuralmagic/guidellm/actions/workflows/nightly.yml)
|
|
263
263
|
|
|
264
264
|
## Overview
|
|
265
265
|
|
|
@@ -9,7 +9,7 @@
|
|
|
9
9
|
Scale Efficiently: Evaluate and Optimize Your LLM Deployments for Real-World Inference
|
|
10
10
|
</h3>
|
|
11
11
|
|
|
12
|
-
[](https://github.com/neuralmagic/guidellm/releases) [](https://github.com/neuralmagic/guidellm/tree/main/docs) [](https://github.com/neuralmagic/guidellm/blob/main/LICENSE) [](https://pypi.python.org/pypi/guidellm) [](https://github.com/neuralmagic/guidellm/releases) [](https://github.com/neuralmagic/guidellm/tree/main/docs) [](https://github.com/neuralmagic/guidellm/blob/main/LICENSE) [](https://pypi.python.org/pypi/guidellm) [](https://pypi.python.org/pypi/guidellm) [](https://github.com/neuralmagic/guidellm/actions/workflows/nightly.yml)
|
|
13
13
|
|
|
14
14
|
## Overview
|
|
15
15
|
|
|
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
|
|
|
4
4
|
|
|
5
5
|
[project]
|
|
6
6
|
name = "guidellm"
|
|
7
|
-
version = "0.3.0.rc20250418"
|
|
7
|
+
version = "0.3.0.rc20250421"
|
|
8
8
|
description = "Guidance platform for deploying and managing large language models."
|
|
9
9
|
requires-python = ">=3.9.0,<4.0"
|
|
10
10
|
dependencies = [ "click", "datasets", "ftfy>=6.0.0", "httpx[http2]<1.0.0", "loguru", "numpy", "pillow", "protobuf", "pydantic>=2.0.0", "pydantic-settings>=2.0.0", "pyyaml>=6.0.0", "requests", "rich", "transformers",]
|
|
@@ -145,7 +145,7 @@ class OpenAIHTTPBackend(Backend):
|
|
|
145
145
|
elif self.model not in models:
|
|
146
146
|
raise ValueError(
|
|
147
147
|
f"Model {self.model} not found in available models:"
|
|
148
|
-
"{models} for target: {self.target}"
|
|
148
|
+
f"{models} for target: {self.target}"
|
|
149
149
|
)
|
|
150
150
|
|
|
151
151
|
async def prepare_multiprocessing(self):
|
|
@@ -202,6 +202,13 @@ class OpenAIHTTPBackend(Backend):
|
|
|
202
202
|
and a ResponseSummary for the final response.
|
|
203
203
|
"""
|
|
204
204
|
logger.debug("{} invocation with args: {}", self.__class__.__name__, locals())
|
|
205
|
+
|
|
206
|
+
if isinstance(prompt, list):
|
|
207
|
+
raise ValueError(
|
|
208
|
+
"List prompts (batching) is currently not supported for "
|
|
209
|
+
f"text_completions OpenAI pathways. Received: {prompt}"
|
|
210
|
+
)
|
|
211
|
+
|
|
205
212
|
headers = self._headers()
|
|
206
213
|
payload = self._completions_payload(
|
|
207
214
|
orig_kwargs=kwargs,
|
|
@@ -134,6 +134,9 @@ class Settings(BaseSettings):
|
|
|
134
134
|
Literal["request", "response", "local"]
|
|
135
135
|
] = "response"
|
|
136
136
|
preferred_backend: Literal["openai"] = "openai"
|
|
137
|
+
preferred_route: Literal["text_completions", "chat_completions"] = (
|
|
138
|
+
"text_completions"
|
|
139
|
+
)
|
|
137
140
|
openai: OpenAISettings = OpenAISettings()
|
|
138
141
|
|
|
139
142
|
# Output settings
|
|
@@ -71,19 +71,21 @@ class FileDatasetCreator(DatasetCreator):
|
|
|
71
71
|
|
|
72
72
|
dataset = Dataset.from_dict({"text": items}, **(data_args or {}))
|
|
73
73
|
elif path.suffix.lower() == ".csv":
|
|
74
|
-
dataset = load_dataset("csv", data_files=path, **(data_args or {}))
|
|
74
|
+
dataset = load_dataset("csv", data_files=str(path), **(data_args or {}))
|
|
75
75
|
elif path.suffix.lower() in {".json", ".jsonl"}:
|
|
76
|
-
dataset = load_dataset("json", data_files=path, **(data_args or {}))
|
|
76
|
+
dataset = load_dataset("json", data_files=str(path), **(data_args or {}))
|
|
77
77
|
elif path.suffix.lower() == ".parquet":
|
|
78
|
-
dataset = load_dataset("parquet", data_files=path, **(data_args or {}))
|
|
78
|
+
dataset = load_dataset("parquet", data_files=str(path), **(data_args or {}))
|
|
79
79
|
elif path.suffix.lower() == ".arrow":
|
|
80
|
-
dataset = load_dataset("arrow", data_files=path, **(data_args or {}))
|
|
80
|
+
dataset = load_dataset("arrow", data_files=str(path), **(data_args or {}))
|
|
81
81
|
elif path.suffix.lower() == ".hdf5":
|
|
82
|
-
dataset = Dataset.from_pandas(pd.read_hdf(path), **(data_args or {}))
|
|
82
|
+
dataset = Dataset.from_pandas(pd.read_hdf(str(path)), **(data_args or {}))
|
|
83
83
|
elif path.suffix.lower() == ".db":
|
|
84
|
-
dataset = Dataset.from_sql(con=path, **(data_args or {}))
|
|
84
|
+
dataset = Dataset.from_sql(con=str(path), **(data_args or {}))
|
|
85
85
|
elif path.suffix.lower() == ".tar":
|
|
86
|
-
dataset = load_dataset("webdataset", data_files=path, **(data_args or {}))
|
|
86
|
+
dataset = load_dataset(
|
|
87
|
+
"webdataset", data_files=str(path), **(data_args or {})
|
|
88
|
+
)
|
|
87
89
|
else:
|
|
88
90
|
raise ValueError(f"Unsupported file type: {path.suffix} given for {path}. ")
|
|
89
91
|
|
|
@@ -11,6 +11,7 @@ from typing import (
|
|
|
11
11
|
from datasets import Dataset, DatasetDict, IterableDataset, IterableDatasetDict
|
|
12
12
|
from transformers import PreTrainedTokenizerBase # type: ignore[import]
|
|
13
13
|
|
|
14
|
+
from guidellm.config import settings
|
|
14
15
|
from guidellm.dataset import ColumnInputTypes, load_dataset
|
|
15
16
|
from guidellm.objects import StandardBaseModel
|
|
16
17
|
from guidellm.request.request import GenerationRequest
|
|
@@ -61,6 +62,8 @@ class GenerativeRequestLoader(RequestLoader):
|
|
|
61
62
|
"content",
|
|
62
63
|
"conversation",
|
|
63
64
|
"conversations",
|
|
65
|
+
"turn",
|
|
66
|
+
"turns",
|
|
64
67
|
"text",
|
|
65
68
|
]
|
|
66
69
|
|
|
@@ -270,7 +273,7 @@ class GenerativeRequestLoader(RequestLoader):
|
|
|
270
273
|
)
|
|
271
274
|
|
|
272
275
|
return GenerationRequest(
|
|
273
|
-
request_type="text_completions",
|
|
276
|
+
request_type=settings.preferred_route,
|
|
274
277
|
content=item[self.column_mappings["prompt_column"]],
|
|
275
278
|
stats=(
|
|
276
279
|
{"prompt_tokens": prompt_tokens} if prompt_tokens is not None else {}
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: guidellm
|
|
3
|
-
Version: 0.3.0rc20250418
|
|
3
|
+
Version: 0.3.0rc20250421
|
|
4
4
|
Summary: Guidance platform for deploying and managing large language models.
|
|
5
5
|
Author: Neuralmagic, Inc.
|
|
6
6
|
License: Apache License
|
|
@@ -259,7 +259,7 @@ Dynamic: license-file
|
|
|
259
259
|
Scale Efficiently: Evaluate and Optimize Your LLM Deployments for Real-World Inference
|
|
260
260
|
</h3>
|
|
261
261
|
|
|
262
|
-
[](https://github.com/neuralmagic/guidellm/releases) [](https://github.com/neuralmagic/guidellm/tree/main/docs) [](https://github.com/neuralmagic/guidellm/blob/main/LICENSE) [](https://pypi.python.org/pypi/guidellm) [](https://github.com/neuralmagic/guidellm/releases) [](https://github.com/neuralmagic/guidellm/tree/main/docs) [](https://github.com/neuralmagic/guidellm/blob/main/LICENSE) [](https://pypi.python.org/pypi/guidellm) [](https://pypi.python.org/pypi/guidellm) [](https://github.com/neuralmagic/guidellm/actions/workflows/nightly.yml)
|
|
263
263
|
|
|
264
264
|
## Overview
|
|
265
265
|
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm/data/prideandprejudice.txt.gz
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm.egg-info/dependency_links.txt
RENAMED
|
File without changes
|
{guidellm-0.3.0rc20250418 → guidellm-0.3.0rc20250421}/src/guidellm.egg-info/entry_points.txt
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|