PyPI - guidellm - Versions diffs - 0.4.0a18__py3-none-any.whl → 0.4.0a155__py3-none-any.whl - Mend

guidellm-0.4.0a18-py3-none-any.whl → guidellm-0.4.0a155-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of guidellm might be problematic. Click here for more details.

Files changed (116)

guidellm/__init__.py +5 -2
guidellm/__main__.py +451 -252
guidellm/backends/__init__.py +33 -0
guidellm/backends/backend.py +110 -0
guidellm/backends/openai.py +355 -0
guidellm/backends/response_handlers.py +455 -0
guidellm/benchmark/__init__.py +53 -39
guidellm/benchmark/benchmarker.py +148 -317
guidellm/benchmark/entrypoints.py +466 -128
guidellm/benchmark/output.py +517 -771
guidellm/benchmark/profile.py +580 -280
guidellm/benchmark/progress.py +568 -549
guidellm/benchmark/scenarios/__init__.py +40 -0
guidellm/benchmark/scenarios/chat.json +6 -0
guidellm/benchmark/scenarios/rag.json +6 -0
guidellm/benchmark/schemas.py +2085 -0
guidellm/data/__init__.py +28 -4
guidellm/data/collators.py +16 -0
guidellm/data/deserializers/__init__.py +53 -0
guidellm/data/deserializers/deserializer.py +109 -0
guidellm/data/deserializers/file.py +222 -0
guidellm/data/deserializers/huggingface.py +94 -0
guidellm/data/deserializers/memory.py +192 -0
guidellm/data/deserializers/synthetic.py +346 -0
guidellm/data/loaders.py +145 -0
guidellm/data/preprocessors/__init__.py +25 -0
guidellm/data/preprocessors/formatters.py +412 -0
guidellm/data/preprocessors/mappers.py +198 -0
guidellm/data/preprocessors/preprocessor.py +29 -0
guidellm/data/processor.py +30 -0
guidellm/data/schemas.py +13 -0
guidellm/data/utils/__init__.py +10 -0
guidellm/data/utils/dataset.py +94 -0
guidellm/data/utils/functions.py +18 -0
guidellm/extras/__init__.py +4 -0
guidellm/extras/audio.py +215 -0
guidellm/extras/vision.py +242 -0
guidellm/logger.py +2 -2
guidellm/mock_server/__init__.py +8 -0
guidellm/mock_server/config.py +84 -0
guidellm/mock_server/handlers/__init__.py +17 -0
guidellm/mock_server/handlers/chat_completions.py +280 -0
guidellm/mock_server/handlers/completions.py +280 -0
guidellm/mock_server/handlers/tokenizer.py +142 -0
guidellm/mock_server/models.py +510 -0
guidellm/mock_server/server.py +168 -0
guidellm/mock_server/utils.py +302 -0
guidellm/preprocess/dataset.py +23 -26
guidellm/presentation/builder.py +2 -2
guidellm/presentation/data_models.py +25 -21
guidellm/presentation/injector.py +2 -3
guidellm/scheduler/__init__.py +65 -26
guidellm/scheduler/constraints.py +1035 -0
guidellm/scheduler/environments.py +252 -0
guidellm/scheduler/scheduler.py +140 -368
guidellm/scheduler/schemas.py +272 -0
guidellm/scheduler/strategies.py +519 -0
guidellm/scheduler/worker.py +391 -420
guidellm/scheduler/worker_group.py +707 -0
guidellm/schemas/__init__.py +31 -0
guidellm/schemas/info.py +159 -0
guidellm/schemas/request.py +216 -0
guidellm/schemas/response.py +119 -0
guidellm/schemas/stats.py +228 -0
guidellm/{config.py → settings.py} +32 -21
guidellm/utils/__init__.py +95 -8
guidellm/utils/auto_importer.py +98 -0
guidellm/utils/cli.py +46 -2
guidellm/utils/console.py +183 -0
guidellm/utils/encoding.py +778 -0
guidellm/utils/functions.py +134 -0
guidellm/utils/hf_datasets.py +1 -2
guidellm/utils/hf_transformers.py +4 -4
guidellm/utils/imports.py +9 -0
guidellm/utils/messaging.py +1118 -0
guidellm/utils/mixins.py +115 -0
guidellm/utils/pydantic_utils.py +411 -0
guidellm/utils/random.py +3 -4
guidellm/utils/registry.py +220 -0
guidellm/utils/singleton.py +133 -0
guidellm/{objects → utils}/statistics.py +341 -247
guidellm/utils/synchronous.py +159 -0
guidellm/utils/text.py +163 -50
guidellm/utils/typing.py +41 -0
guidellm/version.py +1 -1
{guidellm-0.4.0a18.dist-info → guidellm-0.4.0a155.dist-info}/METADATA +33 -10
guidellm-0.4.0a155.dist-info/RECORD +96 -0
guidellm/backend/__init__.py +0 -23
guidellm/backend/backend.py +0 -259
guidellm/backend/openai.py +0 -705
guidellm/backend/response.py +0 -136
guidellm/benchmark/aggregator.py +0 -760
guidellm/benchmark/benchmark.py +0 -837
guidellm/benchmark/scenario.py +0 -104
guidellm/data/prideandprejudice.txt.gz +0 -0
guidellm/dataset/__init__.py +0 -22
guidellm/dataset/creator.py +0 -213
guidellm/dataset/entrypoints.py +0 -42
guidellm/dataset/file.py +0 -92
guidellm/dataset/hf_datasets.py +0 -62
guidellm/dataset/in_memory.py +0 -132
guidellm/dataset/synthetic.py +0 -287
guidellm/objects/__init__.py +0 -18
guidellm/objects/pydantic.py +0 -89
guidellm/request/__init__.py +0 -18
guidellm/request/loader.py +0 -284
guidellm/request/request.py +0 -79
guidellm/request/types.py +0 -10
guidellm/scheduler/queues.py +0 -25
guidellm/scheduler/result.py +0 -155
guidellm/scheduler/strategy.py +0 -495
guidellm-0.4.0a18.dist-info/RECORD +0 -62
{guidellm-0.4.0a18.dist-info → guidellm-0.4.0a155.dist-info}/WHEEL +0 -0
{guidellm-0.4.0a18.dist-info → guidellm-0.4.0a155.dist-info}/entry_points.txt +0 -0
{guidellm-0.4.0a18.dist-info → guidellm-0.4.0a155.dist-info}/licenses/LICENSE +0 -0
{guidellm-0.4.0a18.dist-info → guidellm-0.4.0a155.dist-info}/top_level.txt +0 -0

guidellm/benchmark/profile.py CHANGED

@@ -1,20 +1,46 @@
-from collections.abc import Sequence
-from typing import Literal, Optional, Union
+"""
+Profile configurations for orchestrating multi-strategy benchmark execution.
+Provides configurable abstractions for coordinating sequential execution of
+scheduling strategies during benchmarking workflows. Profiles automatically
+generate strategies based on configuration parameters, manage runtime
+constraints, and track completion state across the execution sequence.
+"""
+from __future__ import annotations
+from abc import ABC, abstractmethod
+from collections.abc import Generator
+from typing import TYPE_CHECKING, Any, ClassVar, Literal
 import numpy as np
-from pydantic import Field, computed_field
+from pydantic import (
+    Field,
+    NonNegativeFloat,
+    PositiveFloat,
+    PositiveInt,
+    computed_field,
+    field_serializer,
+    field_validator,
+)
-from guidellm.config import settings
-from guidellm.objects import StandardBaseModel
+from guidellm import settings
 from guidellm.scheduler import (
     AsyncConstantStrategy,
     AsyncPoissonStrategy,
     ConcurrentStrategy,
+    Constraint,
+    ConstraintInitializer,
+    ConstraintsInitializerFactory,
     SchedulingStrategy,
     StrategyType,
     SynchronousStrategy,
     ThroughputStrategy,
 )
+from guidellm.utils import PydanticClassRegistryMixin
+if TYPE_CHECKING:
+    from guidellm.benchmark.schemas import Benchmark
 __all__ = [
     "AsyncProfile",
@@ -24,386 +50,660 @@ __all__ = [
     "SweepProfile",
     "SynchronousProfile",
     "ThroughputProfile",
-    "create_profile",
 ]
 ProfileType = Literal["synchronous", "concurrent", "throughput", "async", "sweep"]
-class Profile(StandardBaseModel):
+class Profile(
+    PydanticClassRegistryMixin["type[Profile]"],
+    ABC,
+):
+    """
+    Abstract base for coordinating multi-strategy benchmark execution.
+    Manages sequential execution of scheduling strategies with automatic strategy
+    generation, constraint management, and completion tracking. Subclasses define
+    specific execution patterns like synchronous, concurrent, throughput-focused,
+    rate-based async, or adaptive sweep profiles.
+    :cvar schema_discriminator: Field name used for polymorphic deserialization
+    """
+    schema_discriminator: ClassVar[str] = "type_"
+    @classmethod
+    def __pydantic_schema_base_type__(cls) -> type[Profile]:
+        if cls.__name__ == "Profile":
+            return cls
+        return Profile
+    @classmethod
+    def create(
+        cls,
+        rate_type: str,
+        rate: list[float] | None,
+        random_seed: int = 42,
+        **kwargs: Any,
+    ) -> Profile:
+        """
+        Factory method to create a profile instance based on type.
+        :param rate_type: Profile type identifier to instantiate
+        :param rate: Rate configuration for the profile strategy
+        :param random_seed: Seed for stochastic strategy reproducibility
+        :param kwargs: Additional profile-specific configuration parameters
+        :return: Configured profile instance for the specified type
+        :raises ValueError: If rate_type is not registered
+        """
+        profile_class: type[Profile] = cls.get_registered_object(rate_type)
+        resolved_kwargs = profile_class.resolve_args(
+            rate_type=rate_type, rate=rate, random_seed=random_seed, **kwargs
+        )
+        return profile_class(**resolved_kwargs)
+    @classmethod
+    @abstractmethod
+    def resolve_args(
+        cls,
+        rate_type: str,
+        rate: list[float] | None,
+        random_seed: int,
+        **kwargs: Any,
+    ) -> dict[str, Any]:
+        """
+        Resolve and validate arguments for profile construction.
+        :param rate_type: Profile type identifier
+        :param rate: Rate configuration parameter
+        :param random_seed: Seed for stochastic strategies
+        :param kwargs: Additional arguments to resolve and validate
+        :return: Resolved arguments dictionary for profile initialization
+        """
+        ...
     type_: Literal["profile"] = Field(
-        description="The type of benchmarking profile to use.",
-    )
-    completed_strategies: int = Field(
-        default=0,
-        description="The number of scheduling strategies generated so far.",
+        description="Profile type discriminator for polymorphic serialization",
     )
-    measured_rates: list[float] = Field(
+    completed_strategies: list[SchedulingStrategy] = Field(
         default_factory=list,
-        description=("The average rates measured for the strategies that have run."),
+        description="Strategies that have completed execution in this profile",
     )
-    measured_concurrencies: list[float] = Field(
-        default_factory=list,
-        description=(
-            "The average concurrency measured for the strategies that have run."
-        ),
+    constraints: dict[str, Any | dict[str, Any] | ConstraintInitializer] | None = Field(
+        default=None,
+        description="Runtime constraints applied to strategy execution",
     )
-    def completed_strategy(self, average_rate: float, average_concurrency: float):
-        self.measured_rates.append(average_rate)
-        self.measured_concurrencies.append(average_concurrency)
-        self.completed_strategies += 1
     @computed_field  # type: ignore[misc]
     @property
     def strategy_types(self) -> list[StrategyType]:
-        return []
+        """
+        :return: Strategy types executed or expected to execute in this profile
+        """
+        return [strat.type_ for strat in self.completed_strategies]
+    def strategies_generator(
+        self,
+    ) -> Generator[
+        tuple[
+            SchedulingStrategy | None,
+            dict[str, Any | dict[str, Any] | Constraint] | None,
+        ],
+        Benchmark | None,
+        None,
+    ]:
+        """
+        Generate strategies and constraints for sequential execution.
+        :return: Generator yielding (strategy, constraints) tuples and receiving
+            benchmark results after each execution
+        """
+        prev_strategy: SchedulingStrategy | None = None
+        prev_benchmark: Benchmark | None = None
+        while (
+            strategy := self.next_strategy(prev_strategy, prev_benchmark)
+        ) is not None:
+            constraints = self.next_strategy_constraints(
+                strategy, prev_strategy, prev_benchmark
+            )
+            prev_benchmark = yield (
+                strategy,
+                constraints,
+            )
+            prev_strategy = strategy
+            self.completed_strategies.append(prev_strategy)
+    @abstractmethod
+    def next_strategy(
+        self,
+        prev_strategy: SchedulingStrategy | None,
+        prev_benchmark: Benchmark | None,
+    ) -> SchedulingStrategy | None:
+        """
+        Generate the next strategy in the profile execution sequence.
+        :param prev_strategy: Previously completed strategy instance
+        :param prev_benchmark: Benchmark results from previous strategy execution
+        :return: Next strategy to execute, or None if profile complete
+        """
+        ...
+    def next_strategy_constraints(
+        self,
+        next_strategy: SchedulingStrategy | None,
+        prev_strategy: SchedulingStrategy | None,
+        prev_benchmark: Benchmark | None,
+    ) -> dict[str, Any | dict[str, Any] | Constraint] | None:
+        """
+        Generate constraints for the next strategy execution.
+        :param next_strategy: Strategy to be executed next
+        :param prev_strategy: Previously completed strategy instance
+        :param prev_benchmark: Benchmark results from previous strategy execution
+        :return: Constraints dictionary for next strategy, or None
+        """
+        _ = (prev_strategy, prev_benchmark)  # unused
+        return (
+            ConstraintsInitializerFactory.resolve(self.constraints)
+            if next_strategy and self.constraints
+            else None
+        )
+    @field_validator("constraints", mode="before")
+    @classmethod
+    def _constraints_validator(
+        cls, value: Any
+    ) -> dict[str, Any | dict[str, Any] | ConstraintInitializer] | None:
+        if value is None:
+            return None
+        if not isinstance(value, dict):
+            raise ValueError("Constraints must be a dictionary")
+        return {
+            key: (
+                val
+                if not isinstance(val, ConstraintInitializer)
+                else ConstraintsInitializerFactory.deserialize(initializer_dict=val)
+            )
+            for key, val in value.items()
+        }
+    @field_serializer
+    def _constraints_serializer(
+        self,
+        constraints: dict[str, Any | dict[str, Any] | ConstraintInitializer] | None,
+    ) -> dict[str, Any | dict[str, Any]] | None:
+        if constraints is None:
+            return None
-    def next_strategy(self) -> Optional[SchedulingStrategy]:
-        return None
+        return {
+            key: (
+                val
+                if not isinstance(val, ConstraintInitializer)
+                else ConstraintsInitializerFactory.serialize(initializer=val)
+            )
+            for key, val in constraints.items()
+        }
+@Profile.register("synchronous")
 class SynchronousProfile(Profile):
+    """Single synchronous strategy execution profile."""
     type_: Literal["synchronous"] = "synchronous"  # type: ignore[assignment]
+    @classmethod
+    def resolve_args(
+        cls,
+        rate_type: str,
+        rate: list[float] | None,
+        random_seed: int,
+        **kwargs: Any,
+    ) -> dict[str, Any]:
+        """
+        Resolve arguments for synchronous profile construction.
+        :param rate_type: Profile type identifier (ignored)
+        :param rate: Rate parameter (must be None)
+        :param random_seed: Random seed (ignored)
+        :param kwargs: Additional arguments passed through unchanged
+        :return: Resolved arguments dictionary
+        :raises ValueError: If rate is not None
+        """
+        _ = (rate_type, random_seed)  # unused
+        if rate is not None:
+            raise ValueError("SynchronousProfile does not accept a rate parameter")
+        return kwargs
     @property
     def strategy_types(self) -> list[StrategyType]:
+        """
+        :return: Single synchronous strategy type
+        """
         return [self.type_]
-    def next_strategy(self) -> Optional[SchedulingStrategy]:
-        if self.completed_strategies >= 1:
+    def next_strategy(
+        self,
+        prev_strategy: SchedulingStrategy | None,
+        prev_benchmark: Benchmark | None,
+    ) -> SynchronousStrategy | None:
+        """
+        Generate synchronous strategy or None if already completed.
+        :param prev_strategy: Previously completed strategy (unused)
+        :param prev_benchmark: Benchmark results from previous execution (unused)
+        :return: SynchronousStrategy for first execution, None afterward
+        """
+        _ = (prev_strategy, prev_benchmark)  # unused
+        if len(self.completed_strategies) >= 1:
             return None
         return SynchronousStrategy()
-    @staticmethod
-    def from_standard_args(
-        rate_type: Union[StrategyType, ProfileType],
-        rate: Optional[Union[float, Sequence[float]]],
-        **kwargs,
-    ) -> "SynchronousProfile":
-        if rate_type != "synchronous":
-            raise ValueError("Rate type must be 'synchronous' for synchronous profile.")
-        if rate is not None:
-            raise ValueError(
-                "Rate does not apply to synchronous profile, it must be set to None."
-            )
-        if kwargs:
-            raise ValueError(
-                "No additional arguments are allowed for synchronous profile."
-            )
-        return SynchronousProfile()
+@Profile.register("concurrent")
 class ConcurrentProfile(Profile):
+    """Fixed-concurrency strategy execution profile with configurable stream counts."""
     type_: Literal["concurrent"] = "concurrent"  # type: ignore[assignment]
-    streams: Union[int, Sequence[int]] = Field(
-        description="The number of concurrent streams to use.",
+    streams: list[PositiveInt] = Field(
+        description="Concurrent stream counts for request scheduling",
     )
+    startup_duration: NonNegativeFloat = Field(
+        default=0.0,
+        description=(
+            "Duration in seconds for distributing startup requests "
+            "before completion-based timing"
+        ),
+    )
+    @classmethod
+    def resolve_args(
+        cls,
+        rate_type: str,
+        rate: list[float] | None,
+        random_seed: int,
+        **kwargs: Any,
+    ) -> dict[str, Any]:
+        """
+        Resolve arguments for concurrent profile construction.
+        :param rate_type: Profile type identifier (ignored)
+        :param rate: Rate parameter remapped to streams
+        :param random_seed: Random seed (ignored)
+        :param kwargs: Additional arguments passed through unchanged
+        :return: Resolved arguments dictionary
+        :raises ValueError: If rate is None
+        """
+        _ = (rate_type, random_seed)  # unused
+        rate = rate if isinstance(rate, list) or rate is None else [rate]
+        kwargs["streams"] = [int(stream) for stream in rate] if rate else None
+        return kwargs
     @property
     def strategy_types(self) -> list[StrategyType]:
-        num_strategies = len(self.streams) if isinstance(self.streams, Sequence) else 1
-        return [self.type_] * num_strategies
-    def next_strategy(self) -> Optional[SchedulingStrategy]:
-        streams = self.streams if isinstance(self.streams, Sequence) else [self.streams]
-        if self.completed_strategies >= len(streams):
+        """
+        :return: Concurrent strategy types for each configured stream count
+        """
+        return [self.type_] * len(self.streams)
+    def next_strategy(
+        self,
+        prev_strategy: SchedulingStrategy | None,
+        prev_benchmark: Benchmark | None,
+    ) -> ConcurrentStrategy | None:
+        """
+        Generate concurrent strategy for the next stream count.
+        :param prev_strategy: Previously completed strategy (unused)
+        :param prev_benchmark: Benchmark results from previous execution (unused)
+        :return: ConcurrentStrategy with next stream count, or None if complete
+        """
+        _ = (prev_strategy, prev_benchmark)  # unused
+        if len(self.completed_strategies) >= len(self.streams):
             return None
         return ConcurrentStrategy(
-            streams=streams[self.completed_strategies],
+            streams=self.streams[len(self.completed_strategies)],
+            startup_duration=self.startup_duration,
         )
-    @staticmethod
-    def from_standard_args(
-        rate_type: Union[StrategyType, ProfileType],
-        rate: Optional[Union[float, Sequence[float]]],
-        **kwargs,
-    ) -> "ConcurrentProfile":
-        if rate_type != "concurrent":
-            raise ValueError("Rate type must be 'concurrent' for concurrent profile.")
-        if not rate:
-            raise ValueError("Rate (streams) must be provided for concurrent profile.")
-        if not isinstance(rate, Sequence):
-            rate = [rate]
-        if not all(stream.is_integer() and stream > 0 for stream in rate):
-            raise ValueError(
-                f"All rate values (streams) must be positive integers, received {rate}"
-            )
-        if kwargs:
-            raise ValueError(
-                "No additional arguments are allowed for concurrent profile."
-            )
-        return ConcurrentProfile(streams=[int(rat) for rat in rate])
+@Profile.register("throughput")
 class ThroughputProfile(Profile):
+    """
+    Maximum throughput strategy execution profile with optional concurrency limits.
+    """
     type_: Literal["throughput"] = "throughput"  # type: ignore[assignment]
-    max_concurrency: Optional[int] = Field(
+    max_concurrency: PositiveInt | None = Field(
         default=None,
-        description="The maximum number of concurrent requests that can be scheduled.",
+        description="Maximum concurrent requests to schedule",
     )
+    startup_duration: NonNegativeFloat = Field(
+        default=0.0,
+        description=(
+            "Duration in seconds for distributing startup requests "
+            "before full throughput scheduling"
+        ),
+    )
+    @classmethod
+    def resolve_args(
+        cls,
+        rate_type: str,
+        rate: list[float] | None,
+        random_seed: int,
+        **kwargs: Any,
+    ) -> dict[str, Any]:
+        """
+        Resolve arguments for throughput profile construction.
+        :param rate_type: Profile type identifier (ignored)
+        :param rate: Rate parameter remapped to max_concurrency
+        :param random_seed: Random seed (ignored)
+        :param kwargs: Additional arguments passed through unchanged
+        :return: Resolved arguments dictionary
+        """
+        _ = (rate_type, random_seed)  # unused
+        # Remap rate to max_concurrency, strip out random_seed
+        kwargs.pop("random_seed", None)
+        if rate is not None and len(rate) > 0:
+            kwargs["max_concurrency"] = rate[0]
+        return kwargs
     @property
     def strategy_types(self) -> list[StrategyType]:
+        """
+        :return: Single throughput strategy type
+        """
         return [self.type_]
-    def next_strategy(self) -> Optional[SchedulingStrategy]:
-        if self.completed_strategies >= 1:
+    def next_strategy(
+        self,
+        prev_strategy: SchedulingStrategy | None,
+        prev_benchmark: Benchmark | None,
+    ) -> ThroughputStrategy | None:
+        """
+        Generate throughput strategy or None if already completed.
+        :param prev_strategy: Previously completed strategy (unused)
+        :param prev_benchmark: Benchmark results from previous execution (unused)
+        :return: ThroughputStrategy for first execution, None afterward
+        """
+        _ = (prev_strategy, prev_benchmark)  # unused
+        if len(self.completed_strategies) >= 1:
             return None
         return ThroughputStrategy(
             max_concurrency=self.max_concurrency,
+            startup_duration=self.startup_duration,
         )
-    @staticmethod
-    def from_standard_args(
-        rate_type: Union[StrategyType, ProfileType],
-        rate: Optional[Union[float, Sequence[float]]],
-        **kwargs,
-    ) -> "ThroughputProfile":
-        if rate_type != "throughput":
-            raise ValueError("Rate type must be 'throughput' for throughput profile.")
-        if rate is not None:
-            raise ValueError(
-                "Rate does not apply to throughput profile, it must be set to None."
-            )
-        return ThroughputProfile(**kwargs)
+@Profile.register(["async", "constant", "poisson"])
+class AsyncProfile(Profile):
+    """Rate-based asynchronous strategy execution profile with configurable patterns."""
-class AsyncProfile(ThroughputProfile):
-    type_: Literal["async"] = "async"  # type: ignore[assignment]
+    type_: Literal["async", "constant", "poisson"] = "async"  # type: ignore[assignment]
     strategy_type: Literal["constant", "poisson"] = Field(
-        description="The type of asynchronous strategy to use.",
+        description="Asynchronous strategy pattern type to use",
     )
-    rate: Union[float, Sequence[float]] = Field(
-        description="The rate of requests per second to use.",
+    rate: list[PositiveFloat] = Field(
+        description="Request scheduling rate in requests per second",
     )
-    initial_burst: bool = Field(
-        default=True,
+    startup_duration: NonNegativeFloat = Field(
+        default=0.0,
         description=(
-            "True to send an initial burst of requests (math.floor(self.rate)) "
-            "to reach target rate. False to not send an initial burst."
+            "Duration in seconds for distributing startup requests "
+            "to converge quickly to desired rate"
         ),
     )
+    max_concurrency: PositiveInt | None = Field(
+        default=None,
+        description="Maximum concurrent requests to schedule",
+    )
     random_seed: int = Field(
         default=42,
-        description=(
-            "The random seed to use for the asynchronous strategy. "
-            "This is used to generate random numbers for the Poisson strategy."
-        ),
+        description="Random seed for Poisson distribution strategy",
     )
+    @classmethod
+    def resolve_args(
+        cls,
+        rate_type: str,
+        rate: list[float] | None,
+        random_seed: int,
+        **kwargs: Any,
+    ) -> dict[str, Any]:
+        """
+        Resolve arguments for async profile construction.
+        :param rate_type: Profile type identifier
+        :param rate: Rate configuration for the profile
+        :param random_seed: Seed for stochastic strategies
+        :param kwargs: Additional arguments passed through unchanged
+        :return: Resolved arguments dictionary
+        :raises ValueError: If rate is None
+        """
+        if rate is None:
+            raise ValueError("AsyncProfile requires a rate parameter")
+        kwargs["type_"] = (
+            rate_type
+            if rate_type in ["async", "constant", "poisson"]
+            else kwargs.get("type_", "async")
+        )
+        kwargs["strategy_type"] = (
+            rate_type
+            if rate_type in ["constant", "poisson"]
+            else kwargs.get("strategy_type", "constant")
+        )
+        kwargs["rate"] = rate if isinstance(rate, list) else [rate]
+        kwargs["random_seed"] = random_seed
+        return kwargs
     @property
     def strategy_types(self) -> list[StrategyType]:
-        num_strategies = len(self.rate) if isinstance(self.rate, Sequence) else 1
+        """
+        :return: Async strategy types for each configured rate
+        """
+        num_strategies = len(self.rate)
         return [self.strategy_type] * num_strategies
-    def next_strategy(self) -> Optional[SchedulingStrategy]:
-        rate = self.rate if isinstance(self.rate, Sequence) else [self.rate]
-        if self.completed_strategies >= len(rate):
+    def next_strategy(
+        self,
+        prev_strategy: SchedulingStrategy | None,
+        prev_benchmark: Benchmark | None,
+    ) -> AsyncConstantStrategy | AsyncPoissonStrategy | None:
+        """
+        Generate async strategy for the next configured rate.
+        :param prev_strategy: Previously completed strategy (unused)
+        :param prev_benchmark: Benchmark results from previous execution (unused)
+        :return: AsyncConstantStrategy or AsyncPoissonStrategy for next rate,
+            or None if all rates completed
+        :raises ValueError: If strategy_type is neither 'constant' nor 'poisson'
+        """
+        _ = (prev_strategy, prev_benchmark)  # unused
+        if len(self.completed_strategies) >= len(self.rate):
             return None
+        current_rate = self.rate[len(self.completed_strategies)]
         if self.strategy_type == "constant":
             return AsyncConstantStrategy(
-                rate=rate[self.completed_strategies],
-                initial_burst=self.initial_burst,
+                rate=current_rate,
+                startup_duration=self.startup_duration,
                 max_concurrency=self.max_concurrency,
             )
         elif self.strategy_type == "poisson":
             return AsyncPoissonStrategy(
-                rate=rate[self.completed_strategies],
-                initial_burst=self.initial_burst,
+                rate=current_rate,
+                startup_duration=self.startup_duration,
                 max_concurrency=self.max_concurrency,
                 random_seed=self.random_seed,
             )
         else:
             raise ValueError(f"Invalid strategy type: {self.strategy_type}")
-    @staticmethod
-    def from_standard_args(  # type: ignore[override]
-        rate_type: Union[StrategyType, ProfileType],
-        rate: Optional[Union[float, Sequence[float]]],
-        random_seed: int,
-        **kwargs,
-    ) -> "AsyncProfile":
-        if rate_type not in ("async", "constant", "poisson"):
-            raise ValueError(
-                "Rate type must be in ('async', 'constant', 'poisson') "
-                f"for async profile. Received: {rate_type}"
-            )
-        if not rate:
-            raise ValueError("Rate must be provided for async profile.")
-        if not isinstance(rate, Sequence):
-            rate = [rate]
-        if not all(isinstance(r, (float, int)) and r > 0 for r in rate):
-            raise ValueError(
-                f"All rate values must be positive numbers, received {rate}"
-            )
+@Profile.register("sweep")
+class SweepProfile(Profile):
+    """Adaptive multi-strategy sweep execution profile with rate discovery."""
-        if rate_type == "async":
-            rate_type = "constant"  # default to constant if not specified
-        return AsyncProfile(
-            strategy_type=rate_type,  # type: ignore[arg-type]
-            rate=rate,
-            random_seed=random_seed,
-            **kwargs,
-        )
-class SweepProfile(AsyncProfile):
     type_: Literal["sweep"] = "sweep"  # type: ignore[assignment]
     sweep_size: int = Field(
-        description="The number of strategies to generate for the sweep.",
+        description="Number of strategies to generate for the sweep",
+        ge=2,
+    )
+    strategy_type: Literal["constant", "poisson"] = "constant"
+    startup_duration: NonNegativeFloat = Field(
+        default=0.0,
+        description=(
+            "Duration in seconds for distributing startup requests "
+            "to converge quickly to desired rate"
+        ),
+    )
+    max_concurrency: PositiveInt | None = Field(
+        default=None,
+        description="Maximum concurrent requests to schedule",
+    )
+    random_seed: int = Field(
+        default=42,
+        description="Random seed for Poisson distribution strategy",
+    )
+    synchronous_rate: float = Field(
+        default=-1.0,
+        description="Measured rate from synchronous strategy execution",
+    )
+    throughput_rate: float = Field(
+        default=-1.0,
+        description="Measured rate from throughput strategy execution",
+    )
+    async_rates: list[float] = Field(
+        default_factory=list,
+        description="Generated rates for async strategy sweep",
+    )
+    measured_rates: list[float] = Field(
+        default_factory=list,
+        description="Interpolated rates between synchronous and throughput",
     )
-    rate: float = -1
-    rate_type: Literal["constant", "poisson"] = "constant"
+    @classmethod
+    def resolve_args(
+        cls,
+        rate_type: str,
+        rate: list[float] | None,
+        random_seed: int,
+        **kwargs: Any,
+    ) -> dict[str, Any]:
+        """
+        Resolve arguments for sweep profile construction.
+        :param rate_type: Async strategy type for sweep execution
+        :param rate: Rate parameter specifying sweep size (if provided)
+        :param random_seed: Seed for stochastic strategies
+        :param kwargs: Additional arguments passed through unchanged
+        :return: Resolved arguments dictionary
+        """
+        sweep_size_from_rate = int(rate[0]) if rate else settings.default_sweep_number
+        kwargs["sweep_size"] = kwargs.get("sweep_size", sweep_size_from_rate)
+        kwargs["random_seed"] = random_seed
+        if rate_type in ["constant", "poisson"]:
+            kwargs["strategy_type"] = rate_type
+        return kwargs
     @property
     def strategy_types(self) -> list[StrategyType]:
-        return (
-            ["synchronous"] + ["throughput"] + [self.rate_type] * (self.sweep_size - 2)  # type: ignore[return-value]
-        )
-    def next_strategy(self) -> Optional[SchedulingStrategy]:
-        if self.completed_strategies >= self.sweep_size:
-            return None
-        if self.completed_strategies == 0:
+        """
+        :return: Strategy types for the complete sweep sequence
+        """
+        types = ["synchronous", "throughput"]
+        types += [self.strategy_type] * (self.sweep_size - len(types))
+        return types
+    def next_strategy(
+        self,
+        prev_strategy: SchedulingStrategy | None,
+        prev_benchmark: Benchmark | None,
+    ) -> (
+        AsyncConstantStrategy
+        | AsyncPoissonStrategy
+        | SynchronousProfile
+        | ThroughputProfile
+        | None
+    ):
+        """
+        Generate the next strategy in the adaptive sweep sequence.
+        Executes synchronous and throughput strategies first to measure baseline
+        rates, then generates interpolated rates for async strategies.
+        :param prev_strategy: Previously completed strategy instance
+        :param prev_benchmark: Benchmark results from previous strategy execution
+        :return: Next strategy in sweep sequence, or None if complete
+        :raises ValueError: If strategy_type is neither 'constant' nor 'poisson'
+        """
+        if prev_strategy is None:
             return SynchronousStrategy()
-        if self.completed_strategies == 1:
+        if prev_strategy.type_ == "synchronous":
+            self.synchronous_rate = prev_benchmark.get_request_metrics_sample()[
+                "request_throughput"
+            ]
             return ThroughputStrategy(
                 max_concurrency=self.max_concurrency,
+                startup_duration=self.startup_duration,
             )
-        min_rate = self.measured_rates[0]
-        max_rate = self.measured_rates[1]
-        rates = np.linspace(min_rate, max_rate, self.sweep_size - 1)[1:]
+        if prev_strategy.type_ == "throughput":
+            self.throughput_rate = prev_benchmark.get_request_metrics_sample()[
+                "request_throughput"
+            ]
+            if self.synchronous_rate <= 0 and self.throughput_rate <= 0:
+                raise RuntimeError(
+                    "Invalid rates in sweep; aborting. "
+                    "Were there any successful requests?"
+                )
+            self.measured_rates = list(
+                np.linspace(
+                    self.synchronous_rate,
+                    self.throughput_rate,
+                    self.sweep_size - 1,
+                )
+            )[1:]  # don't rerun synchronous
-        if self.rate_type == "constant":
+        if len(self.completed_strategies) >= self.sweep_size:
+            return None
+        next_rate_index = len(
+            [
+                strat
+                for strat in self.completed_strategies
+                if strat.type_ == self.strategy_type
+            ]
+        )
+        if self.strategy_type == "constant":
             return AsyncConstantStrategy(
-                rate=rates[self.completed_strategies - 2],
-                initial_burst=self.initial_burst,
+                rate=self.measured_rates[next_rate_index],
+                startup_duration=self.startup_duration,
                 max_concurrency=self.max_concurrency,
             )
-        elif self.rate_type == "poisson":
+        elif self.strategy_type == "poisson":
             return AsyncPoissonStrategy(
-                rate=rates[self.completed_strategies - 2],
-                initial_burst=self.initial_burst,
+                rate=self.measured_rates[next_rate_index],
+                startup_duration=self.startup_duration,
                 max_concurrency=self.max_concurrency,
+                random_seed=self.random_seed,
             )
         else:
-            raise ValueError(f"Invalid strategy type: {self.rate_type}")
-    @staticmethod
-    def from_standard_args(  # type: ignore[override]
-        rate_type: Union[StrategyType, ProfileType],
-        rate: Optional[Union[float, Sequence[float]]],
-        random_seed: int,
-        **kwargs,
-    ) -> "SweepProfile":
-        if rate_type != "sweep":
-            raise ValueError("Rate type must be 'sweep' for sweep profile.")
-        if "sweep_size" in kwargs:
-            raise ValueError("Sweep size must not be provided, use rate instead.")
-        if isinstance(rate, Sequence):
-            if len(rate) != 1:
-                raise ValueError(
-                    "Rate must be a single value for sweep profile, received "
-                    f"{len(rate)} values."
-                )
-            rate = rate[0]
-        if not rate:
-            rate = settings.default_sweep_number
-        if not rate:
-            raise ValueError(
-                "Rate (sweep_size) must be provided for concurrent profile."
-            )
-        if (
-            not isinstance(rate, (int, float))
-            or (isinstance(rate, float) and not rate.is_integer())
-            or rate <= 1
-        ):
-            raise ValueError(
-                f"Rate (sweep_size) must be a positive integer > 1, received {rate} "
-                f"with type {type(rate)}"
-            )
-        if not kwargs:
-            kwargs = {}
-        if "strategy_type" not in kwargs:
-            kwargs["strategy_type"] = "constant"
-        return SweepProfile(sweep_size=int(rate), random_seed=random_seed, **kwargs)
-def create_profile(
-    rate_type: Union[StrategyType, ProfileType],
-    rate: Optional[Union[float, Sequence[float]]],
-    random_seed: int = 42,
-    **kwargs,
-) -> "Profile":
-    if rate_type == "synchronous":
-        return SynchronousProfile.from_standard_args(
-            rate_type=rate_type,
-            rate=rate,
-            **kwargs,
-        )
-    if rate_type == "concurrent":
-        return ConcurrentProfile.from_standard_args(
-            rate_type=rate_type,
-            rate=rate,
-            **kwargs,
-        )
-    if rate_type == "throughput":
-        return ThroughputProfile.from_standard_args(
-            rate_type=rate_type,
-            rate=rate,
-            **kwargs,
-        )
-    if rate_type in ("async", "constant", "poisson"):
-        return AsyncProfile.from_standard_args(
-            rate_type=rate_type,
-            rate=rate,
-            random_seed=random_seed,
-            **kwargs,
-        )
-    if rate_type == "sweep":
-        return SweepProfile.from_standard_args(
-            rate_type=rate_type,
-            rate=rate,
-            random_seed=random_seed,
-            **kwargs,
-        )
-    raise ValueError(f"Invalid profile type: {rate_type}")
+            raise ValueError(f"Invalid strategy type: {self.strategy_type}")

guidellm 0.4.0a18__py3-none-any.whl → 0.4.0a155__py3-none-any.whl

Potentially problematic release.

guidellm 0.4.0a18__py3-none-any.whl → 0.4.0a155__py3-none-any.whl