PyPI - evograd-diff - Versions diffs - 0.1.0__py3-none-any.whl - Mend

evograd-diff 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (50) hide show

evograd/__init__.py +67 -0
evograd/algorithms/__init__.py +138 -0
evograd/algorithms/cmaes.py +1365 -0
evograd/algorithms/de.py +895 -0
evograd/algorithms/ga.py +532 -0
evograd/algorithms/pso.py +648 -0
evograd/algorithms/shade.py +1165 -0
evograd/benchmarks/functions/__init__.py +229 -0
evograd/benchmarks/functions/base.py +217 -0
evograd/benchmarks/functions/cec2017/__init__.py +250 -0
evograd/benchmarks/functions/cec2017/basic.py +413 -0
evograd/benchmarks/functions/cec2017/composition.py +580 -0
evograd/benchmarks/functions/cec2017/data.pkl +0 -0
evograd/benchmarks/functions/cec2017/data.py +350 -0
evograd/benchmarks/functions/cec2017/hybrid.py +406 -0
evograd/benchmarks/functions/cec2017/simple.py +326 -0
evograd/benchmarks/functions/classical.py +649 -0
evograd/benchmarks/functions/smoothed_funnel.py +476 -0
evograd/benchmarks/functions/transforms.py +463 -0
evograd/benchmarks/run_benchmark_functions.py +1208 -0
evograd/core/__init__.py +73 -0
evograd/core/algorithm.py +778 -0
evograd/core/maximize.py +269 -0
evograd/core/minimize.py +740 -0
evograd/core/problem.py +444 -0
evograd/core/result.py +571 -0
evograd/core/termination.py +602 -0
evograd/operators/__init__.py +178 -0
evograd/operators/crossover.py +1117 -0
evograd/operators/mutation.py +1098 -0
evograd/operators/relaxations.py +175 -0
evograd/operators/repair.py +601 -0
evograd/operators/sampling.py +577 -0
evograd/operators/selection.py +981 -0
evograd/operators/survival.py +1000 -0
evograd/tests/__init__.py +11 -0
evograd/tests/run_all.py +78 -0
evograd/tests/test_core.py +528 -0
evograd/tests/test_ga.py +572 -0
evograd/tests/test_operators.py +662 -0
evograd/tests/test_per_individual.py +326 -0
evograd/tests/test_utils.py +328 -0
evograd/utils/__init__.py +97 -0
evograd/utils/callbacks.py +926 -0
evograd/utils/device.py +502 -0
evograd/utils/duplicates.py +421 -0
evograd_diff-0.1.0.dist-info/METADATA +439 -0
evograd_diff-0.1.0.dist-info/RECORD +50 -0
evograd_diff-0.1.0.dist-info/WHEEL +4 -0
evograd_diff-0.1.0.dist-info/licenses/LICENSE +201 -0

evograd/core/minimize.py ADDED Viewed

@@ -0,0 +1,740 @@
+"""
+Minimisation function for EvoGrad optimisation.
+This module provides the main entry point for running optimisation,
+following pymoo's interface style where algorithm initialisation
+happens inside the minimize function.
+Example:
+    >>> from evograd.core.problem import Problem
+    >>> from evograd.core.minimize import minimize
+    >>> from evograd.core.termination import MaxEvaluations
+    >>> from evograd.algorithms import GA
+    >>>
+    >>> # Define problem
+    >>> problem = Problem(
+    ...     objective=lambda x: (x**2).sum(dim=-1),
+    ...     n_var=30,
+    ...     xl=-100.0,
+    ...     xu=100.0,
+    ... )
+    >>>
+    >>> # Create algorithm (not initialized)
+    >>> algorithm = GA(pop_size=100, eliminate_duplicates=True)
+    >>>
+    >>> # Run optimisation
+    >>> result = minimize(
+    ...     problem,
+    ...     algorithm,
+    ...     termination=MaxEvaluations(10000),
+    ...     seed=42,
+    ...     verbose=True,
+    ...     )
+    >>>
+    >>> print(f"Best fitness: {result.best_fitness}")
+    >>> print(f"Best solution: {result.best_solution}")
+"""
+from __future__ import annotations
+import time
+from typing import TYPE_CHECKING, Any, Dict, List, Optional, Union
+import torch
+from evograd.core.result import Result, ResultBuilder
+from evograd.core.termination import (
+    Termination,
+    TerminationCollection,
+    TargetReached,
+    default_termination,
+)
+from evograd.utils.callbacks import (
+    Callback,
+    CallbackList,
+    CallbackState,
+    HistoryCallback,
+    PrintCallback,
+)
+from evograd.utils.device import set_seed
+if TYPE_CHECKING:
+    from evograd.core.algorithm import Algorithm
+    from evograd.core.problem import Problem
+# Public API of this module: ``minimize`` is the only exported name.
+__all__ = [
+    "minimize",
+]
+# Per-algorithm optimiser defaults, keyed by the algorithm's class name.
+# ``_resolve_opt_defaults`` substitutes these values when a caller passes the
+# ``-1`` sentinel and falls back to the "GA" row for class names not listed.
+# ``pop_momentum`` is the momentum given to the SGD population optimiser.
+_OPT_DEFAULTS = {
+    "GA": {
+        "lr_pop": 3e-4,
+        "lr_hyper": 0.001,
+        "grad_clip_pop": 0.2,
+        "grad_clip_hyper": 0.2,
+        "pop_momentum": 0.0,
+    },
+    "DE": {
+        "lr_pop": 0.01,
+        "lr_hyper": 0.001,
+        "grad_clip_pop": 0.5,
+        "grad_clip_hyper": 0.3,
+        "pop_momentum": 0.9,
+    },
+    "PSO": {
+        "lr_pop": 0.001,
+        "lr_hyper": 0.001,
+        "grad_clip_pop": 1.0,
+        "grad_clip_hyper": 0.1,
+        "pop_momentum": 0.9,
+    },
+    "CMAES": {
+        "lr_pop": 0.003,
+        "lr_hyper": 0.0003,
+        "grad_clip_pop": 0.5,
+        "grad_clip_hyper": 0.1,
+        "pop_momentum": 0.9,
+    },
+}
+def minimize(
+    problem: Problem,
+    algorithm: Algorithm,
+    termination: Optional[Termination] = None,
+    seed: Optional[int] = None,
+    verbose: bool = True,
+    callback: Optional[Union[Callback, List[Callback]]] = None,
+    copy_algorithm: bool = False,
+    save_history: bool = True,
+    initialize: bool = True,
+    # Differentiable mode options
+    optimizer: Optional[torch.optim.Optimizer] = None,
+    lr_pop: Optional[float] = None,
+    lr_hyper: Optional[float] = None,
+    grad_clip_pop: Optional[float] = None,
+    grad_clip_hyper: Optional[float] = None,
+    scheduler: Optional[str] = None,
+    scheduler_patience: int = 50,
+    scheduler_factor: float = 0.5,
+    min_lr: float = 1e-6,
+) -> Result:
+    """
+    Minimise an objective function using a population-based algorithm.
+    This function initialises the algorithm with the problem and runs
+    the optimisation loop until termination criteria are met. Follows
+    pymoo's interface style.
+    Differentiable Mode
+    -------------------
+    EvoGrad automatically detects learnable parameters (nn.Parameter with
+    requires_grad=True) and uses backpropagation to update them. This covers:
+    - Population updates: algorithm.differentiable=True
+    - Operator hyperparameters: operator.differentiable=True
+    - Adaptive PSO coefficients: adaptive=True (w, c1, c2 per particle)
+    - Any other learnable parameters in the algorithm
+    Thus, EvoGrad supports four combinations of differentiability:
+    1. algorithm.differentiable=False, operators.differentiable=False
+       → Pure classical EA, no backpropagation
+    2. algorithm.differentiable=False, operators.differentiable=True
+       → Classical EA dynamics, but learn operator hyperparameters
+         (e.g., crossover eta, mutation rate, PSO w/c1/c2)
+    3. algorithm.differentiable=True, operators.differentiable=False
+       → Gradient-based population updates (local search), fixed operators
+    4. algorithm.differentiable=True, operators.differentiable=True
+       → Full end-to-end differentiable optimisation
+    Args:
+        problem: Problem instance defining the objective function,
+            bounds, and constraints.
+        algorithm: Algorithm instance (e.g., GA, DE, PSO, CMAES).
+            Will be initialized inside this function.
+        termination: When to stop optimisation. Must be a Termination
+            instance (e.g., MaxEvaluations(10000)). If None, uses
+            default (10000 evaluations).
+        seed: Random seed for reproducibility. Applied before
+            algorithm initialisation.
+        verbose: If True, print progress during optimisation (a
+            PrintCallback is added unless one was supplied).
+        callback: Single Callback or list of Callbacks for monitoring.
+            A HistoryCallback is added automatically when
+            save_history=True.
+        copy_algorithm: If True, create a copy of the algorithm to
+            preserve the original. Default False.
+        save_history: If True (default), save convergence history
+            in result. Set False to reduce memory for long runs.
+        initialize: If True (default), initialize the algorithm with the
+            problem. Set to False to continue optimization with an already
+            initialized algorithm (e.g., when switching problems at runtime
+            while preserving population state and hyperparameters).
+            The algorithm must have been previously initialized. When False,
+            the termination budget is additive (e.g., MaxEvaluations(500)
+            will run 500 more evaluations from the current state); the
+            termination object passed in is modified in place to achieve
+            this.
+        # Differentiable mode options (used if learnable params exist):
+        optimizer: PyTorch optimizer, or a list/tuple of optimizers, for
+            gradient-based updates. If None, an SGD optimizer is created
+            for the population and an Adam optimizer for all other
+            learnable parameters, each only when its learning rate
+            resolves to a positive number. When an optimizer is supplied,
+            lr_pop and lr_hyper are not used to build one.
+        lr_pop: Learning rate for gradient-based updates of the population.
+            None (default) creates no population optimizer; -1 selects the
+            per-algorithm default from _OPT_DEFAULTS. A positive value is
+            divided by sqrt(problem.n_var) before use.
+        lr_hyper: Learning rate for gradient-based updates of the
+            hyperparameters. None (default) creates no hyperparameter
+            optimizer; -1 selects the per-algorithm default.
+        grad_clip_pop: Maximum gradient norm for clipping population gradient
+            (None = no clipping, -1 = per-algorithm default).
+        grad_clip_hyper: Maximum gradient norm for clipping hyperparam gradient
+            (None = no clipping, -1 = per-algorithm default).
+        scheduler: Learning rate scheduler type (case-insensitive):
+            - 'plateau': Reduce on plateau
+            - 'step': Reduce every scheduler_patience generations
+            - 'cosine': Cosine annealing
+            - 'exponential': Exponential decay
+            - None: No scheduler (default)
+        scheduler_patience: Generations without improvement before
+            reducing LR (for 'plateau' scheduler). Also the step size of
+            the 'step' scheduler and the number of generations over which
+            'exponential' decays the LR by scheduler_factor.
+        scheduler_factor: Factor to multiply LR when reducing.
+        min_lr: Minimum learning rate (passed to the 'plateau' and
+            'cosine' schedulers).
+    Returns:
+        Result object containing:
+            - best_solution: Best solution found
+            - best_fitness: Best fitness value
+            - population: Final population
+            - fitness: Final fitness values
+            - n_evals: Total evaluations
+            - n_gen: Total generations
+            - history: Convergence history (if save_history=True)
+            - success: Whether target was reached
+    Raises:
+        TypeError: If termination is neither None nor a Termination.
+        ValueError: If initialize=False and the algorithm has no
+            ``generation`` attribute or its generation is 0, or if
+            ``scheduler`` names an unknown type while at least one
+            optimizer is in use.
+    Example:
+        >>> # Basic usage (classical EA)
+        >>> result = minimize(problem, GA(pop_size=100), seed=42)
+        >>>
+        >>> # Learn operator hyperparameters with classical dynamics
+        >>> from evograd.operators import SBX, PolynomialMutation
+        >>> algorithm = GA(
+        ...     pop_size=100,
+        ...     crossover=SBX(eta=15, differentiable=True),
+        ...     mutation=PolynomialMutation(eta=20, differentiable=True),
+        ...     differentiable=False,  # Population not updated via gradients
+        ...     )
+        >>> result = minimize(problem, algorithm, termination=MaxEvaluations(10000))
+        >>>
+        >>> # Full differentiable mode
+        >>> algorithm = GA(pop_size=100, differentiable=True)
+        >>> result = minimize(problem, algorithm, lr_pop=0.01, grad_clip_pop=1.0)
+        >>>
+        >>> # Continue optimization with a different problem (e.g., surrogate -> true)
+        >>> # First optimize with surrogate problem
+        >>> pso = PSO(pop_size=100, differentiable=True)
+        >>> result1 = minimize(surrogate_problem, pso, termination=MaxEvaluations(10000))
+        >>> # Then continue with true problem (preserves velocities, personal bests)
+        >>> result2 = minimize(true_problem, pso, termination=MaxEvaluations(500),
+        ...                    initialize=False)
+    Note:
+        By default (initialize=True), the algorithm is initialized inside this
+        function. Do not call algorithm.initialize() before passing to minimize().
+        When initialize=False, the algorithm must have been previously initialized
+        (e.g., from a prior minimize() call). This allows switching problems at
+        runtime while preserving population state, velocities, and personal bests.
+    """
+    # -------------------------------------------------------------------------
+    # Setup
+    # -------------------------------------------------------------------------
+    # Set seed first for reproducibility
+    if seed is not None:
+        set_seed(seed)
+    # Copy algorithm if requested
+    if copy_algorithm:
+        import copy
+        algorithm = copy.deepcopy(algorithm)
+    # Parse termination criteria
+    termination = _parse_termination(termination)
+    # Setup callbacks
+    callbacks = _setup_callbacks(callback, verbose, save_history)
+    # Initialize algorithm with problem (or continue with existing state)
+    if initialize:
+        algorithm.initialize(problem)
+    else:
+        # Continue with existing algorithm state but update problem reference
+        # This preserves population, velocities, personal bests, etc.
+        if not hasattr(algorithm, 'generation') or algorithm.generation == 0:
+            raise ValueError(
+                "initialize=False requires a previously initialized algorithm. "
+                "Run minimize() with initialize=True first."
+            )
+        # Update problem reference and bounds
+        algorithm.problem = problem
+        algorithm.xl = problem.xl
+        algorithm.xu = problem.xu
+        # Re-evaluate the current population on the new problem so that
+        # fitness values (including personal bests in PSO) are consistent
+        # with the new objective.  Without this, stale fitness values from
+        # the old problem prevent the algorithm from accepting any new
+        # solutions (e.g., surrogate fitness ~0.003 vs ODE fitness ~200).
+        with torch.no_grad():
+            new_fitness = algorithm._evaluate(algorithm.population)
+            algorithm.state.fitness = new_fitness
+            # Reset the incumbent so update_best starts from scratch on the
+            # new objective.
+            algorithm.state.best_fitness = float('inf')
+            algorithm.state.update_best(algorithm.population, new_fitness)
+            # PSO: re-evaluate personal bests on the new problem
+            if hasattr(algorithm, '_p_best') and hasattr(algorithm, '_p_best_fitness'):
+                pb_fitness = algorithm._evaluate(algorithm._p_best)
+                algorithm._p_best_fitness.copy_(pb_fitness)
+        # Update termination budget to add to existing evaluations/generations
+        # (this mutates the termination object in place)
+        _update_termination_budget(termination, algorithm)
+    # Setup result builder
+    builder = ResultBuilder()
+    builder.set_problem(problem)
+    builder.set_algorithm(algorithm)
+    # -------------------------------------------------------------------------
+    # Setup differentiable mode
+    # -------------------------------------------------------------------------
+    # Collect all learnable parameters (nn.Parameter with requires_grad=True)
+    # and split them into the population tensor (registered under the name
+    # "_population") and everything else (treated as hyperparameters).
+    pop_params   = []
+    hyper_params = []
+    for name, p in algorithm.named_parameters():
+        if not p.requires_grad:
+            continue
+        if name == "_population":
+            pop_params.append(p)
+        else:
+            hyper_params.append(p)
+    use_backprop = (len(pop_params) > 0) or (len(hyper_params) > 0)
+    # Resolve the -1 sentinels and apply dimension scaling to lr_pop.
+    lr_pop_eff, lr_hyper_eff, grad_clip_pop, grad_clip_hyper, defaults = _resolve_opt_defaults(
+    algorithm, problem, lr_pop, lr_hyper, grad_clip_pop, grad_clip_hyper)
+    optimizers: List[torch.optim.Optimizer] = []
+    schedulers: List[Optional[torch.optim.lr_scheduler.LRScheduler]] = []
+    if use_backprop:
+        # Create optimizer if not provided
+        if optimizer is None:
+            # An optimizer is only created for a group whose learning rate is
+            # a positive number; None (the default) therefore creates none.
+            if len(pop_params) > 0 and isinstance(lr_pop_eff, (int, float)) and lr_pop_eff > 0:
+                optimizers.append(torch.optim.SGD(pop_params, lr=lr_pop_eff, momentum=defaults["pop_momentum"]))
+            if len(hyper_params) > 0 and isinstance(lr_hyper_eff, (int, float)) and lr_hyper_eff > 0:
+                optimizers.append(torch.optim.Adam(hyper_params, lr=lr_hyper_eff))
+        else:
+            # Accept a single optimizer or a list/tuple of optimizers
+            if isinstance(optimizer, (list, tuple)):
+                optimizers.extend(list(optimizer))
+            else:
+                optimizers.append(optimizer)
+        # Create LR scheduler (one per optimizer; entries are None when no
+        # scheduler type was requested)
+        est_gens = _estimate_total_generations(termination, algorithm)
+        for opt in optimizers:
+            schedulers.append(
+                _create_scheduler(
+                    opt,
+                    scheduler,
+                    scheduler_patience,
+                    scheduler_factor,
+                    min_lr,
+                    total_generations=est_gens,
+                )
+            )
+    else:
+        optimizers = []
+        schedulers = []
+    # -------------------------------------------------------------------------
+    # Create callback state
+    # -------------------------------------------------------------------------
+    state = CallbackState(
+        generation=algorithm.generation,
+        n_evals=algorithm.n_evals,
+        max_evals=getattr(termination, 'max_evals', None),
+        max_generations=getattr(termination, 'max_gens', None),
+        best_fitness=algorithm.best_fitness,
+        best_solution=algorithm.best_solution,
+        current_fitness=algorithm.fitness,
+        current_population=algorithm.population,
+        algorithm=algorithm,
+        hyperparams=algorithm._get_hyperparams(),
+    )
+    # -------------------------------------------------------------------------
+    # Optimisation loop
+    # -------------------------------------------------------------------------
+    builder.start()
+    start_time = time.perf_counter()
+    # Notify callbacks of start
+    _call_callbacks(callbacks, "on_optimisation_start", state)
+    # Reset termination state
+    termination.reset()
+    while not termination.should_terminate(algorithm):
+        # Check callback early stopping
+        if state.stop_optimisation:
+            break
+        # Generation start callback
+        _call_callbacks(callbacks, "on_generation_start", state)
+        # Run one generation
+        if use_backprop:
+            _step_differentiable(
+                algorithm,
+                optimizers,
+                schedulers,
+                pop_params,
+                hyper_params,
+                grad_clip_pop,
+                grad_clip_hyper,
+            )
+        else:
+            algorithm.step()
+        # Update callback state
+        state.generation = algorithm.generation
+        state.n_evals = algorithm.n_evals
+        state.best_fitness = algorithm.best_fitness
+        state.best_solution = algorithm.best_solution
+        state.current_fitness = algorithm.fitness
+        state.current_population = algorithm.population
+        state.hyperparams = algorithm._get_hyperparams()
+        state.elapsed_time = time.perf_counter() - start_time
+        # Generation end callback
+        _call_callbacks(callbacks, "on_generation_end", state)
+    # -------------------------------------------------------------------------
+    # Finalize
+    # -------------------------------------------------------------------------
+    # Determine success (check if TargetReached was met)
+    success = _check_target_reached(termination, algorithm)
+    # Build result
+    builder.finish(algorithm, termination, success)
+    # Get history from callbacks
+    if save_history:
+        history = _collect_history(callbacks)
+        builder.set_history(history)
+    result = builder.build()
+    # Final callback (runs after the result has been built)
+    _call_callbacks(callbacks, "on_optimisation_end", state)
+    return result
+# =============================================================================
+# Helper Functions
+# =============================================================================
+def _resolve_opt_defaults(
+    algorithm: "Algorithm",
+    problem: "Problem",
+    lr_pop,
+    lr_hyper,
+    grad_clip_pop,
+    grad_clip_hyper,
+):
+    """Fill in per-algorithm optimiser settings and scale the population LR.
+    The defaults row is looked up in ``_OPT_DEFAULTS`` by the algorithm's
+    class name; unknown names use the "GA" row.
+    Sentinel convention for the four tunables:
+        - ``-1``: replace with the value from the defaults row.
+        - ``None``: left as ``None`` (callers treat it as "disabled").
+        - anything else: passed through unchanged.
+    Args:
+        algorithm: Algorithm whose class name selects the defaults row.
+        problem: Problem providing ``n_var`` for dimension scaling.
+        lr_pop: Population learning rate (or sentinel).
+        lr_hyper: Hyperparameter learning rate (or sentinel).
+        grad_clip_pop: Population gradient-norm limit (or sentinel).
+        grad_clip_hyper: Hyperparameter gradient-norm limit (or sentinel).
+    Returns:
+        Tuple ``(lr_pop_eff, lr_hyper, grad_clip_pop, grad_clip_hyper,
+        defaults)`` where ``lr_pop_eff`` is ``lr_pop / sqrt(n_var)`` when
+        ``lr_pop`` is a positive number and ``lr_pop`` itself otherwise, and
+        ``defaults`` is the selected defaults row.
+    """
+    fallback_row = _OPT_DEFAULTS["GA"]
+    defaults = _OPT_DEFAULTS.get(algorithm.__class__.__name__, fallback_row)
+    def _or_default(value, key):
+        # -1 is the "use the table" sentinel; every other value is kept.
+        return defaults[key] if value == -1 else value
+    lr_pop = _or_default(lr_pop, "lr_pop")
+    lr_hyper = _or_default(lr_hyper, "lr_hyper")
+    grad_clip_pop = _or_default(grad_clip_pop, "grad_clip_pop")
+    grad_clip_hyper = _or_default(grad_clip_hyper, "grad_clip_hyper")
+    # Only a strictly positive numeric rate is scaled by the dimension;
+    # None, 0.0 or any other explicit value is handed back untouched.
+    is_positive_rate = isinstance(lr_pop, (int, float)) and lr_pop > 0
+    lr_pop_eff = lr_pop / (problem.n_var ** 0.5) if is_positive_rate else lr_pop
+    return lr_pop_eff, lr_hyper, grad_clip_pop, grad_clip_hyper, defaults
+def _parse_termination(termination: Optional[Termination]) -> Termination:
+    """
+    Normalise the ``termination`` argument of ``minimize``.
+    Args:
+        termination: A Termination instance, or None to request the
+            library default from ``default_termination()``.
+    Returns:
+        The given instance, or the default when None was passed.
+    Raises:
+        TypeError: If the argument is neither None nor a Termination.
+    """
+    if termination is None:
+        return default_termination()
+    # Guard clause: anything that is not a Termination is rejected outright.
+    if not isinstance(termination, Termination):
+        raise TypeError(
+            f"termination must be a Termination instance or None. "
+            f"Got {type(termination).__name__}. "
+            f"Example: termination=MaxEvaluations(10000)"
+        )
+    return termination
+def _update_termination_budget(
+    termination: Termination,
+    algorithm: "Algorithm",
+) -> None:
+    """
+    Make a termination budget additive for a continued run (initialize=False).
+    Every MaxEvaluations criterion has the algorithm's current ``n_evals``
+    added to ``max_evals`` and every MaxGenerations criterion has the
+    current ``generation`` added to ``max_gens``. Other criteria are left
+    alone. The criteria are modified in place.
+    Args:
+        termination: A single criterion or a TerminationCollection whose
+            ``criteria`` are each updated.
+        algorithm: The algorithm with current evaluation/generation counts.
+    """
+    from evograd.core.termination import (
+        MaxEvaluations,
+        MaxGenerations,
+        TerminationCollection,
+    )
+    # Treat a lone criterion as a one-element collection.
+    if isinstance(termination, TerminationCollection):
+        pending = termination.criteria
+    else:
+        pending = [termination]
+    for item in pending:
+        if isinstance(item, MaxEvaluations):
+            # Shift the evaluation cap by what has already been spent
+            item.max_evals += algorithm.n_evals
+        elif isinstance(item, MaxGenerations):
+            # Shift the generation cap by what has already been run
+            item.max_gens += algorithm.generation
+def _setup_callbacks(
+    callback: Optional[Union[Callback, List[Callback]]],
+    verbose: bool,
+    save_history: bool,
+) -> List[Callback]:
+    """Assemble the list of callbacks used by the optimisation loop.
+    Order of the returned list: an internal HistoryCallback (only when
+    ``save_history`` is True), then the user callbacks in the order given,
+    then a ``PrintCallback(every=1)`` when ``verbose`` is True and no
+    PrintCallback is already present.
+    Args:
+        callback: None, a single callback, a list or tuple of callbacks,
+            or a CallbackList (its ``callbacks`` are unpacked).
+        verbose: Whether progress printing is requested.
+        save_history: Whether convergence history should be recorded.
+    Returns:
+        A new list; the caller's container is never modified.
+    """
+    callbacks: List[Callback] = []
+    # Always include history callback if saving history
+    if save_history:
+        callbacks.append(HistoryCallback())
+    # Add user callbacks. Tuples are unpacked like lists; previously a tuple
+    # was appended as if it were one callback and failed when first invoked.
+    if callback is None:
+        pass
+    elif isinstance(callback, (list, tuple)):
+        callbacks.extend(callback)
+    elif isinstance(callback, CallbackList):
+        callbacks.extend(callback.callbacks)
+    else:
+        callbacks.append(callback)
+    # Add print callback if verbose (and not already present)
+    if verbose and not any(isinstance(cb, PrintCallback) for cb in callbacks):
+        callbacks.append(PrintCallback(every=1))
+    return callbacks
+def _call_callbacks(callbacks: List[Callback], method: str, state: CallbackState) -> None:
+    """Invoke the hook named ``method`` on each callback, in list order.
+    Args:
+        callbacks: Callbacks to notify.
+        method: Attribute name of the hook to look up on every callback.
+        state: The single argument passed to each hook.
+    """
+    for listener in callbacks:
+        hook = getattr(listener, method)
+        hook(state)
+def _collect_history(callbacks: List[Callback]) -> Dict[str, List[Any]]:
+    """Return ``to_dict()`` of the first HistoryCallback, or ``{}`` if none.
+    Args:
+        callbacks: Callbacks that were active during the run.
+    """
+    recorder = next(
+        (cb for cb in callbacks if isinstance(cb, HistoryCallback)),
+        None,
+    )
+    return {} if recorder is None else recorder.to_dict()
+def _check_target_reached(termination: Termination, algorithm: Algorithm) -> bool:
+    """Report whether a TargetReached criterion is satisfied.
+    ``termination`` may itself be a TargetReached, or a
+    TerminationCollection whose ``criteria`` are searched for TargetReached
+    entries; any satisfied entry counts. For a criterion with
+    ``minimize`` true the test is ``best_fitness <= target_fitness``,
+    otherwise ``best_fitness >= target_fitness``.
+    Args:
+        termination: Criterion (or collection) used for the run.
+        algorithm: Algorithm providing ``best_fitness``.
+    Returns:
+        A plain ``bool``; False when no TargetReached criterion is present.
+    """
+    def _is_met(criterion) -> bool:
+        best = algorithm.best_fitness
+        if criterion.minimize:
+            hit = best <= criterion.target_fitness
+        else:
+            hit = best >= criterion.target_fitness
+        # The comparison may yield a 0-dim tensor rather than a Python bool
+        # when best_fitness is a tensor; normalise so both the single and the
+        # collection path return the annotated type.
+        return bool(hit)
+    if isinstance(termination, TargetReached):
+        return _is_met(termination)
+    if isinstance(termination, TerminationCollection):
+        return any(
+            _is_met(criterion)
+            for criterion in termination.criteria
+            if isinstance(criterion, TargetReached)
+        )
+    return False
+def _estimate_total_generations(termination: Termination, algorithm: "Algorithm") -> int:
+    """
+    Estimate the total number of generations from the termination criterion.
+    Used to set ``T_max`` for the cosine-annealing scheduler so that the
+    learning-rate schedule matches the actual optimisation budget.
+    A MaxGenerations criterion contributes ``max_gens``; a MaxEvaluations
+    criterion contributes ``max_evals // pop_size``. For a
+    TerminationCollection the first criterion that yields a budget wins.
+    Args:
+        termination: Criterion (or collection) used for the run.
+        algorithm: Algorithm providing ``pop_size``.
+    Returns:
+        The estimate as an ``int`` of at least 1, or 10 000 if no budget
+        can be inferred.
+    """
+    from evograd.core.termination import MaxEvaluations, MaxGenerations, TerminationCollection
+    def _extract(term: Termination) -> Optional[int]:
+        if isinstance(term, MaxGenerations):
+            return term.max_gens
+        if isinstance(term, MaxEvaluations):
+            pop = max(algorithm.pop_size, 1)
+            return term.max_evals // pop
+        return None
+    if isinstance(termination, TerminationCollection):
+        candidates = termination.criteria
+    else:
+        candidates = [termination]
+    for criterion in candidates:
+        budget = _extract(criterion)
+        if budget is not None:
+            # A budget smaller than one population (or a zero generation
+            # cap) would give T_max == 0, which the cosine scheduler divides
+            # by; clamp so the schedule is always well defined.
+            return max(int(budget), 1)
+    return 10_000  # safe fallback
+def _create_scheduler(
+    optimizer: torch.optim.Optimizer,
+    scheduler_type: Optional[str],
+    patience: int,
+    factor: float,
+    min_lr: float,
+    total_generations: int = 10_000,
+) -> Optional[torch.optim.lr_scheduler.LRScheduler]:
+    """Create learning rate scheduler.
+    Args:
+        optimizer: Optimizer whose learning rate is scheduled.
+        scheduler_type: 'plateau', 'step', 'cosine' or 'exponential'
+            (case-insensitive), or None for no scheduler.
+        patience: ``patience`` of the plateau scheduler, ``step_size`` of
+            the step scheduler, and the number of steps over which the
+            exponential scheduler decays the rate by ``factor``.
+        factor: Multiplicative decay (``factor`` for plateau, ``gamma`` for
+            step; exponential uses ``factor ** (1 / patience)`` per step).
+        min_lr: Lower bound, used by the plateau (``min_lr``) and cosine
+            (``eta_min``) schedulers only.
+        total_generations: Estimated total generations for the optimisation
+            run. Used as ``T_max`` for the cosine-annealing scheduler.
+    Returns:
+        The scheduler instance, or None when ``scheduler_type`` is None.
+    Raises:
+        ValueError: If ``scheduler_type`` is unknown, or if ``patience`` is
+            not positive for the 'step' or 'exponential' scheduler.
+    """
+    if scheduler_type is None:
+        return None
+    scheduler_type = scheduler_type.lower()
+    # 'step' uses patience as a modulus and 'exponential' divides by it, so a
+    # non-positive value would otherwise surface as a ZeroDivisionError
+    # (for 'step' only later, in the middle of the optimisation loop).
+    if scheduler_type in ("step", "exponential") and patience <= 0:
+        raise ValueError(
+            f"scheduler_patience must be positive for the "
+            f"'{scheduler_type}' scheduler. Got {patience}."
+        )
+    if scheduler_type == "plateau":
+        return torch.optim.lr_scheduler.ReduceLROnPlateau(
+            optimizer,
+            mode="min",
+            factor=factor,
+            patience=patience,
+            min_lr=min_lr,
+        )
+    elif scheduler_type == "step":
+        return torch.optim.lr_scheduler.StepLR(
+            optimizer,
+            step_size=patience,
+            gamma=factor,
+        )
+    elif scheduler_type == "cosine":
+        return torch.optim.lr_scheduler.CosineAnnealingLR(
+            optimizer,
+            T_max=total_generations,
+            eta_min=min_lr,
+        )
+    elif scheduler_type == "exponential":
+        return torch.optim.lr_scheduler.ExponentialLR(
+            optimizer,
+            gamma=factor ** (1.0 / patience),
+        )
+    else:
+        raise ValueError(
+            f"Unknown scheduler type: {scheduler_type}. "
+            f"Use 'plateau', 'step', 'cosine', or 'exponential'."
+        )
+def _step_differentiable(
+    algorithm: Algorithm,
+    optimizers: List[torch.optim.Optimizer],
+    schedulers: List[Optional[torch.optim.lr_scheduler.LRScheduler]],
+    pop_params: Optional[List],
+    hyper_params: Optional[List],
+    grad_clip_pop: Optional[float],
+    grad_clip_hyper: Optional[float],
+) -> float:
+    """
+    Run one generation with a gradient update.
+    Sequence: zero all optimizer gradients, call ``algorithm.forward()`` to
+    obtain the loss, backpropagate, clip gradient norms, step every
+    optimizer, call ``algorithm.update_state()``, then step the schedulers.
+    Args:
+        algorithm: The algorithm instance.
+        optimizers: Optimizers to zero and step (may be empty).
+        schedulers: One entry per optimizer; None entries are skipped.
+            ReduceLROnPlateau instances are stepped with the loss value,
+            all others without arguments.
+        pop_params: Population parameters (clipped with ``grad_clip_pop``).
+        hyper_params: Hyperparameters (clipped with ``grad_clip_hyper``).
+        grad_clip_pop: Max gradient norm for the population, or None.
+        grad_clip_hyper: Max gradient norm for hyperparameters, or None.
+    Returns:
+        The loss returned by ``algorithm.forward()`` as a Python float.
+    """
+    # Make sure a differentiable population actually tracks gradients.
+    if algorithm.differentiable:
+        if isinstance(algorithm.population, torch.nn.Parameter):
+            algorithm.population.requires_grad_(True)
+    for optim in optimizers:
+        optim.zero_grad(set_to_none=True)
+    # Forward builds the graph, backward fills the .grad fields.
+    loss = algorithm.forward()
+    loss.backward()
+    # Clip each parameter group against its own limit, population first.
+    clip_plan = (
+        (pop_params, grad_clip_pop),
+        (hyper_params, grad_clip_hyper),
+    )
+    for group, max_norm in clip_plan:
+        if max_norm is not None and group:
+            torch.nn.utils.clip_grad_norm_(group, max_norm)
+    for optim in optimizers:
+        optim.step()
+    # Commit evolutionary changes
+    algorithm.update_state()
+    plateau_type = torch.optim.lr_scheduler.ReduceLROnPlateau
+    for lr_sched in (s for s in schedulers if s is not None):
+        if isinstance(lr_sched, plateau_type):
+            # Plateau scheduling needs the monitored metric.
+            lr_sched.step(loss.item())
+        else:
+            lr_sched.step()
+    return float(loss.detach())