PyPI - evograd-diff - Versions diffs - 0.1.0__py3-none-any.whl - Mend

evograd-diff 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (50) hide show

evograd/__init__.py +67 -0
evograd/algorithms/__init__.py +138 -0
evograd/algorithms/cmaes.py +1365 -0
evograd/algorithms/de.py +895 -0
evograd/algorithms/ga.py +532 -0
evograd/algorithms/pso.py +648 -0
evograd/algorithms/shade.py +1165 -0
evograd/benchmarks/functions/__init__.py +229 -0
evograd/benchmarks/functions/base.py +217 -0
evograd/benchmarks/functions/cec2017/__init__.py +250 -0
evograd/benchmarks/functions/cec2017/basic.py +413 -0
evograd/benchmarks/functions/cec2017/composition.py +580 -0
evograd/benchmarks/functions/cec2017/data.pkl +0 -0
evograd/benchmarks/functions/cec2017/data.py +350 -0
evograd/benchmarks/functions/cec2017/hybrid.py +406 -0
evograd/benchmarks/functions/cec2017/simple.py +326 -0
evograd/benchmarks/functions/classical.py +649 -0
evograd/benchmarks/functions/smoothed_funnel.py +476 -0
evograd/benchmarks/functions/transforms.py +463 -0
evograd/benchmarks/run_benchmark_functions.py +1208 -0
evograd/core/__init__.py +73 -0
evograd/core/algorithm.py +778 -0
evograd/core/maximize.py +269 -0
evograd/core/minimize.py +740 -0
evograd/core/problem.py +444 -0
evograd/core/result.py +571 -0
evograd/core/termination.py +602 -0
evograd/operators/__init__.py +178 -0
evograd/operators/crossover.py +1117 -0
evograd/operators/mutation.py +1098 -0
evograd/operators/relaxations.py +175 -0
evograd/operators/repair.py +601 -0
evograd/operators/sampling.py +577 -0
evograd/operators/selection.py +981 -0
evograd/operators/survival.py +1000 -0
evograd/tests/__init__.py +11 -0
evograd/tests/run_all.py +78 -0
evograd/tests/test_core.py +528 -0
evograd/tests/test_ga.py +572 -0
evograd/tests/test_operators.py +662 -0
evograd/tests/test_per_individual.py +326 -0
evograd/tests/test_utils.py +328 -0
evograd/utils/__init__.py +97 -0
evograd/utils/callbacks.py +926 -0
evograd/utils/device.py +502 -0
evograd/utils/duplicates.py +421 -0
evograd_diff-0.1.0.dist-info/METADATA +439 -0
evograd_diff-0.1.0.dist-info/RECORD +50 -0
evograd_diff-0.1.0.dist-info/WHEEL +4 -0
evograd_diff-0.1.0.dist-info/licenses/LICENSE +201 -0

evograd/tests/test_per_individual.py ADDED Viewed

@@ -0,0 +1,326 @@
+"""
+Test script for per-individual/per-gene parameter support in operators.
+This script demonstrates the four parameter configurations:
+    1. Fixed (scalar): Same value for all individuals and genes
+    2. Per-gene [D]: Different value per gene, same across individuals
+    3. Per-individual [N]: Different value per individual, same across genes
+    4. Per-gene + Per-individual [N, D]: Full matrix
+Run with:
+    python -m evograd.tests.test_per_individual
+"""
+import torch
+import sys
+import os
+# Add parent to path
+sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
+from evograd.operators.crossover import (
+    BinomialCrossover,
+    SBXCrossover,
+    BlendCrossover,
+    ArithmeticCrossover,
+)
+from evograd.operators.mutation import (
+    PolynomialMutation,
+    GaussianMutation,
+    UniformMutation,
+)
+def test_crossover_configurations():
+    """Test all four parameter configurations for crossover operators."""
+    print("\n" + "=" * 70)
+    print("Testing Crossover Per-Individual/Per-Gene Configurations")
+    print("=" * 70)
+    N, D = 50, 10  # 50 individuals, 10 variables
+    parent1 = torch.randn(N, D)
+    parent2 = torch.randn(N, D)
+    # ==========================================================================
+    # BinomialCrossover (DE-style) - Most important for SHADE
+    # ==========================================================================
+    print("\n1. BinomialCrossover configurations:")
+    crossover = BinomialCrossover(cr=0.9)
+    # Config 1: Fixed (default)
+    print("   a) Fixed CR (scalar) - default behavior")
+    trial = crossover(parent1, parent2)
+    assert trial.shape == (N, D), f"Expected ({N}, {D}), got {trial.shape}"
+    print(f"      Shape: {trial.shape} ✓")
+    # Config 2: Per-gene [D]
+    print("   b) Per-gene CR [D]")
+    cr_per_gene = torch.linspace(0.5, 1.0, D)  # Different CR per gene
+    trial = crossover(parent1, parent2, cr=cr_per_gene)
+    assert trial.shape == (N, D)
+    print(f"      CR shape: {cr_per_gene.shape} -> Output: {trial.shape} ✓")
+    # Config 3: Per-individual [N] - SHADE needs this!
+    print("   c) Per-individual CR [N] - SHADE-style")
+    cr_per_ind = torch.rand(N) * 0.5 + 0.5  # CR in [0.5, 1.0] per individual
+    trial = crossover(parent1, parent2, cr=cr_per_ind)
+    assert trial.shape == (N, D)
+    print(f"      CR shape: {cr_per_ind.shape} -> Output: {trial.shape} ✓")
+    # Config 4: Full matrix [N, D]
+    print("   d) Full matrix CR [N, D]")
+    cr_matrix = torch.rand(N, D)
+    trial = crossover(parent1, parent2, cr=cr_matrix)
+    assert trial.shape == (N, D)
+    print(f"      CR shape: {cr_matrix.shape} -> Output: {trial.shape} ✓")
+    # ==========================================================================
+    # SBXCrossover - Test eta and prob overrides
+    # ==========================================================================
+    print("\n2. SBXCrossover configurations:")
+    sbx = SBXCrossover(eta=15, prob=0.9)
+    # Per-individual eta
+    print("   a) Per-individual eta [N]")
+    eta_per_ind = torch.rand(N) * 15 + 5  # eta in [5, 20] per individual
+    offspring = sbx(parent1, parent2, eta=eta_per_ind)
+    assert offspring.shape == (N, D)
+    print(f"      Eta shape: {eta_per_ind.shape} -> Output: {offspring.shape} ✓")
+    # Per-gene prob
+    print("   b) Per-gene prob [D]")
+    prob_per_gene = torch.linspace(0.5, 1.0, D)
+    offspring = sbx(parent1, parent2, prob=prob_per_gene)
+    assert offspring.shape == (N, D)
+    print(f"      Prob shape: {prob_per_gene.shape} -> Output: {offspring.shape} ✓")
+    # Both eta and prob as full matrices
+    print("   c) Full matrix eta and prob [N, D]")
+    eta_matrix = torch.rand(N, D) * 15 + 5
+    prob_matrix = torch.rand(N, D) * 0.5 + 0.5
+    offspring = sbx(parent1, parent2, eta=eta_matrix, prob=prob_matrix)
+    assert offspring.shape == (N, D)
+    print(f"      Eta: {eta_matrix.shape}, Prob: {prob_matrix.shape} -> Output: {offspring.shape} ✓")
+    # ==========================================================================
+    # ArithmeticCrossover - Test alpha override
+    # ==========================================================================
+    print("\n3. ArithmeticCrossover configurations:")
+    arith = ArithmeticCrossover(alpha=0.5)
+    # Per-individual alpha
+    print("   a) Per-individual alpha [N]")
+    alpha_per_ind = torch.rand(N)
+    offspring = arith(parent1, parent2, alpha=alpha_per_ind)
+    assert offspring.shape == (N, D)
+    print(f"      Alpha shape: {alpha_per_ind.shape} -> Output: {offspring.shape} ✓")
+    # Verify arithmetic crossover formula
+    print("   b) Verify formula: offspring = alpha * p1 + (1-alpha) * p2")
+    alpha_test = 0.3
+    offspring_test = arith(parent1, parent2, alpha=alpha_test)
+    expected = alpha_test * parent1 + (1 - alpha_test) * parent2
+    assert torch.allclose(offspring_test, expected, atol=1e-6)
+    print(f"      Formula verified ✓")
+    print("\n✓ All crossover configurations passed!")
+def test_mutation_configurations():
+    """Test all four parameter configurations for mutation operators."""
+    print("\n" + "=" * 70)
+    print("Testing Mutation Per-Individual/Per-Gene Configurations")
+    print("=" * 70)
+    N, D = 50, 10  # 50 individuals, 10 variables
+    population = torch.randn(N, D)
+    xl = torch.zeros(D)
+    xu = torch.ones(D)
+    # ==========================================================================
+    # PolynomialMutation - Test eta and prob overrides
+    # ==========================================================================
+    print("\n1. PolynomialMutation configurations:")
+    mutation = PolynomialMutation(eta=20, prob=0.1)
+    # Config 1: Fixed (default)
+    print("   a) Fixed eta and prob (scalar) - default behavior")
+    mutated = mutation(population, xl, xu)
+    assert mutated.shape == (N, D)
+    print(f"      Shape: {mutated.shape} ✓")
+    # Config 2: Per-gene [D]
+    print("   b) Per-gene eta [D]")
+    eta_per_gene = torch.linspace(10, 30, D)
+    mutated = mutation(population, xl, xu, eta=eta_per_gene)
+    assert mutated.shape == (N, D)
+    print(f"      Eta shape: {eta_per_gene.shape} -> Output: {mutated.shape} ✓")
+    # Config 3: Per-individual [N]
+    print("   c) Per-individual eta [N] - Self-adaptive GA style")
+    eta_per_ind = torch.rand(N) * 20 + 10  # eta in [10, 30] per individual
+    mutated = mutation(population, xl, xu, eta=eta_per_ind)
+    assert mutated.shape == (N, D)
+    print(f"      Eta shape: {eta_per_ind.shape} -> Output: {mutated.shape} ✓")
+    # Config 4: Full matrix [N, D]
+    print("   d) Full matrix eta and prob [N, D]")
+    eta_matrix = torch.rand(N, D) * 20 + 10
+    prob_matrix = torch.rand(N, D) * 0.2
+    mutated = mutation(population, xl, xu, eta=eta_matrix, prob=prob_matrix)
+    assert mutated.shape == (N, D)
+    print(f"      Eta: {eta_matrix.shape}, Prob: {prob_matrix.shape} -> Output: {mutated.shape} ✓")
+    # ==========================================================================
+    # GaussianMutation - Test sigma override (important for DE/SHADE)
+    # ==========================================================================
+    print("\n2. GaussianMutation configurations:")
+    gauss = GaussianMutation(sigma=0.1)
+    # Per-individual sigma (like F in DE/SHADE)
+    print("   a) Per-individual sigma [N] - SHADE F-style")
+    F_per_ind = torch.rand(N) * 0.5 + 0.5  # F in [0.5, 1.0] per individual
+    mutated = gauss(population, xl, xu, sigma=F_per_ind)
+    assert mutated.shape == (N, D)
+    print(f"      Sigma shape: {F_per_ind.shape} -> Output: {mutated.shape} ✓")
+    # Per-gene sigma
+    print("   b) Per-gene sigma [D]")
+    sigma_per_gene = torch.linspace(0.05, 0.2, D)
+    mutated = gauss(population, xl, xu, sigma=sigma_per_gene)
+    assert mutated.shape == (N, D)
+    print(f"      Sigma shape: {sigma_per_gene.shape} -> Output: {mutated.shape} ✓")
+    # ==========================================================================
+    # UniformMutation - Test prob override
+    # ==========================================================================
+    print("\n3. UniformMutation configurations:")
+    unif = UniformMutation(prob=0.05)
+    # Per-individual prob
+    print("   a) Per-individual prob [N]")
+    prob_per_ind = torch.rand(N) * 0.1
+    mutated = unif(population, xl, xu, prob=prob_per_ind)
+    assert mutated.shape == (N, D)
+    print(f"      Prob shape: {prob_per_ind.shape} -> Output: {mutated.shape} ✓")
+    print("\n✓ All mutation configurations passed!")
+def test_shade_style_usage():
+    """Demonstrate SHADE-style usage with per-individual F and CR."""
+    print("\n" + "=" * 70)
+    print("Demonstrating SHADE-style Usage")
+    print("=" * 70)
+    N, D = 100, 30
+    # Simulated SHADE setup
+    print("\n1. Setting up SHADE-style parameters:")
+    # Population
+    population = torch.rand(N, D)
+    xl = torch.zeros(D)
+    xu = torch.ones(D)
+    # Per-individual F and CR (sampled from historical memory in real SHADE)
+    F_per_ind = torch.randn(N).abs() * 0.3 + 0.5  # F ~ |N(0.5, 0.3)|
+    CR_per_ind = torch.randn(N) * 0.1 + 0.5  # CR ~ N(0.5, 0.1)
+    CR_per_ind = CR_per_ind.clamp(0, 1)
+    print(f"   F per individual: shape={F_per_ind.shape}, range=[{F_per_ind.min():.3f}, {F_per_ind.max():.3f}]")
+    print(f"   CR per individual: shape={CR_per_ind.shape}, range=[{CR_per_ind.min():.3f}, {CR_per_ind.max():.3f}]")
+    # Select random individuals for mutation (DE/rand/1)
+    print("\n2. Creating donor vectors (DE/rand/1 style):")
+    r1 = torch.randint(0, N, (N,))
+    r2 = torch.randint(0, N, (N,))
+    r3 = torch.randint(0, N, (N,))
+    # Mutation: donor = x_r1 + F * (x_r2 - x_r3)
+    # Here we use per-individual F
+    diff = population[r2] - population[r3]
+    donor = population[r1] + F_per_ind.unsqueeze(1) * diff
+    print(f"   Donor vectors created: {donor.shape}")
+    # Binomial crossover with per-individual CR
+    print("\n3. Applying binomial crossover with per-individual CR:")
+    crossover = BinomialCrossover(cr=0.5)  # Default CR, but we'll override
+    trial = crossover(population, donor, cr=CR_per_ind)
+    print(f"   Trial vectors created: {trial.shape}")
+    # Verify different individuals have different number of genes crossed
+    genes_from_donor = (trial == donor).float().sum(dim=1)
+    print(f"   Genes from donor (per individual): mean={genes_from_donor.mean():.1f}, std={genes_from_donor.std():.1f}")
+    print("\n✓ SHADE-style demonstration complete!")
+def test_differentiable_mode():
+    """Test gradient flow with per-individual parameters."""
+    print("\n" + "=" * 70)
+    print("Testing Gradient Flow with Per-Individual Parameters")
+    print("=" * 70)
+    N, D = 20, 5
+    # Differentiable operators
+    print("\n1. SBXCrossover with gradient flow:")
+    sbx = SBXCrossover(eta=15, prob=0.9, differentiable=True, learn_eta=True)
+    p1 = torch.nn.Parameter(torch.randn(N, D))
+    p2 = torch.randn(N, D)
+    eta_per_ind = torch.rand(N) * 10 + 5  # Not learnable, just passed in
+    offspring = sbx(p1, p2, eta=eta_per_ind)
+    loss = offspring.sum()
+    loss.backward()
+    assert p1.grad is not None, "Gradients should flow to parent1"
+    print(f"   Gradients flow through per-individual eta: ✓")
+    print(f"   Parent1 grad norm: {p1.grad.norm():.4f}")
+    # PolynomialMutation with gradient flow
+    print("\n2. PolynomialMutation with gradient flow:")
+    mutation = PolynomialMutation(eta=20, prob=0.1, differentiable=True, learn_eta=True)
+    x = torch.nn.Parameter(torch.randn(N, D))
+    xl = torch.zeros(D)
+    xu = torch.ones(D)
+    eta_per_ind = torch.rand(N) * 20 + 10
+    mutated = mutation(x, xl, xu, eta=eta_per_ind)
+    loss = mutated.sum()
+    loss.backward()
+    assert x.grad is not None, "Gradients should flow to input"
+    print(f"   Gradients flow through per-individual eta: ✓")
+    print(f"   Input grad norm: {x.grad.norm():.4f}")
+    print("\n✓ All gradient tests passed!")
+def main():
+    """Run all tests."""
+    print("\n" + "#" * 70)
+    print("# Per-Individual/Per-Gene Parameter Support Tests")
+    print("#" * 70)
+    test_crossover_configurations()
+    test_mutation_configurations()
+    test_shade_style_usage()
+    test_differentiable_mode()
+    print("\n" + "=" * 70)
+    print("ALL TESTS PASSED! ✓")
+    print("=" * 70)
+    print("\nSummary of Four Configurations:")
+    print("  1. Fixed (scalar)     - Same value for all")
+    print("  2. Per-gene [D]       - Different per variable")
+    print("  3. Per-individual [N] - Different per individual (SHADE needs this!)")
+    print("  4. Full matrix [N, D] - Maximum flexibility")
+if __name__ == "__main__":
+    main()

evograd/tests/test_utils.py ADDED Viewed

@@ -0,0 +1,328 @@
+"""
+Test script for EvoGrad utils module.
+Tests:
+    - device.py: Device detection and tensor movement
+    - duplicates.py: Duplicate elimination
+    - callbacks.py: Callback system
+Usage:
+    python -m evograd.tests.test_utils
+"""
+import sys
+import torch
+import torch.nn as nn
+import tempfile
+import os
+# Add parent of evograd to path for imports
+sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__file__)))))
+from evograd.utils.device import get_device, to_device
+from evograd.utils.duplicates import (
+    DuplicateMethod,
+    DuplicateEliminator,
+    eliminate_duplicates,
+    has_duplicates,
+    count_duplicates,
+)
+from evograd.utils.callbacks import (
+    Callback,
+    CallbackList,
+    CallbackState,
+    HistoryCallback,
+    PrintCallback,
+    EarlyStoppingCallback,
+    CheckpointCallback,
+    ConvergenceCallback,
+)
+def test_device():
+    """Test device detection and tensor movement."""
+    print("\n" + "="*60)
+    print("Testing device.py")
+    print("="*60)
+    # Test get_device
+    print("\n1. Testing get_device()...")
+    device = get_device()
+    print(f"   Default device: {device}")
+    assert isinstance(device, torch.device)
+    # Test with specific device string
+    cpu_device = get_device("cpu")
+    print(f"   CPU device: {cpu_device}")
+    assert cpu_device.type == "cpu"
+    # Test auto detection (None means auto)
+    auto_device = get_device(None)
+    print(f"   Auto device: {auto_device}")
+    # Test to_device with tensors (keyword-only device argument)
+    print("\n2. Testing to_device() with tensors...")
+    x = torch.randn(10, 5)
+    y = torch.randn(3, 3)
+    x_moved, y_moved = to_device(x, y, device=cpu_device)
+    print(f"   Moved tensors to {x_moved.device}")
+    assert x_moved.device == cpu_device
+    assert y_moved.device == cpu_device
+    # Test to_device with single tensor
+    print("\n3. Testing to_device() with single tensor...")
+    z = torch.randn(5)
+    (z_moved,) = to_device(z, device=cpu_device)
+    print(f"   Moved single tensor to {z_moved.device}")
+    assert z_moved.device == cpu_device
+    print("\n✓ device.py tests passed!")
+def test_duplicates():
+    """Test duplicate elimination strategies."""
+    print("\n" + "="*60)
+    print("Testing duplicates.py")
+    print("="*60)
+    # Create test population with duplicates
+    pop = torch.tensor([
+        [1.0, 2.0, 3.0],
+        [1.0, 2.0, 3.0],  # Exact duplicate of row 0
+        [4.0, 5.0, 6.0],
+        [1.0001, 2.0001, 3.0001],  # Near duplicate of row 0
+        [7.0, 8.0, 9.0],
+    ])
+    xl = torch.zeros(3)
+    xu = torch.ones(3) * 10
+    # Test DuplicateEliminator with EPSILON_L2
+    print("\n1. Testing DuplicateEliminator (EPSILON_L2)...")
+    eliminator = DuplicateEliminator(
+        method=DuplicateMethod.EPSILON_L2,
+        epsilon=0.01,
+    )
+    # Eliminate duplicates by calling the eliminator
+    new_pop = eliminator(pop, xl, xu)
+    print(f"   Original population shape: {pop.shape}")
+    print(f"   Population after elimination: {new_pop.shape}")
+    print(f"   Duplicates found: {eliminator.n_duplicates_found}")
+    print(f"   Duplicates resolved: {eliminator.n_duplicates_resolved}")
+    # Test has_duplicates function
+    print("\n2. Testing has_duplicates()...")
+    has_dups = has_duplicates(pop, epsilon=0.01)
+    print(f"   Has duplicates: {has_dups}")
+    assert has_dups == True, "Population should have duplicates"
+    # Test count_duplicates function
+    print("\n3. Testing count_duplicates()...")
+    n_dups = count_duplicates(pop, epsilon=0.01)
+    print(f"   Number of duplicates: {n_dups}")
+    assert n_dups >= 1, "Should find at least 1 duplicate"
+    # Test DuplicateEliminator with HASH method
+    print("\n4. Testing DuplicateEliminator (HASH)...")
+    hash_eliminator = DuplicateEliminator(
+        method=DuplicateMethod.HASH,
+        decimals=2,
+    )
+    new_pop_hash = hash_eliminator(pop, xl, xu)
+    print(f"   Hash method duplicates found: {hash_eliminator.n_duplicates_found}")
+    # Test DuplicateEliminator with NONE method
+    print("\n5. Testing DuplicateEliminator (NONE)...")
+    no_elim = DuplicateEliminator(method=DuplicateMethod.NONE)
+    new_pop_none = no_elim(pop, xl, xu)
+    assert torch.allclose(new_pop_none, pop), "NONE method should not modify population"
+    print("   NONE method correctly leaves population unchanged")
+    # Test eliminate_duplicates convenience function
+    print("\n6. Testing eliminate_duplicates()...")
+    cleaned_pop = eliminate_duplicates(pop, xl, xu, epsilon=0.01)
+    print(f"   Cleaned population shape: {cleaned_pop.shape}")
+    print("\n✓ duplicates.py tests passed!")
+def test_callbacks():
+    """Test callback system."""
+    print("\n" + "="*60)
+    print("Testing callbacks.py")
+    print("="*60)
+    # Test HistoryCallback
+    print("\n1. Testing HistoryCallback...")
+    history_cb = HistoryCallback(
+        track_population=True,
+        track_hyperparams=True,
+        track_diversity=False,
+        track_fitness_stats=True,
+    )
+    # Create initial state
+    state = CallbackState(
+        generation=0,
+        n_evals=0,
+        best_fitness=float('inf'),
+        best_solution=torch.randn(5),
+        current_fitness=torch.randn(10),
+        current_population=torch.randn(10, 5),
+    )
+    history_cb.on_optimisation_start(state)
+    for gen in range(5):
+        state.generation = gen
+        state.n_evals = (gen + 1) * 10
+        state.best_fitness = 100.0 / (gen + 1)
+        state.current_fitness = torch.randn(10)
+        history_cb.on_generation_end(state)
+    print(f"   Tracked generations: {len(history_cb.generations)}")
+    print(f"   Best fitness history: {history_cb.best_fitness[:3]}...")
+    assert len(history_cb.generations) == 5
+    assert len(history_cb.best_fitness) == 5
+    # Test PrintCallback
+    print("\n2. Testing PrintCallback...")
+    print_cb = PrintCallback(every=2, show_time=True)
+    state = CallbackState(generation=0, n_evals=0, best_fitness=100.0)
+    print_cb.on_optimisation_start(state)
+    for gen in range(4):
+        state.generation = gen
+        state.best_fitness = 100.0 - gen * 10
+        state.n_evals = gen * 10
+        print_cb.on_generation_end(state)
+    print_cb.on_optimisation_end(state)
+    print("   PrintCallback executed without errors")
+    # Test EarlyStoppingCallback
+    print("\n3. Testing EarlyStoppingCallback...")
+    early_stop_cb = EarlyStoppingCallback(
+        patience=3,
+        min_delta=0.1,
+    )
+    state = CallbackState(generation=0, n_evals=0, best_fitness=100.0)
+    early_stop_cb.on_optimisation_start(state)
+    # Simulate improvement then stagnation
+    fitness_sequence = [100, 90, 80, 80, 80, 80]  # Stagnates after 3rd
+    stopped_at = None
+    for gen, fit in enumerate(fitness_sequence):
+        state.generation = gen
+        state.best_fitness = fit
+        early_stop_cb.on_generation_end(state)
+        if state.stop_optimisation:
+            stopped_at = gen
+            break
+    print(f"   Early stopping triggered at generation: {stopped_at}")
+    assert stopped_at is not None, "Early stopping should have triggered"
+    # Test CheckpointCallback
+    print("\n4. Testing CheckpointCallback...")
+    with tempfile.TemporaryDirectory() as tmpdir:
+        # Create a mock module for checkpointing
+        mock_module = nn.Linear(5, 1)
+        checkpoint_cb = CheckpointCallback(
+            directory=tmpdir,
+            every=2,
+            save_best_only=True,
+        )
+        state = CallbackState(
+            generation=0,
+            n_evals=0,
+            best_fitness=100.0,
+            algorithm=mock_module,
+        )
+        checkpoint_cb.on_optimisation_start(state)
+        for gen in range(5):
+            state.generation = gen
+            state.best_fitness = 100.0 - gen * 20
+            checkpoint_cb.on_generation_end(state)
+        checkpoint_cb.on_optimisation_end(state)
+        # Check files were created
+        files = os.listdir(tmpdir)
+        print(f"   Checkpoint files created: {files}")
+        assert len(files) > 0, "Should have created checkpoint files"
+    # Test ConvergenceCallback
+    print("\n5. Testing ConvergenceCallback...")
+    conv_cb = ConvergenceCallback(
+        threshold=0.001,
+        window=3,
+        min_generations=0,
+    )
+    state = CallbackState(generation=0, n_evals=0, best_fitness=100.0)
+    conv_cb.on_optimisation_start(state)
+    # Simulate convergence
+    fitness_sequence = [100.0, 50.0, 25.0, 24.999, 24.998, 24.997]
+    stopped_at = None
+    for gen, fit in enumerate(fitness_sequence):
+        state.generation = gen
+        state.best_fitness = fit
+        conv_cb.on_generation_end(state)
+        if state.stop_optimisation:
+            stopped_at = gen
+            break
+    print(f"   Convergence detected at generation: {stopped_at}")
+    # Test CallbackList
+    print("\n6. Testing CallbackList...")
+    cb_list = CallbackList([
+        HistoryCallback(),
+        PrintCallback(every=10),
+    ])
+    state = CallbackState(generation=0, n_evals=0, best_fitness=100.0)
+    cb_list.on_optimisation_start(state)
+    for gen in range(3):
+        state.generation = gen
+        state.best_fitness = 100.0 - gen
+        cb_list.on_generation_end(state)
+    cb_list.on_optimisation_end(state)
+    print("   CallbackList executed all callbacks")
+    print("\n✓ callbacks.py tests passed!")
+def run_all_tests():
+    """Run all utils tests."""
+    print("\n" + "#"*60)
+    print("# EvoGrad Utils Module Tests")
+    print("#"*60)
+    try:
+        test_device()
+        test_duplicates()
+        test_callbacks()
+        print("\n" + "="*60)
+        print("✓ ALL UTILS TESTS PASSED!")
+        print("="*60)
+        return True
+    except Exception as e:
+        print(f"\n✗ TEST FAILED: {e}")
+        import traceback
+        traceback.print_exc()
+        return False
+if __name__ == "__main__":
+    success = run_all_tests()
+    sys.exit(0 if success else 1)