evolutionary-policy-optimization 0.0.22__py3-none-any.whl → 0.0.24__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- evolutionary_policy_optimization/epo.py +66 -20
- {evolutionary_policy_optimization-0.0.22.dist-info → evolutionary_policy_optimization-0.0.24.dist-info}/METADATA +3 -2
- evolutionary_policy_optimization-0.0.24.dist-info/RECORD +7 -0
- evolutionary_policy_optimization-0.0.22.dist-info/RECORD +0 -7
- {evolutionary_policy_optimization-0.0.22.dist-info → evolutionary_policy_optimization-0.0.24.dist-info}/WHEEL +0 -0
- {evolutionary_policy_optimization-0.0.22.dist-info → evolutionary_policy_optimization-0.0.24.dist-info}/licenses/LICENSE +0 -0
evolutionary_policy_optimization/epo.py

@@ -8,6 +8,7 @@ import torch.nn.functional as F
 from torch.nn import Linear, Module, ModuleList
 from torch.utils.data import TensorDataset, DataLoader
 
+import einx
 from einops import rearrange, repeat, einsum
 from einops.layers.torch import Rearrange
 
@@ -31,11 +32,14 @@ def identity(t):
 def xnor(x, y):
     return not (x ^ y)
 
-def …
-    return …
+def divisible_by(num, den):
+    return (num % den) == 0
 
 # tensor helpers
 
+def l2norm(t):
+    return F.normalize(t, p = 2, dim = -1)
+
 def log(t, eps = 1e-20):
     return t.clamp(min = eps).log()
 
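The two new helpers are tiny but load-bearing: `divisible_by` guards the even split of the gene pool across islands, and `l2norm` keeps latents on the unit hypersphere. A quick sanity check of both, with the helper bodies copied verbatim from the hunk above:

```python
import torch
import torch.nn.functional as F

def divisible_by(num, den):
    return (num % den) == 0

def l2norm(t):
    # unit-normalize the last dimension (p = 2 is the euclidean norm)
    return F.normalize(t, p = 2, dim = -1)

assert divisible_by(64, 4)      # 64 latents split cleanly over 4 islands
assert not divisible_by(64, 5)  # 5 islands would trip the new assert below

t = torch.randn(3, 8)
assert torch.allclose(l2norm(t).norm(dim = -1), torch.ones(3), atol = 1e-6)
```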
@@ -290,7 +294,7 @@ class ShouldRunGeneticAlgorithm(Module):
         # however, this equation does not make much sense to me if fitness increases unbounded
         # just let it be customizable, and offer a variant where mean and variance is over some threshold (could account for skew too)
 
-        return (fitnesses.amax() - fitnesses.amin()) > (self.gamma * torch.median(fitnesses))
+        return (fitnesses.amax(dim = -1) - fitnesses.amin(dim = -1)) > (self.gamma * torch.median(fitnesses, dim = -1).values)
 
# classes
 
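The criterion itself is unchanged; only its shape handling is. With fitness now shaped `(islands, population per island)`, reducing over `dim = -1` yields one boolean per island instead of a single scalar. A minimal illustration, with `gamma` as a made-up threshold (the real default lives in `ShouldRunGeneticAlgorithm`):

```python
import torch

gamma = 1.5  # illustrative only

fitnesses = torch.tensor([
    [1.0, 1.1, 1.2, 1.3],  # tightly clustered island - not worth evolving yet
    [0.5, 2.0, 4.0, 9.0],  # wide spread island - run the genetic algorithm
])

spread = fitnesses.amax(dim = -1) - fitnesses.amin(dim = -1)
should_run = spread > gamma * torch.median(fitnesses, dim = -1).values
print(should_run)  # tensor([False,  True])
```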
@@ -300,6 +304,7 @@ class LatentGenePool(Module):
         num_latents, # same as gene pool size
         dim_latent, # gene dimension
         num_latent_sets = 1, # allow for sets of latents / gene per individual, expression of a set controlled by the environment
+        num_islands = 1, # add the island strategy, which has been effectively used in a few recent works
         dim_state = None,
         frozen_latents = True,
         crossover_random = True, # random interp from parent1 to parent2 for crossover, set to `False` for averaging (0.5 constant value)
@@ -340,6 +345,9 @@ class LatentGenePool(Module):
 
         # some derived values
 
+        assert num_islands >= 1
+        assert divisible_by(num_latents, num_islands)
+
         assert 0. < frac_tournaments < 1.
         assert 0. < frac_natural_selected < 1.
         assert 0. <= frac_elitism < 1.
@@ -347,13 +355,16 @@ class LatentGenePool(Module):
 
         self.dim_latent = dim_latent
         self.num_latents = num_latents
-        self.num_natural_selected = int(frac_natural_selected * num_latents)
+        self.num_islands = num_islands
+
+        latents_per_island = num_latents // num_islands
+        self.num_natural_selected = int(frac_natural_selected * latents_per_island)
 
         self.num_tournament_participants = int(frac_tournaments * self.num_natural_selected)
         self.crossover_random = crossover_random
 
         self.mutation_strength = mutation_strength
-        self.num_elites = int(frac_elitism * num_latents)
+        self.num_elites = int(frac_elitism * latents_per_island)
         self.has_elites = self.num_elites > 0
 
         if not exists(should_run_genetic_algorithm):
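Note that the natural-selection and elitism counts are now derived from the per-island population, not the global pool. Working through the arithmetic with hypothetical numbers (none of these values are package defaults):

```python
num_latents = 128
num_islands = 4
frac_natural_selected = 0.25
frac_elitism = 0.1

latents_per_island = num_latents // num_islands                         # 32
num_natural_selected = int(frac_natural_selected * latents_per_island)  # 8 survivors per island
num_elites = int(frac_elitism * latents_per_island)                     # 3 untouched elites per island
```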
@@ -369,13 +380,15 @@ class LatentGenePool(Module):
         inplace = True
     ):
         """
+        i - islands
         p - population
         g - gene dimension
         n - number of genes per individual
+        t - num tournament participants
         """
 
-        …
-        …
+        islands = self.num_islands
+        tournament_participants = self.num_tournament_participants
 
         assert self.num_latents > 1
 
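The new `i` axis simply comes from reshaping the flat population, so islands are contiguous chunks of the gene pool. A round-trip sketch of the split and merge used in the next hunk, under arbitrary assumed shapes:

```python
import torch
from einops import rearrange

islands, pop_per_island, n, g = 4, 8, 1, 32
genes = torch.randn(islands * pop_per_island, n, g)  # flat pool, islands stored contiguously

genes_islands = rearrange(genes, '(i p) n g -> i p n g', i = islands)  # split for the GA
genes_merged  = rearrange(genes_islands, 'i p ... -> (i p) ...')       # merge back afterwards

assert torch.equal(genes, genes_merged)
```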
@@ -384,39 +397,64 @@ class LatentGenePool(Module):
         pop_size = genes.shape[0]
         assert pop_size == fitness.shape[0]
 
+        pop_size_per_island = pop_size // islands
+
+        # split out the islands
+
+        fitness = rearrange(fitness, '(i p) -> i p', i = islands)
+
+        # from the fitness, decide whether to actually run the genetic algorithm or not
+
+        should_update_per_island = self.should_run_genetic_algorithm(fitness)
+
+        if not should_update_per_island.any():
+            if inplace:
+                return
+
+            return genes
+
+        genes = rearrange(genes, '(i p) n g -> i p n g', i = islands)
+
+        orig_genes = genes
+
         # 1. natural selection is simple in silico
         # you sort the population by the fitness and slice off the least fit end
 
-        sorted_indices = fitness.sort().indices
-        natural_selected_indices = sorted_indices[-self.num_natural_selected:]
-        …
+        sorted_indices = fitness.sort(dim = -1).indices
+        natural_selected_indices = sorted_indices[..., -self.num_natural_selected:]
+        natural_select_gene_indices = repeat(natural_selected_indices, '... -> ... n g', n = genes.shape[-2], g = genes.shape[-1])
+
+        genes, fitness = genes.gather(1, natural_select_gene_indices), fitness.gather(1, natural_selected_indices)
 
         # 2. for finding pairs of parents to replete gene pool, we will go with the popular tournament strategy
 
-        …
+        rand_tournament_gene_ids = torch.randn((islands, pop_size_per_island - self.num_natural_selected, tournament_participants)).argsort(dim = -1)
+        rand_tournament_gene_ids_for_gather = rearrange(rand_tournament_gene_ids, 'i p t -> i (p t)')
 
-        …
-        participant_fitness = …
+        participant_fitness = fitness.gather(1, rand_tournament_gene_ids_for_gather)
+        participant_fitness = rearrange(participant_fitness, 'i (p t) -> i p t', t = tournament_participants)
 
-        …
+        parent_indices_at_tournament = participant_fitness.topk(2, dim = -1).indices
+        parent_gene_ids = rand_tournament_gene_ids.gather(-1, parent_indices_at_tournament)
 
-        …
+        parent_gene_ids_for_gather = repeat(parent_gene_ids, 'i p parents -> i (p parents) n g', n = genes.shape[-2], g = genes.shape[-1])
 
-        parents = …
+        parents = genes.gather(1, parent_gene_ids_for_gather)
+        parents = rearrange(parents, 'i (p parents) ... -> i p parents ...', parents = 2)
 
         # 3. do a crossover of the parents - in their case they went for a simple averaging, but since we are doing tournament style and the same pair of parents may be re-selected, lets make it random interpolation
 
-        parent1, parent2 = parents.unbind(dim = 1)
+        parent1, parent2 = parents.unbind(dim = 2)
         children = crossover_latents(parent1, parent2, random = self.crossover_random)
 
         # append children to gene pool
 
-        genes = cat((children, genes))
+        genes = cat((children, genes), dim = 1)
 
         # 4. they use the elitism strategy to protect best performing genes from being changed
 
         if self.has_elites:
-            genes, elites = genes[:-self.num_elites], genes[-self.num_elites:]
+            genes, elites = genes[:, :-self.num_elites], genes[:, -self.num_elites:]
 
         # 5. mutate with gaussian noise - todo: add drawing the mutation rate from exponential distribution, from the fast genetic algorithms paper from 2017
 
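The batched tournament is the densest part of the rewrite: participant indices are drawn per island, flattened so `gather` can index the population dim, then folded back. The sketch below reproduces that gather/rearrange dance under assumed sizes; unlike the hunk, it draws participant ids from the whole selected pool (`randn(..., num_selected).argsort()[..., :t]`) so each tournament gets `t` distinct entrants:

```python
import torch

islands, num_selected, num_children, t = 2, 6, 4, 3

fitness = torch.randn(islands, num_selected)  # fitness of the already-selected genes

# t distinct participant ids per tournament, drawn independently per island
ids = torch.randn(islands, num_children, num_selected).argsort(dim = -1)[..., :t]

# flatten tournaments so gather can index the population dim, then fold back
participant_fitness = fitness.gather(1, ids.reshape(islands, -1))
participant_fitness = participant_fitness.reshape(islands, num_children, t)

# the two fittest entrants of every tournament become the parents
winner_slots = participant_fitness.topk(2, dim = -1).indices  # positions within each tournament
parent_ids = ids.gather(-1, winner_slots)                     # (islands, num_children, 2) gene ids
```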
@@ -425,10 +463,18 @@ class LatentGenePool(Module):
         # add back the elites
 
         if self.has_elites:
-            genes = cat((genes, elites))
+            genes = cat((genes, elites), dim = 1)
 
         genes = self.maybe_l2norm(genes)
 
+        # account for criteria of whether to actually run GA or not
+
+        genes = einx.where('i, i ..., i ...', should_update_per_island, genes, orig_genes)
+
+        # merge island back into pop dimension
+
+        genes = rearrange(genes, 'i p ... -> (i p) ...')
+
         if not inplace:
             return genes
 
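`einx.where` is what ties the skip-criterion back in: the pattern `'i, i ..., i ...'` (taken verbatim from the hunk) broadcasts one boolean per island across all trailing dims, so islands that were not evolved keep their original genes. A minimal check of that broadcast, with made-up shapes:

```python
import torch
import einx

should_update = torch.tensor([True, False])  # one flag per island
evolved = torch.ones(2, 4, 1, 8)             # (i, p, n, g) after the GA
original = torch.zeros(2, 4, 1, 8)           # genes as they were before

genes = einx.where('i, i ..., i ...', should_update, evolved, original)
assert genes[0].eq(1).all() and genes[1].eq(0).all()
```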
{evolutionary_policy_optimization-0.0.22.dist-info → evolutionary_policy_optimization-0.0.24.dist-info}/METADATA

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: evolutionary-policy-optimization
-Version: 0.0.22
+Version: 0.0.24
 Summary: EPO - Pytorch
 Project-URL: Homepage, https://pypi.org/project/evolutionary-policy-optimization/
 Project-URL: Repository, https://github.com/lucidrains/evolutionary-policy-optimization
@@ -36,7 +36,8 @@ Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
 Requires-Python: >=3.9
 Requires-Dist: adam-atan2-pytorch
 Requires-Dist: assoc-scan
-Requires-Dist: einops>=0.8.0
+Requires-Dist: einops>=0.8.1
+Requires-Dist: einx>=0.3.0
 Requires-Dist: hl-gauss-pytorch>=0.1.19
 Requires-Dist: torch>=2.2
 Requires-Dist: tqdm
evolutionary_policy_optimization-0.0.24.dist-info/RECORD

@@ -0,0 +1,7 @@
+evolutionary_policy_optimization/__init__.py,sha256=Qavcia0n13jjaWIS_LPW7QrxSLT_BBeKujCjF9kQjbA,133
+evolutionary_policy_optimization/epo.py,sha256=-kQgrnnOLiCOZ-6EroO057tDx0sS7TQro92cjJhSbZU,20353
+evolutionary_policy_optimization/experimental.py,sha256=ktBKxRF27Qsj7WIgBpYlWXqMVxO9zOx2oD1JuDYRAwM,548
+evolutionary_policy_optimization-0.0.24.dist-info/METADATA,sha256=d3imh1p1-nPpNGhD8cReLdL07_-oHZs3YqJaOEJi1TM,4958
+evolutionary_policy_optimization-0.0.24.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+evolutionary_policy_optimization-0.0.24.dist-info/licenses/LICENSE,sha256=1yCiA9b5nhslTavxPjsQAO-wpOnwJR9-l8LTVi7GJuk,1066
+evolutionary_policy_optimization-0.0.24.dist-info/RECORD,,
evolutionary_policy_optimization-0.0.22.dist-info/RECORD

@@ -1,7 +0,0 @@
-evolutionary_policy_optimization/__init__.py,sha256=Qavcia0n13jjaWIS_LPW7QrxSLT_BBeKujCjF9kQjbA,133
-evolutionary_policy_optimization/epo.py,sha256=TbUX2L-Wa2zIZ2b7iHmBtaym-qDSLAFrC7iU7xReX_k,18449
-evolutionary_policy_optimization/experimental.py,sha256=ktBKxRF27Qsj7WIgBpYlWXqMVxO9zOx2oD1JuDYRAwM,548
-evolutionary_policy_optimization-0.0.22.dist-info/METADATA,sha256=L3G-tesSEyhrc_SbTN6HuJQlXfogEUvr3W9SXPcnRVw,4931
-evolutionary_policy_optimization-0.0.22.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
-evolutionary_policy_optimization-0.0.22.dist-info/licenses/LICENSE,sha256=1yCiA9b5nhslTavxPjsQAO-wpOnwJR9-l8LTVi7GJuk,1066
-evolutionary_policy_optimization-0.0.22.dist-info/RECORD,,
The WHEEL and licenses/LICENSE files carry over without changes.