brainstate 0.1.8__py2.py3-none-any.whl → 0.1.9__py2.py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (133)
  1. brainstate/__init__.py +58 -51
  2. brainstate/_compatible_import.py +148 -148
  3. brainstate/_state.py +1605 -1663
  4. brainstate/_state_test.py +52 -52
  5. brainstate/_utils.py +47 -47
  6. brainstate/augment/__init__.py +30 -30
  7. brainstate/augment/_autograd.py +778 -778
  8. brainstate/augment/_autograd_test.py +1289 -1289
  9. brainstate/augment/_eval_shape.py +99 -99
  10. brainstate/augment/_eval_shape_test.py +38 -38
  11. brainstate/augment/_mapping.py +1060 -1060
  12. brainstate/augment/_mapping_test.py +597 -597
  13. brainstate/augment/_random.py +151 -151
  14. brainstate/compile/__init__.py +38 -38
  15. brainstate/compile/_ad_checkpoint.py +204 -204
  16. brainstate/compile/_ad_checkpoint_test.py +49 -49
  17. brainstate/compile/_conditions.py +256 -256
  18. brainstate/compile/_conditions_test.py +220 -220
  19. brainstate/compile/_error_if.py +92 -92
  20. brainstate/compile/_error_if_test.py +52 -52
  21. brainstate/compile/_jit.py +346 -346
  22. brainstate/compile/_jit_test.py +143 -143
  23. brainstate/compile/_loop_collect_return.py +536 -536
  24. brainstate/compile/_loop_collect_return_test.py +58 -58
  25. brainstate/compile/_loop_no_collection.py +184 -184
  26. brainstate/compile/_loop_no_collection_test.py +50 -50
  27. brainstate/compile/_make_jaxpr.py +888 -888
  28. brainstate/compile/_make_jaxpr_test.py +156 -156
  29. brainstate/compile/_progress_bar.py +202 -202
  30. brainstate/compile/_unvmap.py +159 -159
  31. brainstate/compile/_util.py +147 -147
  32. brainstate/environ.py +563 -563
  33. brainstate/environ_test.py +62 -62
  34. brainstate/functional/__init__.py +27 -26
  35. brainstate/graph/__init__.py +29 -29
  36. brainstate/graph/_graph_node.py +244 -244
  37. brainstate/graph/_graph_node_test.py +73 -73
  38. brainstate/graph/_graph_operation.py +1738 -1738
  39. brainstate/graph/_graph_operation_test.py +563 -563
  40. brainstate/init/__init__.py +26 -26
  41. brainstate/init/_base.py +52 -52
  42. brainstate/init/_generic.py +244 -244
  43. brainstate/init/_random_inits.py +553 -553
  44. brainstate/init/_random_inits_test.py +149 -149
  45. brainstate/init/_regular_inits.py +105 -105
  46. brainstate/init/_regular_inits_test.py +50 -50
  47. brainstate/mixin.py +365 -363
  48. brainstate/mixin_test.py +77 -73
  49. brainstate/nn/__init__.py +135 -131
  50. brainstate/{functional → nn}/_activations.py +808 -813
  51. brainstate/{functional → nn}/_activations_test.py +331 -331
  52. brainstate/nn/_collective_ops.py +514 -514
  53. brainstate/nn/_collective_ops_test.py +43 -43
  54. brainstate/nn/_common.py +178 -178
  55. brainstate/nn/_conv.py +501 -501
  56. brainstate/nn/_conv_test.py +238 -238
  57. brainstate/nn/_delay.py +509 -502
  58. brainstate/nn/_delay_test.py +238 -184
  59. brainstate/nn/_dropout.py +426 -426
  60. brainstate/nn/_dropout_test.py +100 -100
  61. brainstate/nn/_dynamics.py +1343 -1343
  62. brainstate/nn/_dynamics_test.py +78 -78
  63. brainstate/nn/_elementwise.py +1119 -1119
  64. brainstate/nn/_elementwise_test.py +169 -169
  65. brainstate/nn/_embedding.py +58 -58
  66. brainstate/nn/_exp_euler.py +92 -92
  67. brainstate/nn/_exp_euler_test.py +35 -35
  68. brainstate/nn/_fixedprob.py +239 -239
  69. brainstate/nn/_fixedprob_test.py +114 -114
  70. brainstate/nn/_inputs.py +608 -608
  71. brainstate/nn/_linear.py +424 -424
  72. brainstate/nn/_linear_mv.py +83 -83
  73. brainstate/nn/_linear_mv_test.py +120 -120
  74. brainstate/nn/_linear_test.py +107 -107
  75. brainstate/nn/_ltp.py +28 -28
  76. brainstate/nn/_module.py +377 -377
  77. brainstate/nn/_module_test.py +40 -40
  78. brainstate/nn/_neuron.py +705 -705
  79. brainstate/nn/_neuron_test.py +161 -161
  80. brainstate/nn/_normalizations.py +975 -918
  81. brainstate/nn/_normalizations_test.py +73 -73
  82. brainstate/{functional → nn}/_others.py +46 -46
  83. brainstate/nn/_poolings.py +1177 -1177
  84. brainstate/nn/_poolings_test.py +217 -217
  85. brainstate/nn/_projection.py +486 -486
  86. brainstate/nn/_rate_rnns.py +554 -554
  87. brainstate/nn/_rate_rnns_test.py +63 -63
  88. brainstate/nn/_readout.py +209 -209
  89. brainstate/nn/_readout_test.py +53 -53
  90. brainstate/nn/_stp.py +236 -236
  91. brainstate/nn/_synapse.py +505 -505
  92. brainstate/nn/_synapse_test.py +131 -131
  93. brainstate/nn/_synaptic_projection.py +423 -423
  94. brainstate/nn/_synouts.py +162 -162
  95. brainstate/nn/_synouts_test.py +57 -57
  96. brainstate/nn/_utils.py +89 -89
  97. brainstate/nn/metrics.py +388 -388
  98. brainstate/optim/__init__.py +38 -38
  99. brainstate/optim/_base.py +64 -64
  100. brainstate/optim/_lr_scheduler.py +448 -448
  101. brainstate/optim/_lr_scheduler_test.py +50 -50
  102. brainstate/optim/_optax_optimizer.py +152 -152
  103. brainstate/optim/_optax_optimizer_test.py +53 -53
  104. brainstate/optim/_sgd_optimizer.py +1104 -1104
  105. brainstate/random/__init__.py +24 -24
  106. brainstate/random/_rand_funs.py +3616 -3616
  107. brainstate/random/_rand_funs_test.py +567 -567
  108. brainstate/random/_rand_seed.py +210 -210
  109. brainstate/random/_rand_seed_test.py +48 -48
  110. brainstate/random/_rand_state.py +1409 -1409
  111. brainstate/random/_random_for_unit.py +52 -52
  112. brainstate/surrogate.py +1957 -1957
  113. brainstate/transform.py +23 -23
  114. brainstate/typing.py +304 -304
  115. brainstate/util/__init__.py +50 -50
  116. brainstate/util/caller.py +98 -98
  117. brainstate/util/error.py +55 -55
  118. brainstate/util/filter.py +469 -469
  119. brainstate/util/others.py +540 -540
  120. brainstate/util/pretty_pytree.py +945 -945
  121. brainstate/util/pretty_pytree_test.py +159 -159
  122. brainstate/util/pretty_repr.py +328 -328
  123. brainstate/util/pretty_table.py +2954 -2954
  124. brainstate/util/scaling.py +258 -258
  125. brainstate/util/struct.py +523 -523
  126. {brainstate-0.1.8.dist-info → brainstate-0.1.9.dist-info}/METADATA +91 -99
  127. brainstate-0.1.9.dist-info/RECORD +130 -0
  128. {brainstate-0.1.8.dist-info → brainstate-0.1.9.dist-info}/WHEEL +1 -1
  129. {brainstate-0.1.8.dist-info → brainstate-0.1.9.dist-info/licenses}/LICENSE +202 -202
  130. brainstate/functional/_normalization.py +0 -81
  131. brainstate/functional/_spikes.py +0 -204
  132. brainstate-0.1.8.dist-info/RECORD +0 -132
  133. {brainstate-0.1.8.dist-info → brainstate-0.1.9.dist-info}/top_level.txt +0 -0
brainstate/optim/_lr_scheduler.py
@@ -1,448 +1,448 @@
- # Copyright 2024 BDP Ecosystem Limited. All Rights Reserved.
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- # ==============================================================================
-
- # -*- coding: utf-8 -*-
-
- from typing import Sequence, Union
-
- import jax
- import jax.numpy as jnp
- import numpy as np
-
- from brainstate import environ
- from brainstate._state import State, LongTermState
- from brainstate.graph import Node
-
- __all__ = [
-     'LearningRateScheduler',
-     'ConstantLR',
-     'StepLR',
-     'MultiStepLR',
-     'CosineAnnealingLR',
-     'CosineAnnealingWarmRestarts',
-     'ExponentialLR',
-     'ExponentialDecayLR',
-     'InverseTimeDecayLR',
-     'PolynomialDecayLR',
-     'PiecewiseConstantLR',
- ]
-
-
- # learning rate schedules #
- # ----------------------- #
-
-
- def make_schedule(scalar_or_schedule):
-     if isinstance(scalar_or_schedule, LearningRateScheduler):
-         return scalar_or_schedule
-     elif isinstance(scalar_or_schedule, (int, float, State)):
-         return ConstantLR(scalar_or_schedule)
-     else:
-         raise TypeError(type(scalar_or_schedule))
-
-
- class LearningRateScheduler(Node):
-     """
-     The learning rate scheduler.
-
-     Parameters
-     ----------
-     lr: float, State
-       The learning rate.
-     last_epoch: int
-       The index of last epoch.
-
-     """
-
-     def __init__(self, lr: Union[float, State], last_epoch: int = -1):
-         super().__init__()
-         if isinstance(lr, State):
-             lr.value = jnp.asarray(lr.value, dtype=environ.dftype())
-         else:
-             lr = jnp.asarray(lr, dtype=environ.dftype())
-         self._lr = lr
-         assert last_epoch >= -1, 'last_epoch should be greater than -1.'
-         self.last_epoch = LongTermState(jnp.asarray(last_epoch, dtype=environ.ditype()))
-
-     @property
-     def lr(self):
-         return self._lr.value if isinstance(self._lr, State) else self._lr
-
-     @lr.setter
-     def lr(self, value):
-         if isinstance(value, State):
-             value = value.value
-         assert jnp.ndim(value) == 0, 'The learning rate should be a scalar.'
-         if isinstance(self._lr, State):
-             self._lr.value = value
-         else:
-             self._lr = value
-
-     def step_epoch(self):
-         """
-         Update the epoch count.
-         """
-         self.last_epoch.value += 1
-
-     def step_call(self):
-         """
-         Update the call count.
-         """
-         pass
-
-     def __call__(self, i=None):
-         raise NotImplementedError
-
-
- class ConstantLR(LearningRateScheduler):
-     """
-     Constant learning rate scheduler.
-     """
-
-     def __call__(self, i=None):
-         return self.lr
-
-
- class CallBasedLRScheduler(LearningRateScheduler):
-     """
-     The learning rate scheduler based on the call count.
-
-     Parameters
-     ----------
-     lr: float
-       The learning rate.
-     last_epoch: int
-       The index of last epoch.
-     last_call: int
-       The index of last call.
-
-     """
-
-     def __init__(self, lr: Union[float, State], last_epoch: int = -1, last_call: int = -1):
-         super().__init__(lr=lr, last_epoch=last_epoch)
-
-         assert last_call >= -1, 'last_call should be greater than -1.'
-         self.last_call = LongTermState(jnp.asarray(last_call, dtype=environ.ditype()))
-
-     def step_call(self):
-         """
-         Update the call count.
-         """
-         self.last_call.value += 1
-
-
- class StepLR(LearningRateScheduler):
-     """Decays the learning rate of each parameter group by gamma every
-     `step_size` epochs.
-
-     Parameters
-     ----------
-     lr: float
-       Initial learning rate.
-     step_size: int
-       Period of learning rate decay.
-     gamma: float
-       Multiplicative factor of learning rate decay.
-       Default: 0.1.
-     last_epoch: int
-       The index of last epoch. Default: -1.
-     """
-
-     def __init__(
-         self,
-         lr: float,
-         step_size: int,
-         gamma: float = 0.1,
-         last_epoch: int = -1
-     ):
-         super().__init__(lr=lr, last_epoch=last_epoch)
-
-         assert step_size >= 1, 'step_size should be greater than or equal to 1.'
-         assert 1. >= gamma >= 0, 'gamma should be in the range [0, 1].'
-         self.step_size = step_size
-         self.gamma = gamma
-
-     def __call__(self, i=None):
-         i = (self.last_epoch.value + 1) if i is None else i
-         return self.lr * self.gamma ** (jnp.floor_divide(i, self.step_size))
-
-
- class MultiStepLR(LearningRateScheduler):
-     """Decays the learning rate of each parameter group by gamma once the
-     number of epoch reaches one of the milestones. Notice that such decay can
-     happen simultaneously with other changes to the learning rate from outside
-     this scheduler. When last_epoch=-1, sets initial lr as lr.
-
-     Parameters
-     ----------
-     lr: float
-       Initial learning rate.
-     milestones: sequence of int
-       List of epoch indices. Must be increasing.
-     gamma: float
-       Multiplicative factor of learning rate decay.
-       Default: 0.1.
-     last_epoch: int
-       The index of last epoch. Default: -1.
-     """
-
-     def __init__(
-         self,
-         lr: float,
-         milestones: Sequence[int],
-         gamma: float = 0.1,
-         last_epoch: int = -1
-     ):
-         super().__init__(lr=lr, last_epoch=last_epoch)
-
-         assert len(milestones) > 0, 'milestones should be a non-empty sequence.'
-         assert all([milestones[i] < milestones[i + 1] for i in range(len(milestones) - 1)]), (
-             'milestones should be a sequence of increasing integers.'
-         )
-         assert 1. >= gamma >= 0, 'gamma should be in the range [0, 1].'
-         self.milestones = jnp.asarray((-1,) + tuple(milestones) + (np.iinfo(np.int32).max,), dtype=environ.ditype())
-         self.gamma = gamma
-
-     def __call__(self, i=None):
-         i = (self.last_epoch.value + 1) if i is None else i
-         conditions = jnp.logical_and((i >= self.milestones[:-1]), (i < self.milestones[1:]))
-         p = jnp.argmax(conditions)
-         return self.lr * self.gamma ** p
-
-
- class CosineAnnealingLR(LearningRateScheduler):
-     r"""Set the learning rate of each parameter group using a cosine annealing
-     schedule, where :math:`\eta_{max}` is set to the initial lr and
-     :math:`T_{cur}` is the number of epochs since the last restart in SGDR:
-
-     .. math::
-         \begin{aligned}
-             \eta_t & = \eta_{min} + \frac{1}{2}(\eta_{max} - \eta_{min})\left(1
-             + \cos\left(\frac{T_{cur}}{T_{max}}\pi\right)\right),
-             & T_{cur} \neq (2k+1)T_{max}; \\
-             \eta_{t+1} & = \eta_{t} + \frac{1}{2}(\eta_{max} - \eta_{min})
-             \left(1 - \cos\left(\frac{1}{T_{max}}\pi\right)\right),
-             & T_{cur} = (2k+1)T_{max}.
-         \end{aligned}
-
-     When last_epoch=-1, sets initial lr as lr. Notice that because the schedule
-     is defined recursively, the learning rate can be simultaneously modified
-     outside this scheduler by other operators. If the learning rate is set
-     solely by this scheduler, the learning rate at each step becomes:
-
-     .. math::
-         \eta_t = \eta_{min} + \frac{1}{2}(\eta_{max} - \eta_{min})\left(1 +
-         \cos\left(\frac{T_{cur}}{T_{max}}\pi\right)\right)
-
-     It has been proposed in
-     `SGDR: Stochastic Gradient Descent with Warm Restarts`_. Note that this only
-     implements the cosine annealing part of SGDR, and not the restarts.
-
-     Parameters
-     ----------
-     lr: float
-       Initial learning rate.
-     T_max: int
-       Maximum number of iterations.
-     eta_min: float
-       Minimum learning rate. Default: 0.
-     last_epoch: int
-       The index of last epoch. Default: -1.
-
-     .. _SGDR\: Stochastic Gradient Descent with Warm Restarts:
-         https://arxiv.org/abs/1608.03983
-     """
-
-     def __init__(
-         self,
-         lr: float,
-         T_max: int,
-         eta_min: float = 0.,
-         last_epoch: int = -1,
-     ):
-         super().__init__(lr=lr, last_epoch=last_epoch)
-
-         assert T_max >= 1, 'T_max should be greater than or equal to 1.'
-         self._init_epoch = last_epoch
-         self.T_max = T_max
-         self.eta_min = eta_min
-
-     def __call__(self, i=None):
-         i = (self.last_epoch.value + 1) if i is None else i
-         return self.eta_min + (self.lr - self.eta_min) * (1 + jnp.cos(jnp.pi * i / self.T_max)) / 2
-
-
- class CosineAnnealingWarmRestarts(CallBasedLRScheduler):
-     r"""Set the learning rate of each parameter group using a cosine annealing
-     schedule, where :math:`\eta_{max}` is set to the initial lr, :math:`T_{cur}`
-     is the number of epochs since the last restart and :math:`T_{i}` is the number
-     of epochs between two warm restarts in SGDR:
-
-     .. math::
-         \eta_t = \eta_{min} + \frac{1}{2}(\eta_{max} - \eta_{min})\left(1 +
-         \cos\left(\frac{T_{cur}}{T_{i}}\pi\right)\right)
-
-     When :math:`T_{cur}=T_{i}`, set :math:`\eta_t = \eta_{min}`.
-     When :math:`T_{cur}=0` after restart, set :math:`\eta_t=\eta_{max}`.
-
-     It has been proposed in
-     `SGDR: Stochastic Gradient Descent with Warm Restarts`_.
-
-     Parameters
-     ----------
-     lr: float
-       Initial learning rate.
-     num_call_per_epoch: int
-       The number the scheduler to call in each epoch.
-       This usually means the number of batch in each epoch training.
-     T_0: int
-       Number of iterations for the first restart.
-     T_mult: int
-       A factor increases :math:`T_{i}` after a restart. Default: 1.
-     eta_min: float
-       Minimum learning rate. Default: 0.
-     last_call: int
-       The index of last call. Default: -1.
-
-     .. _SGDR\: Stochastic Gradient Descent with Warm Restarts:
-         https://arxiv.org/abs/1608.03983
-     """
-
-     def __init__(
-         self,
-         lr: float,
-         num_call_per_epoch: int,
-         T_0: int,
-         T_mult: int = 1,
-         eta_min: float = 0.,
-         last_epoch: int = -1,
-         last_call: int = -1
-     ):
-         super().__init__(lr=lr, last_call=last_call, last_epoch=last_epoch)
-         if T_0 <= 0 or not isinstance(T_0, int):
-             raise ValueError("Expected positive integer T_0, but got {}".format(T_0))
-         if T_mult < 1 or not isinstance(T_mult, int):
-             raise ValueError("Expected integer T_mult >= 1, but got {}".format(T_mult))
-
-         self.T_mult = T_mult
-         self.eta_min = eta_min
-         self.T_0 = T_0
-         self.num_call_per_epoch = num_call_per_epoch
-
-     def _cond1(self, epoch):
-         if self.T_mult == 1:
-             T_cur = epoch % self.T_0
-             T_i = self.T_0
-         else:
-             n = jnp.floor(jnp.log(epoch / self.T_0 * (self.T_mult - 1) + 1) / jnp.log(self.T_mult))
-             T_cur = epoch - self.T_0 * (self.T_mult ** n - 1) / (self.T_mult - 1)
-             T_i = self.T_0 * self.T_mult ** n
-         return T_cur, T_i
-
-     def _cond2(self, epoch):
-         return epoch, self.T_0
-
-     def __call__(self, i=None):
-         epoch = self.current_epoch(i)
-         T_cur, T_i = jax.lax.cond(epoch >= self.T_0, self._cond1, self._cond2, epoch)
-         return self.eta_min + (self.lr - self.eta_min) * (1 + jnp.cos(jnp.pi * T_cur / T_i)) / 2
-
-     def current_epoch(self, i=None):
-         i = (self.last_call.value + 1) if i is None else i
-         return jnp.floor(i / self.num_call_per_epoch)
-
-
- class ExponentialLR(LearningRateScheduler):
-     """Decays the learning rate of each parameter group by gamma every epoch.
-     When last_epoch=-1, sets initial lr as lr.
-
-     Parameters
-     ----------
-     lr: float
-       Initial learning rate.
-     gamma: float
-       Multiplicative factor of learning rate decay.
-     last_epoch: int
-       The index of last epoch. Default: -1.
-     """
-
-     def __init__(self,
-                  lr: float,
-                  gamma: float,
-                  last_epoch: int = -1):
-         super(ExponentialLR, self).__init__(lr=lr, last_epoch=last_epoch)
-         assert 1. >= gamma >= 0, 'gamma should be in the range [0, 1].'
-         self.gamma = gamma
-
-     def __call__(self, i: int = None):
-         i = (self.last_epoch.value + 1) if i is None else i
-         return self.lr * self.gamma ** i
-
-
- class ExponentialDecayLR(CallBasedLRScheduler):
-     def __init__(self, lr, decay_steps, decay_rate, last_epoch: int = -1, last_call: int = -1):
-         super().__init__(lr=lr, last_epoch=last_epoch, last_call=last_call)
-         self.decay_steps = decay_steps
-         self.decay_rate = decay_rate
-
-     def __call__(self, i=None):
-         i = (self.last_call.value + 1) if i is None else i
-         return self.lr * self.decay_rate ** (i / self.decay_steps)
-
-
- class InverseTimeDecayLR(ExponentialDecayLR):
-     def __init__(self, lr, decay_steps, decay_rate, staircase=False,
-                  last_epoch: int = -1, last_call: int = -1):
-         super().__init__(lr, decay_steps, decay_rate, last_epoch=last_epoch, last_call=last_call)
-         self.staircase = staircase
-
-     def __call__(self, i=None):
-         i = (self.last_call.value + 1) if i is None else i
-         if self.staircase:
-             return self.lr / (1 + self.decay_rate * jnp.floor(i / self.decay_steps))
-         else:
-             return self.lr / (1 + self.decay_rate * i / self.decay_steps)
-
-
- class PolynomialDecayLR(CallBasedLRScheduler):
-     def __init__(self, lr, decay_steps, final_lr, power=1.0, last_epoch: int = -1, last_call: int = -1):
-         super(PolynomialDecayLR, self).__init__(lr, last_epoch=last_epoch, last_call=last_call)
-         self.decay_steps = decay_steps
-         self.final_lr = final_lr
-         self.power = power
-
-     def __call__(self, i=None):
-         i = (self.last_call.value + 1) if i is None else i
-         i = jnp.minimum(i, self.decay_steps)
-         step_mult = (1 - i / self.decay_steps) ** self.power
-         return step_mult * (self.lr - self.final_lr) + self.final_lr
-
-
- class PiecewiseConstantLR(CallBasedLRScheduler):
-     def __init__(self, boundaries, values, last_epoch: int = -1, last_call: int = -1):
-         super().__init__(0., last_epoch=last_epoch, last_call=last_call)
-
-         boundaries = jnp.array(boundaries)
-         values = jnp.array(values)
-         if not boundaries.ndim == values.ndim == 1:
-             raise ValueError("boundaries and values must be sequences")
-         if not boundaries.shape[0] == values.shape[0] - 1:
-             raise ValueError("boundaries length must be one shorter than values length")
-         self.boundaries = boundaries
-         self.values = values
-
-     def __call__(self, i=None):
-         i = (self.last_call.value + 1) if i is None else i
-         return self.values[jnp.sum(i > self.boundaries)]
+ # Copyright 2024 BDP Ecosystem Limited. All Rights Reserved.
+ #
+ # Licensed under the Apache License, Version 2.0 (the "License");
+ # you may not use this file except in compliance with the License.
+ # You may obtain a copy of the License at
+ #
+ # http://www.apache.org/licenses/LICENSE-2.0
+ #
+ # Unless required by applicable law or agreed to in writing, software
+ # distributed under the License is distributed on an "AS IS" BASIS,
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ # See the License for the specific language governing permissions and
+ # limitations under the License.
+ # ==============================================================================
+
+ # -*- coding: utf-8 -*-
+
+ from typing import Sequence, Union
+
+ import jax
+ import jax.numpy as jnp
+ import numpy as np
+
+ from brainstate import environ
+ from brainstate._state import State, LongTermState
+ from brainstate.graph import Node
+
+ __all__ = [
+     'LearningRateScheduler',
+     'ConstantLR',
+     'StepLR',
+     'MultiStepLR',
+     'CosineAnnealingLR',
+     'CosineAnnealingWarmRestarts',
+     'ExponentialLR',
+     'ExponentialDecayLR',
+     'InverseTimeDecayLR',
+     'PolynomialDecayLR',
+     'PiecewiseConstantLR',
+ ]
+
+
+ # learning rate schedules #
+ # ----------------------- #
+
+
+ def make_schedule(scalar_or_schedule):
+     if isinstance(scalar_or_schedule, LearningRateScheduler):
+         return scalar_or_schedule
+     elif isinstance(scalar_or_schedule, (int, float, State)):
+         return ConstantLR(scalar_or_schedule)
+     else:
+         raise TypeError(type(scalar_or_schedule))
+
+
+ class LearningRateScheduler(Node):
+     """
+     The learning rate scheduler.
+
+     Parameters
+     ----------
+     lr: float, State
+       The learning rate.
+     last_epoch: int
+       The index of last epoch.
+
+     """
+
+     def __init__(self, lr: Union[float, State], last_epoch: int = -1):
+         super().__init__()
+         if isinstance(lr, State):
+             lr.value = jnp.asarray(lr.value, dtype=environ.dftype())
+         else:
+             lr = jnp.asarray(lr, dtype=environ.dftype())
+         self._lr = lr
+         assert last_epoch >= -1, 'last_epoch should be greater than -1.'
+         self.last_epoch = LongTermState(jnp.asarray(last_epoch, dtype=environ.ditype()))
+
+     @property
+     def lr(self):
+         return self._lr.value if isinstance(self._lr, State) else self._lr
+
+     @lr.setter
+     def lr(self, value):
+         if isinstance(value, State):
+             value = value.value
+         assert jnp.ndim(value) == 0, 'The learning rate should be a scalar.'
+         if isinstance(self._lr, State):
+             self._lr.value = value
+         else:
+             self._lr = value
+
+     def step_epoch(self):
+         """
+         Update the epoch count.
+         """
+         self.last_epoch.value += 1
+
+     def step_call(self):
+         """
+         Update the call count.
+         """
+         pass
+
+     def __call__(self, i=None):
+         raise NotImplementedError
+
+
+ class ConstantLR(LearningRateScheduler):
+     """
+     Constant learning rate scheduler.
+     """
+
+     def __call__(self, i=None):
+         return self.lr
+
+
+ class CallBasedLRScheduler(LearningRateScheduler):
+     """
+     The learning rate scheduler based on the call count.
+
+     Parameters
+     ----------
+     lr: float
+       The learning rate.
+     last_epoch: int
+       The index of last epoch.
+     last_call: int
+       The index of last call.
+
+     """
+
+     def __init__(self, lr: Union[float, State], last_epoch: int = -1, last_call: int = -1):
+         super().__init__(lr=lr, last_epoch=last_epoch)
+
+         assert last_call >= -1, 'last_call should be greater than -1.'
+         self.last_call = LongTermState(jnp.asarray(last_call, dtype=environ.ditype()))
+
+     def step_call(self):
+         """
+         Update the call count.
+         """
+         self.last_call.value += 1
+
+
+ class StepLR(LearningRateScheduler):
+     """Decays the learning rate of each parameter group by gamma every
+     `step_size` epochs.
+
+     Parameters
+     ----------
+     lr: float
+       Initial learning rate.
+     step_size: int
+       Period of learning rate decay.
+     gamma: float
+       Multiplicative factor of learning rate decay.
+       Default: 0.1.
+     last_epoch: int
+       The index of last epoch. Default: -1.
+     """
+
+     def __init__(
+         self,
+         lr: float,
+         step_size: int,
+         gamma: float = 0.1,
+         last_epoch: int = -1
+     ):
+         super().__init__(lr=lr, last_epoch=last_epoch)
+
+         assert step_size >= 1, 'step_size should be greater than or equal to 1.'
+         assert 1. >= gamma >= 0, 'gamma should be in the range [0, 1].'
+         self.step_size = step_size
+         self.gamma = gamma
+
+     def __call__(self, i=None):
+         i = (self.last_epoch.value + 1) if i is None else i
+         return self.lr * self.gamma ** (jnp.floor_divide(i, self.step_size))
+
+
+ class MultiStepLR(LearningRateScheduler):
+     """Decays the learning rate of each parameter group by gamma once the
+     number of epoch reaches one of the milestones. Notice that such decay can
+     happen simultaneously with other changes to the learning rate from outside
+     this scheduler. When last_epoch=-1, sets initial lr as lr.
+
+     Parameters
+     ----------
+     lr: float
+       Initial learning rate.
+     milestones: sequence of int
+       List of epoch indices. Must be increasing.
+     gamma: float
+       Multiplicative factor of learning rate decay.
+       Default: 0.1.
+     last_epoch: int
+       The index of last epoch. Default: -1.
+     """
+
+     def __init__(
+         self,
+         lr: float,
+         milestones: Sequence[int],
+         gamma: float = 0.1,
+         last_epoch: int = -1
+     ):
+         super().__init__(lr=lr, last_epoch=last_epoch)
+
+         assert len(milestones) > 0, 'milestones should be a non-empty sequence.'
+         assert all([milestones[i] < milestones[i + 1] for i in range(len(milestones) - 1)]), (
+             'milestones should be a sequence of increasing integers.'
+         )
+         assert 1. >= gamma >= 0, 'gamma should be in the range [0, 1].'
+         self.milestones = jnp.asarray((-1,) + tuple(milestones) + (np.iinfo(np.int32).max,), dtype=environ.ditype())
+         self.gamma = gamma
+
+     def __call__(self, i=None):
+         i = (self.last_epoch.value + 1) if i is None else i
+         conditions = jnp.logical_and((i >= self.milestones[:-1]), (i < self.milestones[1:]))
+         p = jnp.argmax(conditions)
+         return self.lr * self.gamma ** p
+
+
+ class CosineAnnealingLR(LearningRateScheduler):
+     r"""Set the learning rate of each parameter group using a cosine annealing
+     schedule, where :math:`\eta_{max}` is set to the initial lr and
+     :math:`T_{cur}` is the number of epochs since the last restart in SGDR:
+
+     .. math::
+         \begin{aligned}
+             \eta_t & = \eta_{min} + \frac{1}{2}(\eta_{max} - \eta_{min})\left(1
+             + \cos\left(\frac{T_{cur}}{T_{max}}\pi\right)\right),
+             & T_{cur} \neq (2k+1)T_{max}; \\
+             \eta_{t+1} & = \eta_{t} + \frac{1}{2}(\eta_{max} - \eta_{min})
+             \left(1 - \cos\left(\frac{1}{T_{max}}\pi\right)\right),
+             & T_{cur} = (2k+1)T_{max}.
+         \end{aligned}
+
+     When last_epoch=-1, sets initial lr as lr. Notice that because the schedule
+     is defined recursively, the learning rate can be simultaneously modified
+     outside this scheduler by other operators. If the learning rate is set
+     solely by this scheduler, the learning rate at each step becomes:
+
+     .. math::
+         \eta_t = \eta_{min} + \frac{1}{2}(\eta_{max} - \eta_{min})\left(1 +
+         \cos\left(\frac{T_{cur}}{T_{max}}\pi\right)\right)
+
+     It has been proposed in
+     `SGDR: Stochastic Gradient Descent with Warm Restarts`_. Note that this only
+     implements the cosine annealing part of SGDR, and not the restarts.
+
+     Parameters
+     ----------
+     lr: float
+       Initial learning rate.
+     T_max: int
+       Maximum number of iterations.
+     eta_min: float
+       Minimum learning rate. Default: 0.
+     last_epoch: int
+       The index of last epoch. Default: -1.
+
+     .. _SGDR\: Stochastic Gradient Descent with Warm Restarts:
+         https://arxiv.org/abs/1608.03983
+     """
+
+     def __init__(
+         self,
+         lr: float,
+         T_max: int,
+         eta_min: float = 0.,
+         last_epoch: int = -1,
+     ):
+         super().__init__(lr=lr, last_epoch=last_epoch)
+
+         assert T_max >= 1, 'T_max should be greater than or equal to 1.'
+         self._init_epoch = last_epoch
+         self.T_max = T_max
+         self.eta_min = eta_min
+
+     def __call__(self, i=None):
+         i = (self.last_epoch.value + 1) if i is None else i
+         return self.eta_min + (self.lr - self.eta_min) * (1 + jnp.cos(jnp.pi * i / self.T_max)) / 2
+
+
+ class CosineAnnealingWarmRestarts(CallBasedLRScheduler):
+     r"""Set the learning rate of each parameter group using a cosine annealing
+     schedule, where :math:`\eta_{max}` is set to the initial lr, :math:`T_{cur}`
+     is the number of epochs since the last restart and :math:`T_{i}` is the number
+     of epochs between two warm restarts in SGDR:
+
+     .. math::
+         \eta_t = \eta_{min} + \frac{1}{2}(\eta_{max} - \eta_{min})\left(1 +
+         \cos\left(\frac{T_{cur}}{T_{i}}\pi\right)\right)
+
+     When :math:`T_{cur}=T_{i}`, set :math:`\eta_t = \eta_{min}`.
+     When :math:`T_{cur}=0` after restart, set :math:`\eta_t=\eta_{max}`.
+
+     It has been proposed in
+     `SGDR: Stochastic Gradient Descent with Warm Restarts`_.
+
+     Parameters
+     ----------
+     lr: float
+       Initial learning rate.
+     num_call_per_epoch: int
+       The number the scheduler to call in each epoch.
+       This usually means the number of batch in each epoch training.
+     T_0: int
+       Number of iterations for the first restart.
+     T_mult: int
+       A factor increases :math:`T_{i}` after a restart. Default: 1.
+     eta_min: float
+       Minimum learning rate. Default: 0.
+     last_call: int
+       The index of last call. Default: -1.
+
+     .. _SGDR\: Stochastic Gradient Descent with Warm Restarts:
+         https://arxiv.org/abs/1608.03983
+     """
+
+     def __init__(
+         self,
+         lr: float,
+         num_call_per_epoch: int,
+         T_0: int,
+         T_mult: int = 1,
+         eta_min: float = 0.,
+         last_epoch: int = -1,
+         last_call: int = -1
+     ):
+         super().__init__(lr=lr, last_call=last_call, last_epoch=last_epoch)
+         if T_0 <= 0 or not isinstance(T_0, int):
+             raise ValueError("Expected positive integer T_0, but got {}".format(T_0))
+         if T_mult < 1 or not isinstance(T_mult, int):
+             raise ValueError("Expected integer T_mult >= 1, but got {}".format(T_mult))
+
+         self.T_mult = T_mult
+         self.eta_min = eta_min
+         self.T_0 = T_0
+         self.num_call_per_epoch = num_call_per_epoch
+
+     def _cond1(self, epoch):
+         if self.T_mult == 1:
+             T_cur = epoch % self.T_0
+             T_i = self.T_0
+         else:
+             n = jnp.floor(jnp.log(epoch / self.T_0 * (self.T_mult - 1) + 1) / jnp.log(self.T_mult))
+             T_cur = epoch - self.T_0 * (self.T_mult ** n - 1) / (self.T_mult - 1)
+             T_i = self.T_0 * self.T_mult ** n
+         return T_cur, T_i
+
+     def _cond2(self, epoch):
+         return epoch, self.T_0
+
+     def __call__(self, i=None):
+         epoch = self.current_epoch(i)
+         T_cur, T_i = jax.lax.cond(epoch >= self.T_0, self._cond1, self._cond2, epoch)
+         return self.eta_min + (self.lr - self.eta_min) * (1 + jnp.cos(jnp.pi * T_cur / T_i)) / 2
+
+     def current_epoch(self, i=None):
+         i = (self.last_call.value + 1) if i is None else i
+         return jnp.floor(i / self.num_call_per_epoch)
+
+
+ class ExponentialLR(LearningRateScheduler):
+     """Decays the learning rate of each parameter group by gamma every epoch.
+     When last_epoch=-1, sets initial lr as lr.
+
+     Parameters
+     ----------
+     lr: float
+       Initial learning rate.
+     gamma: float
+       Multiplicative factor of learning rate decay.
+     last_epoch: int
+       The index of last epoch. Default: -1.
+     """
+
+     def __init__(self,
+                  lr: float,
+                  gamma: float,
+                  last_epoch: int = -1):
+         super(ExponentialLR, self).__init__(lr=lr, last_epoch=last_epoch)
+         assert 1. >= gamma >= 0, 'gamma should be in the range [0, 1].'
+         self.gamma = gamma
+
+     def __call__(self, i: int = None):
+         i = (self.last_epoch.value + 1) if i is None else i
+         return self.lr * self.gamma ** i
+
+
+ class ExponentialDecayLR(CallBasedLRScheduler):
+     def __init__(self, lr, decay_steps, decay_rate, last_epoch: int = -1, last_call: int = -1):
+         super().__init__(lr=lr, last_epoch=last_epoch, last_call=last_call)
+         self.decay_steps = decay_steps
+         self.decay_rate = decay_rate
+
+     def __call__(self, i=None):
+         i = (self.last_call.value + 1) if i is None else i
+         return self.lr * self.decay_rate ** (i / self.decay_steps)
+
+
+ class InverseTimeDecayLR(ExponentialDecayLR):
+     def __init__(self, lr, decay_steps, decay_rate, staircase=False,
+                  last_epoch: int = -1, last_call: int = -1):
+         super().__init__(lr, decay_steps, decay_rate, last_epoch=last_epoch, last_call=last_call)
+         self.staircase = staircase
+
+     def __call__(self, i=None):
+         i = (self.last_call.value + 1) if i is None else i
+         if self.staircase:
+             return self.lr / (1 + self.decay_rate * jnp.floor(i / self.decay_steps))
+         else:
+             return self.lr / (1 + self.decay_rate * i / self.decay_steps)
+
+
+ class PolynomialDecayLR(CallBasedLRScheduler):
+     def __init__(self, lr, decay_steps, final_lr, power=1.0, last_epoch: int = -1, last_call: int = -1):
+         super(PolynomialDecayLR, self).__init__(lr, last_epoch=last_epoch, last_call=last_call)
+         self.decay_steps = decay_steps
+         self.final_lr = final_lr
+         self.power = power
+
+     def __call__(self, i=None):
+         i = (self.last_call.value + 1) if i is None else i
+         i = jnp.minimum(i, self.decay_steps)
+         step_mult = (1 - i / self.decay_steps) ** self.power
+         return step_mult * (self.lr - self.final_lr) + self.final_lr
+
+
+ class PiecewiseConstantLR(CallBasedLRScheduler):
+     def __init__(self, boundaries, values, last_epoch: int = -1, last_call: int = -1):
+         super().__init__(0., last_epoch=last_epoch, last_call=last_call)
+
+         boundaries = jnp.array(boundaries)
+         values = jnp.array(values)
+         if not boundaries.ndim == values.ndim == 1:
+             raise ValueError("boundaries and values must be sequences")
+         if not boundaries.shape[0] == values.shape[0] - 1:
+             raise ValueError("boundaries length must be one shorter than values length")
+         self.boundaries = boundaries
+         self.values = values
+
+     def __call__(self, i=None):
+         i = (self.last_call.value + 1) if i is None else i
+         return self.values[jnp.sum(i > self.boundaries)]
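
The schedulers in the hunk above fall into two families: epoch-indexed schedulers whose counter advances through step_epoch() (StepLR, MultiStepLR, CosineAnnealingLR, ExponentialLR), and call-indexed schedulers built on CallBasedLRScheduler whose counter advances through step_call() (ExponentialDecayLR, InverseTimeDecayLR, PolynomialDecayLR, PiecewiseConstantLR, CosineAnnealingWarmRestarts). A minimal usage sketch for the epoch-indexed family follows; it assumes these classes are importable from brainstate.optim (they are defined in brainstate/optim/_lr_scheduler.py as shown above), and the 30-epoch loop is purely illustrative.

from brainstate.optim import StepLR

# Halve the learning rate every 10 epochs, starting from 0.1.
scheduler = StepLR(lr=0.1, step_size=10, gamma=0.5)

lrs = []
for epoch in range(30):
    lrs.append(float(scheduler()))  # lr * gamma ** (epoch // step_size)
    scheduler.step_epoch()          # advances the LongTermState last_epoch

# lrs is roughly [0.1] * 10 + [0.05] * 10 + [0.025] * 10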
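
For the call-indexed family the counter is meant to advance once per optimizer step rather than once per epoch, and an index can also be passed explicitly to bypass the internal counter. A sketch with ExponentialDecayLR, under the same brainstate.optim import assumption and with arbitrary step counts:

from brainstate.optim import ExponentialDecayLR

# lr * decay_rate ** (step / decay_steps): smooth exponential decay over steps.
scheduler = ExponentialDecayLR(lr=1e-2, decay_steps=1000, decay_rate=0.96)

for step in range(2000):
    lr_now = float(scheduler())  # uses last_call + 1 when no index is given
    # ... apply a gradient update with lr_now ...
    scheduler.step_call()        # advances the LongTermState last_call

lr_at_500 = float(scheduler(500))  # 1e-2 * 0.96 ** 0.5, independent of the counter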
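
CosineAnnealingWarmRestarts is also call-indexed, but it first converts the call count into a (possibly fractional) epoch via num_call_per_epoch and then applies the SGDR cosine formula, restarting every T_i epochs (T_0 at first, scaled by T_mult after each restart). A sketch assuming 100 batches per epoch and the same import assumption; the numbers are placeholders:

from brainstate.optim import CosineAnnealingWarmRestarts

scheduler = CosineAnnealingWarmRestarts(
    lr=0.1,                  # eta_max at the start of each restart period
    num_call_per_epoch=100,  # calls (batches) that make up one epoch
    T_0=10,                  # restart period of 10 epochs
    T_mult=1,                # default; keeps every restart period at 10 epochs
    eta_min=1e-4,            # floor of the cosine schedule
)

for step in range(5000):
    lr_now = float(scheduler())  # cosine-annealed between lr and eta_min
    scheduler.step_call()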
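
MultiStepLR and PiecewiseConstantLR both select a value by locating the current index among a set of boundaries, which is easy to check by passing explicit indices. The milestone and boundary numbers below are illustrative, and the same import assumption applies:

from brainstate.optim import MultiStepLR, PiecewiseConstantLR

multi = MultiStepLR(lr=1.0, milestones=[30, 80], gamma=0.1)
print(float(multi(10)))  # 1.0   -> before the first milestone
print(float(multi(50)))  # 0.1   -> past 30, before 80
print(float(multi(90)))  # 0.01  -> past both milestones

piecewise = PiecewiseConstantLR(boundaries=[100, 200], values=[1e-2, 1e-3, 1e-4])
print(float(piecewise(0)))    # 0.01
print(float(piecewise(150)))  # 0.001
print(float(piecewise(500)))  # 0.0001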