brainstate 0.1.10__py2.py3-none-any.whl → 0.2.0__py2.py3-none-any.whl

This diff shows the changes between publicly released versions of the package as they appear in their public registry. It is provided for informational purposes only.
Files changed (163)
  1. brainstate/__init__.py +130 -19
  2. brainstate/_compatible_import.py +201 -9
  3. brainstate/_compatible_import_test.py +681 -0
  4. brainstate/_deprecation.py +210 -0
  5. brainstate/_deprecation_test.py +2319 -0
  6. brainstate/{util/error.py → _error.py} +10 -20
  7. brainstate/_state.py +94 -47
  8. brainstate/_state_test.py +1 -1
  9. brainstate/_utils.py +1 -1
  10. brainstate/environ.py +1279 -347
  11. brainstate/environ_test.py +1187 -26
  12. brainstate/graph/__init__.py +6 -13
  13. brainstate/graph/_node.py +240 -0
  14. brainstate/graph/_node_test.py +589 -0
  15. brainstate/graph/{_graph_operation.py → _operation.py} +632 -746
  16. brainstate/graph/_operation_test.py +1147 -0
  17. brainstate/mixin.py +1209 -141
  18. brainstate/mixin_test.py +991 -51
  19. brainstate/nn/__init__.py +74 -72
  20. brainstate/nn/_activations.py +587 -295
  21. brainstate/nn/_activations_test.py +109 -86
  22. brainstate/nn/_collective_ops.py +393 -274
  23. brainstate/nn/_collective_ops_test.py +746 -15
  24. brainstate/nn/_common.py +114 -66
  25. brainstate/nn/_common_test.py +154 -0
  26. brainstate/nn/_conv.py +1652 -143
  27. brainstate/nn/_conv_test.py +838 -227
  28. brainstate/nn/_delay.py +15 -28
  29. brainstate/nn/_delay_test.py +25 -20
  30. brainstate/nn/_dropout.py +359 -167
  31. brainstate/nn/_dropout_test.py +429 -52
  32. brainstate/nn/_dynamics.py +14 -90
  33. brainstate/nn/_dynamics_test.py +1 -12
  34. brainstate/nn/_elementwise.py +492 -313
  35. brainstate/nn/_elementwise_test.py +806 -145
  36. brainstate/nn/_embedding.py +369 -19
  37. brainstate/nn/_embedding_test.py +156 -0
  38. brainstate/nn/{_fixedprob.py → _event_fixedprob.py} +10 -16
  39. brainstate/nn/{_fixedprob_test.py → _event_fixedprob_test.py} +6 -5
  40. brainstate/nn/{_linear_mv.py → _event_linear.py} +2 -2
  41. brainstate/nn/{_linear_mv_test.py → _event_linear_test.py} +6 -5
  42. brainstate/nn/_exp_euler.py +200 -38
  43. brainstate/nn/_exp_euler_test.py +350 -8
  44. brainstate/nn/_linear.py +391 -71
  45. brainstate/nn/_linear_test.py +427 -59
  46. brainstate/nn/_metrics.py +1070 -0
  47. brainstate/nn/_metrics_test.py +611 -0
  48. brainstate/nn/_module.py +10 -3
  49. brainstate/nn/_module_test.py +1 -1
  50. brainstate/nn/_normalizations.py +688 -329
  51. brainstate/nn/_normalizations_test.py +663 -37
  52. brainstate/nn/_paddings.py +1020 -0
  53. brainstate/nn/_paddings_test.py +723 -0
  54. brainstate/nn/_poolings.py +1404 -342
  55. brainstate/nn/_poolings_test.py +828 -92
  56. brainstate/nn/{_rate_rnns.py → _rnns.py} +446 -54
  57. brainstate/nn/_rnns_test.py +593 -0
  58. brainstate/nn/_utils.py +132 -5
  59. brainstate/nn/_utils_test.py +402 -0
  60. brainstate/{init/_random_inits.py → nn/init.py} +301 -45
  61. brainstate/{init/_random_inits_test.py → nn/init_test.py} +51 -20
  62. brainstate/random/__init__.py +247 -1
  63. brainstate/random/_rand_funs.py +668 -346
  64. brainstate/random/_rand_funs_test.py +74 -1
  65. brainstate/random/_rand_seed.py +541 -76
  66. brainstate/random/_rand_seed_test.py +1 -1
  67. brainstate/random/_rand_state.py +601 -393
  68. brainstate/random/_rand_state_test.py +551 -0
  69. brainstate/transform/__init__.py +59 -0
  70. brainstate/transform/_ad_checkpoint.py +176 -0
  71. brainstate/{compile → transform}/_ad_checkpoint_test.py +1 -1
  72. brainstate/{augment → transform}/_autograd.py +360 -113
  73. brainstate/{augment → transform}/_autograd_test.py +2 -2
  74. brainstate/transform/_conditions.py +316 -0
  75. brainstate/{compile → transform}/_conditions_test.py +11 -11
  76. brainstate/{compile → transform}/_error_if.py +22 -20
  77. brainstate/{compile → transform}/_error_if_test.py +1 -1
  78. brainstate/transform/_eval_shape.py +145 -0
  79. brainstate/{augment → transform}/_eval_shape_test.py +1 -1
  80. brainstate/{compile → transform}/_jit.py +99 -46
  81. brainstate/{compile → transform}/_jit_test.py +3 -3
  82. brainstate/{compile → transform}/_loop_collect_return.py +219 -80
  83. brainstate/{compile → transform}/_loop_collect_return_test.py +1 -1
  84. brainstate/{compile → transform}/_loop_no_collection.py +133 -34
  85. brainstate/{compile → transform}/_loop_no_collection_test.py +2 -2
  86. brainstate/transform/_make_jaxpr.py +2016 -0
  87. brainstate/transform/_make_jaxpr_test.py +1510 -0
  88. brainstate/transform/_mapping.py +529 -0
  89. brainstate/transform/_mapping_test.py +194 -0
  90. brainstate/{compile → transform}/_progress_bar.py +78 -25
  91. brainstate/{augment → transform}/_random.py +65 -45
  92. brainstate/{compile → transform}/_unvmap.py +102 -5
  93. brainstate/transform/_util.py +286 -0
  94. brainstate/typing.py +594 -61
  95. brainstate/typing_test.py +780 -0
  96. brainstate/util/__init__.py +9 -32
  97. brainstate/util/_others.py +1025 -0
  98. brainstate/util/_others_test.py +962 -0
  99. brainstate/util/_pretty_pytree.py +1301 -0
  100. brainstate/util/_pretty_pytree_test.py +675 -0
  101. brainstate/util/{pretty_repr.py → _pretty_repr.py} +161 -27
  102. brainstate/util/_pretty_repr_test.py +696 -0
  103. brainstate/util/filter.py +557 -81
  104. brainstate/util/filter_test.py +912 -0
  105. brainstate/util/struct.py +769 -382
  106. brainstate/util/struct_test.py +602 -0
  107. {brainstate-0.1.10.dist-info → brainstate-0.2.0.dist-info}/METADATA +34 -17
  108. brainstate-0.2.0.dist-info/RECORD +111 -0
  109. brainstate/augment/__init__.py +0 -30
  110. brainstate/augment/_eval_shape.py +0 -99
  111. brainstate/augment/_mapping.py +0 -1060
  112. brainstate/augment/_mapping_test.py +0 -597
  113. brainstate/compile/__init__.py +0 -38
  114. brainstate/compile/_ad_checkpoint.py +0 -204
  115. brainstate/compile/_conditions.py +0 -256
  116. brainstate/compile/_make_jaxpr.py +0 -888
  117. brainstate/compile/_make_jaxpr_test.py +0 -156
  118. brainstate/compile/_util.py +0 -147
  119. brainstate/functional/__init__.py +0 -27
  120. brainstate/graph/_graph_node.py +0 -244
  121. brainstate/graph/_graph_node_test.py +0 -73
  122. brainstate/graph/_graph_operation_test.py +0 -563
  123. brainstate/init/__init__.py +0 -26
  124. brainstate/init/_base.py +0 -52
  125. brainstate/init/_generic.py +0 -244
  126. brainstate/init/_regular_inits.py +0 -105
  127. brainstate/init/_regular_inits_test.py +0 -50
  128. brainstate/nn/_inputs.py +0 -608
  129. brainstate/nn/_ltp.py +0 -28
  130. brainstate/nn/_neuron.py +0 -705
  131. brainstate/nn/_neuron_test.py +0 -161
  132. brainstate/nn/_others.py +0 -46
  133. brainstate/nn/_projection.py +0 -486
  134. brainstate/nn/_rate_rnns_test.py +0 -63
  135. brainstate/nn/_readout.py +0 -209
  136. brainstate/nn/_readout_test.py +0 -53
  137. brainstate/nn/_stp.py +0 -236
  138. brainstate/nn/_synapse.py +0 -505
  139. brainstate/nn/_synapse_test.py +0 -131
  140. brainstate/nn/_synaptic_projection.py +0 -423
  141. brainstate/nn/_synouts.py +0 -162
  142. brainstate/nn/_synouts_test.py +0 -57
  143. brainstate/nn/metrics.py +0 -388
  144. brainstate/optim/__init__.py +0 -38
  145. brainstate/optim/_base.py +0 -64
  146. brainstate/optim/_lr_scheduler.py +0 -448
  147. brainstate/optim/_lr_scheduler_test.py +0 -50
  148. brainstate/optim/_optax_optimizer.py +0 -152
  149. brainstate/optim/_optax_optimizer_test.py +0 -53
  150. brainstate/optim/_sgd_optimizer.py +0 -1104
  151. brainstate/random/_random_for_unit.py +0 -52
  152. brainstate/surrogate.py +0 -1957
  153. brainstate/transform.py +0 -23
  154. brainstate/util/caller.py +0 -98
  155. brainstate/util/others.py +0 -540
  156. brainstate/util/pretty_pytree.py +0 -945
  157. brainstate/util/pretty_pytree_test.py +0 -159
  158. brainstate/util/pretty_table.py +0 -2954
  159. brainstate/util/scaling.py +0 -258
  160. brainstate-0.1.10.dist-info/RECORD +0 -130
  161. {brainstate-0.1.10.dist-info → brainstate-0.2.0.dist-info}/WHEEL +0 -0
  162. {brainstate-0.1.10.dist-info → brainstate-0.2.0.dist-info}/licenses/LICENSE +0 -0
  163. {brainstate-0.1.10.dist-info → brainstate-0.2.0.dist-info}/top_level.txt +0 -0
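Taken together, the renamed paths above suggest that the former brainstate.compile and brainstate.augment namespaces were consolidated into a single brainstate.transform package, while brainstate.optim, brainstate.init, brainstate.functional, and brainstate.surrogate were dropped from the wheel. A minimal migration sketch under that assumption (the exact public names re-exported by brainstate.transform in 0.2.0 are not confirmed by this listing, so treat the new paths as hypothetical):

import brainstate

def loss_fn():
    ...  # some scalar loss closed over model states

# 0.1.x entry points, as used by the removed test files shown below:
#     jitted = brainstate.compile.jit(loss_fn)
#     grads = brainstate.augment.grad(loss_fn, params)()
# Assumed 0.2.0 equivalents, following the {compile -> transform} and
# {augment -> transform} path renames in this diff:
jitted = brainstate.transform.jit(loss_fn)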
brainstate/optim/_lr_scheduler.py
@@ -1,448 +0,0 @@
- # Copyright 2024 BDP Ecosystem Limited. All Rights Reserved.
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- #     http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- # ==============================================================================
-
- # -*- coding: utf-8 -*-
-
- from typing import Sequence, Union
-
- import jax
- import jax.numpy as jnp
- import numpy as np
-
- from brainstate import environ
- from brainstate._state import State, LongTermState
- from brainstate.graph import Node
-
- __all__ = [
-     'LearningRateScheduler',
-     'ConstantLR',
-     'StepLR',
-     'MultiStepLR',
-     'CosineAnnealingLR',
-     'CosineAnnealingWarmRestarts',
-     'ExponentialLR',
-     'ExponentialDecayLR',
-     'InverseTimeDecayLR',
-     'PolynomialDecayLR',
-     'PiecewiseConstantLR',
- ]
-
-
- # learning rate schedules #
- # ----------------------- #
-
-
- def make_schedule(scalar_or_schedule):
-     if isinstance(scalar_or_schedule, LearningRateScheduler):
-         return scalar_or_schedule
-     elif isinstance(scalar_or_schedule, (int, float, State)):
-         return ConstantLR(scalar_or_schedule)
-     else:
-         raise TypeError(type(scalar_or_schedule))
-
-
- class LearningRateScheduler(Node):
-     """
-     The learning rate scheduler.
-
-     Parameters
-     ----------
-     lr: float, State
-         The learning rate.
-     last_epoch: int
-         The index of last epoch.
-
-     """
-
-     def __init__(self, lr: Union[float, State], last_epoch: int = -1):
-         super().__init__()
-         if isinstance(lr, State):
-             lr.value = jnp.asarray(lr.value, dtype=environ.dftype())
-         else:
-             lr = jnp.asarray(lr, dtype=environ.dftype())
-         self._lr = lr
-         assert last_epoch >= -1, 'last_epoch should be greater than -1.'
-         self.last_epoch = LongTermState(jnp.asarray(last_epoch, dtype=environ.ditype()))
-
-     @property
-     def lr(self):
-         return self._lr.value if isinstance(self._lr, State) else self._lr
-
-     @lr.setter
-     def lr(self, value):
-         if isinstance(value, State):
-             value = value.value
-         assert jnp.ndim(value) == 0, 'The learning rate should be a scalar.'
-         if isinstance(self._lr, State):
-             self._lr.value = value
-         else:
-             self._lr = value
-
-     def step_epoch(self):
-         """
-         Update the epoch count.
-         """
-         self.last_epoch.value += 1
-
-     def step_call(self):
-         """
-         Update the call count.
-         """
-         pass
-
-     def __call__(self, i=None):
-         raise NotImplementedError
-
-
- class ConstantLR(LearningRateScheduler):
-     """
-     Constant learning rate scheduler.
-     """
-
-     def __call__(self, i=None):
-         return self.lr
-
-
- class CallBasedLRScheduler(LearningRateScheduler):
-     """
-     The learning rate scheduler based on the call count.
-
-     Parameters
-     ----------
-     lr: float
-         The learning rate.
-     last_epoch: int
-         The index of last epoch.
-     last_call: int
-         The index of last call.
-
-     """
-
-     def __init__(self, lr: Union[float, State], last_epoch: int = -1, last_call: int = -1):
-         super().__init__(lr=lr, last_epoch=last_epoch)
-
-         assert last_call >= -1, 'last_call should be greater than -1.'
-         self.last_call = LongTermState(jnp.asarray(last_call, dtype=environ.ditype()))
-
-     def step_call(self):
-         """
-         Update the call count.
-         """
-         self.last_call.value += 1
-
-
- class StepLR(LearningRateScheduler):
-     """Decays the learning rate of each parameter group by gamma every
-     `step_size` epochs.
-
-     Parameters
-     ----------
-     lr: float
-         Initial learning rate.
-     step_size: int
-         Period of learning rate decay.
-     gamma: float
-         Multiplicative factor of learning rate decay.
-         Default: 0.1.
-     last_epoch: int
-         The index of last epoch. Default: -1.
-     """
-
-     def __init__(
-         self,
-         lr: float,
-         step_size: int,
-         gamma: float = 0.1,
-         last_epoch: int = -1
-     ):
-         super().__init__(lr=lr, last_epoch=last_epoch)
-
-         assert step_size >= 1, 'step_size should be greater than or equal to 1.'
-         assert 1. >= gamma >= 0, 'gamma should be in the range [0, 1].'
-         self.step_size = step_size
-         self.gamma = gamma
-
-     def __call__(self, i=None):
-         i = (self.last_epoch.value + 1) if i is None else i
-         return self.lr * self.gamma ** (jnp.floor_divide(i, self.step_size))
-
-
- class MultiStepLR(LearningRateScheduler):
-     """Decays the learning rate of each parameter group by gamma once the
-     number of epoch reaches one of the milestones. Notice that such decay can
-     happen simultaneously with other changes to the learning rate from outside
-     this scheduler. When last_epoch=-1, sets initial lr as lr.
-
-     Parameters
-     ----------
-     lr: float
-         Initial learning rate.
-     milestones: sequence of int
-         List of epoch indices. Must be increasing.
-     gamma: float
-         Multiplicative factor of learning rate decay.
-         Default: 0.1.
-     last_epoch: int
-         The index of last epoch. Default: -1.
-     """
-
-     def __init__(
-         self,
-         lr: float,
-         milestones: Sequence[int],
-         gamma: float = 0.1,
-         last_epoch: int = -1
-     ):
-         super().__init__(lr=lr, last_epoch=last_epoch)
-
-         assert len(milestones) > 0, 'milestones should be a non-empty sequence.'
-         assert all([milestones[i] < milestones[i + 1] for i in range(len(milestones) - 1)]), (
-             'milestones should be a sequence of increasing integers.'
-         )
-         assert 1. >= gamma >= 0, 'gamma should be in the range [0, 1].'
-         self.milestones = jnp.asarray((-1,) + tuple(milestones) + (np.iinfo(np.int32).max,), dtype=environ.ditype())
-         self.gamma = gamma
-
-     def __call__(self, i=None):
-         i = (self.last_epoch.value + 1) if i is None else i
-         conditions = jnp.logical_and((i >= self.milestones[:-1]), (i < self.milestones[1:]))
-         p = jnp.argmax(conditions)
-         return self.lr * self.gamma ** p
-
-
- class CosineAnnealingLR(LearningRateScheduler):
-     r"""Set the learning rate of each parameter group using a cosine annealing
-     schedule, where :math:`\eta_{max}` is set to the initial lr and
-     :math:`T_{cur}` is the number of epochs since the last restart in SGDR:
-
-     .. math::
-         \begin{aligned}
-             \eta_t & = \eta_{min} + \frac{1}{2}(\eta_{max} - \eta_{min})\left(1
-             + \cos\left(\frac{T_{cur}}{T_{max}}\pi\right)\right),
-             & T_{cur} \neq (2k+1)T_{max}; \\
-             \eta_{t+1} & = \eta_{t} + \frac{1}{2}(\eta_{max} - \eta_{min})
-             \left(1 - \cos\left(\frac{1}{T_{max}}\pi\right)\right),
-             & T_{cur} = (2k+1)T_{max}.
-         \end{aligned}
-
-     When last_epoch=-1, sets initial lr as lr. Notice that because the schedule
-     is defined recursively, the learning rate can be simultaneously modified
-     outside this scheduler by other operators. If the learning rate is set
-     solely by this scheduler, the learning rate at each step becomes:
-
-     .. math::
-         \eta_t = \eta_{min} + \frac{1}{2}(\eta_{max} - \eta_{min})\left(1 +
-         \cos\left(\frac{T_{cur}}{T_{max}}\pi\right)\right)
-
-     It has been proposed in
-     `SGDR: Stochastic Gradient Descent with Warm Restarts`_. Note that this only
-     implements the cosine annealing part of SGDR, and not the restarts.
-
-     Parameters
-     ----------
-     lr: float
-         Initial learning rate.
-     T_max: int
-         Maximum number of iterations.
-     eta_min: float
-         Minimum learning rate. Default: 0.
-     last_epoch: int
-         The index of last epoch. Default: -1.
-
-     .. _SGDR\: Stochastic Gradient Descent with Warm Restarts:
-         https://arxiv.org/abs/1608.03983
-     """
-
-     def __init__(
-         self,
-         lr: float,
-         T_max: int,
-         eta_min: float = 0.,
-         last_epoch: int = -1,
-     ):
-         super().__init__(lr=lr, last_epoch=last_epoch)
-
-         assert T_max >= 1, 'T_max should be greater than or equal to 1.'
-         self._init_epoch = last_epoch
-         self.T_max = T_max
-         self.eta_min = eta_min
-
-     def __call__(self, i=None):
-         i = (self.last_epoch.value + 1) if i is None else i
-         return self.eta_min + (self.lr - self.eta_min) * (1 + jnp.cos(jnp.pi * i / self.T_max)) / 2
-
-
- class CosineAnnealingWarmRestarts(CallBasedLRScheduler):
-     r"""Set the learning rate of each parameter group using a cosine annealing
-     schedule, where :math:`\eta_{max}` is set to the initial lr, :math:`T_{cur}`
-     is the number of epochs since the last restart and :math:`T_{i}` is the number
-     of epochs between two warm restarts in SGDR:
-
-     .. math::
-         \eta_t = \eta_{min} + \frac{1}{2}(\eta_{max} - \eta_{min})\left(1 +
-         \cos\left(\frac{T_{cur}}{T_{i}}\pi\right)\right)
-
-     When :math:`T_{cur}=T_{i}`, set :math:`\eta_t = \eta_{min}`.
-     When :math:`T_{cur}=0` after restart, set :math:`\eta_t=\eta_{max}`.
-
-     It has been proposed in
-     `SGDR: Stochastic Gradient Descent with Warm Restarts`_.
-
-     Parameters
-     ----------
-     lr: float
-         Initial learning rate.
-     num_call_per_epoch: int
-         The number the scheduler to call in each epoch.
-         This usually means the number of batch in each epoch training.
-     T_0: int
-         Number of iterations for the first restart.
-     T_mult: int
-         A factor increases :math:`T_{i}` after a restart. Default: 1.
-     eta_min: float
-         Minimum learning rate. Default: 0.
-     last_call: int
-         The index of last call. Default: -1.
-
-     .. _SGDR\: Stochastic Gradient Descent with Warm Restarts:
-         https://arxiv.org/abs/1608.03983
-     """
-
-     def __init__(
-         self,
-         lr: float,
-         num_call_per_epoch: int,
-         T_0: int,
-         T_mult: int = 1,
-         eta_min: float = 0.,
-         last_epoch: int = -1,
-         last_call: int = -1
-     ):
-         super().__init__(lr=lr, last_call=last_call, last_epoch=last_epoch)
-         if T_0 <= 0 or not isinstance(T_0, int):
-             raise ValueError("Expected positive integer T_0, but got {}".format(T_0))
-         if T_mult < 1 or not isinstance(T_mult, int):
-             raise ValueError("Expected integer T_mult >= 1, but got {}".format(T_mult))
-
-         self.T_mult = T_mult
-         self.eta_min = eta_min
-         self.T_0 = T_0
-         self.num_call_per_epoch = num_call_per_epoch
-
-     def _cond1(self, epoch):
-         if self.T_mult == 1:
-             T_cur = epoch % self.T_0
-             T_i = self.T_0
-         else:
-             n = jnp.floor(jnp.log(epoch / self.T_0 * (self.T_mult - 1) + 1) / jnp.log(self.T_mult))
-             T_cur = epoch - self.T_0 * (self.T_mult ** n - 1) / (self.T_mult - 1)
-             T_i = self.T_0 * self.T_mult ** n
-         return T_cur, T_i
-
-     def _cond2(self, epoch):
-         return epoch, self.T_0
-
-     def __call__(self, i=None):
-         epoch = self.current_epoch(i)
-         T_cur, T_i = jax.lax.cond(epoch >= self.T_0, self._cond1, self._cond2, epoch)
-         return self.eta_min + (self.lr - self.eta_min) * (1 + jnp.cos(jnp.pi * T_cur / T_i)) / 2
-
-     def current_epoch(self, i=None):
-         i = (self.last_call.value + 1) if i is None else i
-         return jnp.floor(i / self.num_call_per_epoch)
-
-
- class ExponentialLR(LearningRateScheduler):
-     """Decays the learning rate of each parameter group by gamma every epoch.
-     When last_epoch=-1, sets initial lr as lr.
-
-     Parameters
-     ----------
-     lr: float
-         Initial learning rate.
-     gamma: float
-         Multiplicative factor of learning rate decay.
-     last_epoch: int
-         The index of last epoch. Default: -1.
-     """
-
-     def __init__(self,
-                  lr: float,
-                  gamma: float,
-                  last_epoch: int = -1):
-         super(ExponentialLR, self).__init__(lr=lr, last_epoch=last_epoch)
-         assert 1. >= gamma >= 0, 'gamma should be in the range [0, 1].'
-         self.gamma = gamma
-
-     def __call__(self, i: int = None):
-         i = (self.last_epoch.value + 1) if i is None else i
-         return self.lr * self.gamma ** i
-
-
- class ExponentialDecayLR(CallBasedLRScheduler):
-     def __init__(self, lr, decay_steps, decay_rate, last_epoch: int = -1, last_call: int = -1):
-         super().__init__(lr=lr, last_epoch=last_epoch, last_call=last_call)
-         self.decay_steps = decay_steps
-         self.decay_rate = decay_rate
-
-     def __call__(self, i=None):
-         i = (self.last_call.value + 1) if i is None else i
-         return self.lr * self.decay_rate ** (i / self.decay_steps)
-
-
- class InverseTimeDecayLR(ExponentialDecayLR):
-     def __init__(self, lr, decay_steps, decay_rate, staircase=False,
-                  last_epoch: int = -1, last_call: int = -1):
-         super().__init__(lr, decay_steps, decay_rate, last_epoch=last_epoch, last_call=last_call)
-         self.staircase = staircase
-
-     def __call__(self, i=None):
-         i = (self.last_call.value + 1) if i is None else i
-         if self.staircase:
-             return self.lr / (1 + self.decay_rate * jnp.floor(i / self.decay_steps))
-         else:
-             return self.lr / (1 + self.decay_rate * i / self.decay_steps)
-
-
- class PolynomialDecayLR(CallBasedLRScheduler):
-     def __init__(self, lr, decay_steps, final_lr, power=1.0, last_epoch: int = -1, last_call: int = -1):
-         super(PolynomialDecayLR, self).__init__(lr, last_epoch=last_epoch, last_call=last_call)
-         self.decay_steps = decay_steps
-         self.final_lr = final_lr
-         self.power = power
-
-     def __call__(self, i=None):
-         i = (self.last_call.value + 1) if i is None else i
-         i = jnp.minimum(i, self.decay_steps)
-         step_mult = (1 - i / self.decay_steps) ** self.power
-         return step_mult * (self.lr - self.final_lr) + self.final_lr
-
-
- class PiecewiseConstantLR(CallBasedLRScheduler):
-     def __init__(self, boundaries, values, last_epoch: int = -1, last_call: int = -1):
-         super().__init__(0., last_epoch=last_epoch, last_call=last_call)
-
-         boundaries = jnp.array(boundaries)
-         values = jnp.array(values)
-         if not boundaries.ndim == values.ndim == 1:
-             raise ValueError("boundaries and values must be sequences")
-         if not boundaries.shape[0] == values.shape[0] - 1:
-             raise ValueError("boundaries length must be one shorter than values length")
-         self.boundaries = boundaries
-         self.values = values
-
-     def __call__(self, i=None):
-         i = (self.last_call.value + 1) if i is None else i
-         return self.values[jnp.sum(i > self.boundaries)]
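The milestone lookup in the removed MultiStepLR above encodes the piecewise decay as an argmax over half-open intervals bounded by (-1, milestones..., int32 max). The same rule can be stated more directly as "count the milestones already passed"; a small standalone sketch assuming only jax.numpy (names are illustrative, not part of the package):

import jax.numpy as jnp

def multi_step_lr(i, base_lr=0.1, milestones=(10, 20, 30), gamma=0.1):
    # Number of milestones the epoch index i has reached or passed;
    # the rate decays by a factor of gamma at each milestone.
    n_passed = jnp.sum(i >= jnp.asarray(milestones))
    return base_lr * gamma ** n_passed

# multi_step_lr(5) -> 0.1, multi_step_lr(15) -> 0.01, multi_step_lr(35) -> 0.0001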
brainstate/optim/_lr_scheduler_test.py
@@ -1,50 +0,0 @@
- # Copyright 2024 BDP Ecosystem Limited. All Rights Reserved.
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- #     http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- # ==============================================================================
-
- from __future__ import annotations
-
- import unittest
-
- import jax.numpy as jnp
-
- import brainstate
-
-
- class TestMultiStepLR(unittest.TestCase):
-     def test1(self):
-         lr = brainstate.optim.MultiStepLR(0.1, [10, 20, 30], gamma=0.1)
-         for i in range(40):
-             r = lr(i)
-             if i < 10:
-                 self.assertEqual(r, 0.1)
-             elif i < 20:
-                 self.assertTrue(jnp.allclose(r, 0.01))
-             elif i < 30:
-                 self.assertTrue(jnp.allclose(r, 0.001))
-             else:
-                 self.assertTrue(jnp.allclose(r, 0.0001))
-
-     def test2(self):
-         lr = brainstate.compile.jit(brainstate.optim.MultiStepLR(0.1, [10, 20, 30], gamma=0.1))
-         for i in range(40):
-             r = lr(i)
-             if i < 10:
-                 self.assertEqual(r, 0.1)
-             elif i < 20:
-                 self.assertTrue(jnp.allclose(r, 0.01))
-             elif i < 30:
-                 self.assertTrue(jnp.allclose(r, 0.001))
-             else:
-                 self.assertTrue(jnp.allclose(r, 0.0001))
brainstate/optim/_optax_optimizer.py
@@ -1,152 +0,0 @@
- # Copyright 2024 BDP Ecosystem Limited. All Rights Reserved.
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- #     http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- # ==============================================================================
-
-
- import importlib.util
- from typing import Hashable, Dict, Optional
-
- from brainstate._state import ShortTermState, State, StateDictManager
- from brainstate.typing import PyTree
- from ._base import Optimizer
-
- optax_installed = importlib.util.find_spec('optax') is not None
-
- __all__ = [
-     'OptaxOptimizer',
-     'LBFGS',
- ]
-
-
- class OptaxOptimizer(Optimizer):
-     """Simple train state for the common case with a single Optax optimizer.
-
-     Example usage::
-
-         >>> import jax
-         >>> import jax.numpy as jnp
-         >>> import brainstate as brainstate
-         >>> import optax
-         ...
-         >>> class Model(brainstate.nn.Module):
-         ...     def __init__(self):
-         ...         super().__init__()
-         ...         self.linear1 = brainstate.nn.Linear(2, 3)
-         ...         self.linear2 = brainstate.nn.Linear(3, 4)
-         ...     def __call__(self, x):
-         ...         return self.linear2(self.linear1(x))
-         ...
-         >>> x = brainstate.random.randn(1, 2)
-         >>> y = jnp.ones((1, 4))
-         ...
-         >>> model = Model()
-         >>> tx = optax.adam(1e-3)
-         >>> optimizer = brainstate.optim.OptaxOptimizer(tx)
-         >>> optimizer.register_trainable_weights(model.states(brainstate.ParamState))
-         ...
-         >>> loss_fn = lambda: ((model(x) - y) ** 2).mean()
-         >>> loss_fn()
-         Array(1.7055722, dtype=float32)
-         >>> grads = brainstate.augment.grad(loss_fn, model.states(brainstate.ParamState))()
-         >>> optimizer.update(grads)
-         >>> loss_fn()
-         Array(1.6925814, dtype=float32)
-
-     For more exotic usecases (e.g. multiple optimizers) it's probably best to
-     fork the class and modify it.
-
-     Attributes:
-         param_states: The parameter states to update.
-         tx: An Optax gradient transformation.
-     """
-
-     param_states: StateDictManager
-     opt_state: Optional[ShortTermState]
-
-     def __init__(
-         self,
-         tx: 'optax.GradientTransformation',
-     ):
-         """
-         Instantiate the class and wrap the :class:`FlattedDict` and Optax gradient
-         transformation. Instantiate the optimizer state to keep track of
-         :class:`State`.
-
-         Args:
-             tx: An Optax gradient transformation.
-         """
-         super().__init__()
-
-         # tx must be an instance of optax.GradientTransformation
-         import optax  # type: ignore[import-not-found,import-untyped]
-         if not isinstance(tx, optax.GradientTransformation):
-             raise TypeError(f"tx must be an instance of optax.GradientTransformation, got {tx}")
-         self.tx = tx
-
-         # optimizer state
-         self.opt_state = None
-
-     def register_trainable_weights(self, param_states: Dict[Hashable, State]):
-         # model
-         if not isinstance(param_states, dict):
-             raise TypeError(f"states must be a dict, got {param_states}")
-         for k, v in param_states.items():
-             if not isinstance(v, State):
-                 raise TypeError(f"states values must be ParamState, got {v}")
-         self.param_states.update(param_states)
-         self.param_states.unique_()
-
-         # wrt
-         self.opt_state = ShortTermState(self.tx.init({k: v.value for k, v in self.param_states.items()}))
-         return self
-
-     def update(self, grads: Dict[Hashable, PyTree]):
-         """Update the model states with the gradients.
-
-         Args:
-             grads: the gradients derived from ``brainstate.augment.grad``.
-         """
-         if self.opt_state is None:
-             raise ValueError("register_trainable_weights must be called before update.")
-
-         import optax  # type: ignore[import-not-found,import-untyped]
-         grads = {k: grads[k] for k in self.param_states.keys()}
-         states = {k: v.value for k, v in self.param_states.items()}
-
-         # compute updates
-         updates, new_opt_state = self.tx.update(grads, self.opt_state.value, states)
-         new_params = optax.apply_updates(states, updates)
-
-         # update model states and optimizer states
-         for k, v in self.param_states.items():
-             v.value = new_params[k]
-         self.opt_state.value = new_opt_state
-
-
- class LBFGS(OptaxOptimizer):
-     def __init__(
-         self,
-         lr: float,
-         memory_size: int = 10,
-         scale_init_precond: bool = True,
-     ):
-         import optax  # type: ignore[import-not-found,import-untyped]
-         super().__init__(
-             optax.lbfgs(
-                 lr,
-                 memory_size=memory_size,
-                 scale_init_precond=scale_init_precond,
-                 linesearch=None,
-             )
-         )
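The removed OptaxOptimizer above is essentially a thin wrapper that stores the optax optimizer state in a ShortTermState and the parameters in State objects. For reference, the underlying optax pattern it wraps (init, update, apply_updates) looks like this in plain optax, shown as a sketch with an illustrative parameter pytree:

import jax
import jax.numpy as jnp
import optax

params = {'w': jnp.zeros((3,)), 'b': jnp.zeros(())}

def loss_fn(p):
    return jnp.sum((p['w'] + p['b']) ** 2)

tx = optax.adam(1e-3)
opt_state = tx.init(params)                                 # roughly what register_trainable_weights sets up

grads = jax.grad(loss_fn)(params)
updates, opt_state = tx.update(grads, opt_state, params)    # the core of update()
params = optax.apply_updates(params, updates)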
brainstate/optim/_optax_optimizer_test.py
@@ -1,53 +0,0 @@
- # Copyright 2024 BDP Ecosystem Limited. All Rights Reserved.
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- #     http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- # ==============================================================================
-
-
- import unittest
-
- import jax
- import optax
-
- import brainstate
-
-
- class TestOptaxOptimizer(unittest.TestCase):
-     def test1(self):
-         class Model(brainstate.nn.Module):
-             def __init__(self):
-                 super().__init__()
-                 self.linear1 = brainstate.nn.Linear(2, 3)
-                 self.linear2 = brainstate.nn.Linear(3, 4)
-
-             def __call__(self, x):
-                 return self.linear2(self.linear1(x))
-
-         x = brainstate.random.randn(1, 2)
-         y = jax.numpy.ones((1, 4))
-
-         model = Model()
-         tx = optax.adam(1e-3)
-         optimizer = brainstate.optim.OptaxOptimizer(tx)
-         optimizer.register_trainable_weights(model.states(brainstate.ParamState))
-
-         loss_fn = lambda: ((model(x) - y) ** 2).mean()
-         prev_loss = loss_fn()
-
-         grads = brainstate.augment.grad(loss_fn, model.states(brainstate.ParamState))()
-         optimizer.update(grads)
-
-         new_loss = loss_fn()
-
-         print(new_loss, prev_loss)
-         self.assertLess(new_loss, prev_loss)