torchzero 0.4.0__py3-none-any.whl → 0.4.1__py3-none-any.whl
- tests/test_identical.py +22 -22
- tests/test_opts.py +199 -198
- torchzero/__init__.py +1 -1
- torchzero/core/__init__.py +1 -1
- torchzero/core/functional.py +1 -1
- torchzero/core/modular.py +5 -5
- torchzero/core/module.py +2 -2
- torchzero/core/objective.py +10 -10
- torchzero/core/transform.py +1 -1
- torchzero/linalg/__init__.py +3 -2
- torchzero/linalg/eigh.py +223 -4
- torchzero/linalg/orthogonalize.py +2 -4
- torchzero/linalg/qr.py +12 -0
- torchzero/linalg/solve.py +1 -3
- torchzero/linalg/svd.py +47 -20
- torchzero/modules/__init__.py +4 -3
- torchzero/modules/adaptive/__init__.py +11 -3
- torchzero/modules/adaptive/adagrad.py +10 -10
- torchzero/modules/adaptive/adahessian.py +2 -2
- torchzero/modules/adaptive/adam.py +1 -1
- torchzero/modules/adaptive/adan.py +1 -1
- torchzero/modules/adaptive/adaptive_heavyball.py +1 -1
- torchzero/modules/adaptive/esgd.py +2 -2
- torchzero/modules/adaptive/ggt.py +186 -0
- torchzero/modules/adaptive/lion.py +2 -1
- torchzero/modules/adaptive/lre_optimizers.py +299 -0
- torchzero/modules/adaptive/mars.py +2 -2
- torchzero/modules/adaptive/matrix_momentum.py +1 -1
- torchzero/modules/adaptive/msam.py +4 -4
- torchzero/modules/adaptive/muon.py +9 -6
- torchzero/modules/adaptive/natural_gradient.py +32 -15
- torchzero/modules/adaptive/psgd/__init__.py +5 -0
- torchzero/modules/adaptive/psgd/_psgd_utils.py +37 -0
- torchzero/modules/adaptive/psgd/psgd.py +1390 -0
- torchzero/modules/adaptive/psgd/psgd_dense_newton.py +174 -0
- torchzero/modules/adaptive/psgd/psgd_kron_newton.py +203 -0
- torchzero/modules/adaptive/psgd/psgd_kron_whiten.py +185 -0
- torchzero/modules/adaptive/psgd/psgd_lra_newton.py +118 -0
- torchzero/modules/adaptive/psgd/psgd_lra_whiten.py +116 -0
- torchzero/modules/adaptive/rprop.py +2 -2
- torchzero/modules/adaptive/sam.py +4 -4
- torchzero/modules/adaptive/shampoo.py +28 -3
- torchzero/modules/adaptive/soap.py +3 -3
- torchzero/modules/adaptive/sophia_h.py +2 -2
- torchzero/modules/clipping/clipping.py +7 -7
- torchzero/modules/conjugate_gradient/cg.py +2 -2
- torchzero/modules/experimental/__init__.py +5 -0
- torchzero/modules/experimental/adanystrom.py +258 -0
- torchzero/modules/experimental/common_directions_whiten.py +142 -0
- torchzero/modules/experimental/cubic_adam.py +160 -0
- torchzero/modules/experimental/eigen_sr1.py +182 -0
- torchzero/modules/experimental/eigengrad.py +207 -0
- torchzero/modules/experimental/l_infinity.py +1 -1
- torchzero/modules/experimental/matrix_nag.py +122 -0
- torchzero/modules/experimental/newton_solver.py +2 -2
- torchzero/modules/experimental/newtonnewton.py +34 -40
- torchzero/modules/grad_approximation/fdm.py +2 -2
- torchzero/modules/grad_approximation/rfdm.py +4 -4
- torchzero/modules/least_squares/gn.py +68 -45
- torchzero/modules/line_search/backtracking.py +2 -2
- torchzero/modules/line_search/line_search.py +1 -1
- torchzero/modules/line_search/strong_wolfe.py +2 -2
- torchzero/modules/misc/escape.py +1 -1
- torchzero/modules/misc/gradient_accumulation.py +1 -1
- torchzero/modules/misc/misc.py +1 -1
- torchzero/modules/misc/multistep.py +4 -7
- torchzero/modules/misc/regularization.py +2 -2
- torchzero/modules/misc/split.py +1 -1
- torchzero/modules/misc/switch.py +2 -2
- torchzero/modules/momentum/cautious.py +3 -3
- torchzero/modules/momentum/momentum.py +1 -1
- torchzero/modules/ops/higher_level.py +1 -1
- torchzero/modules/ops/multi.py +1 -1
- torchzero/modules/projections/projection.py +5 -2
- torchzero/modules/quasi_newton/__init__.py +1 -1
- torchzero/modules/quasi_newton/damping.py +1 -1
- torchzero/modules/quasi_newton/diagonal_quasi_newton.py +1 -1
- torchzero/modules/quasi_newton/lbfgs.py +3 -3
- torchzero/modules/quasi_newton/lsr1.py +3 -3
- torchzero/modules/quasi_newton/quasi_newton.py +44 -29
- torchzero/modules/quasi_newton/sg2.py +69 -205
- torchzero/modules/restarts/restars.py +17 -17
- torchzero/modules/second_order/inm.py +33 -25
- torchzero/modules/second_order/newton.py +132 -130
- torchzero/modules/second_order/newton_cg.py +3 -3
- torchzero/modules/second_order/nystrom.py +83 -32
- torchzero/modules/second_order/rsn.py +41 -44
- torchzero/modules/smoothing/laplacian.py +1 -1
- torchzero/modules/smoothing/sampling.py +2 -3
- torchzero/modules/step_size/adaptive.py +6 -6
- torchzero/modules/step_size/lr.py +2 -2
- torchzero/modules/trust_region/cubic_regularization.py +1 -1
- torchzero/modules/trust_region/levenberg_marquardt.py +2 -2
- torchzero/modules/trust_region/trust_cg.py +1 -1
- torchzero/modules/variance_reduction/svrg.py +4 -5
- torchzero/modules/weight_decay/reinit.py +2 -2
- torchzero/modules/weight_decay/weight_decay.py +5 -5
- torchzero/modules/wrappers/optim_wrapper.py +4 -4
- torchzero/modules/zeroth_order/cd.py +1 -1
- torchzero/optim/mbs.py +291 -0
- torchzero/optim/wrappers/nevergrad.py +0 -9
- torchzero/optim/wrappers/optuna.py +2 -0
- torchzero/utils/benchmarks/__init__.py +0 -0
- torchzero/utils/benchmarks/logistic.py +122 -0
- torchzero/utils/derivatives.py +4 -4
- {torchzero-0.4.0.dist-info → torchzero-0.4.1.dist-info}/METADATA +1 -1
- torchzero-0.4.1.dist-info/RECORD +209 -0
- torchzero/modules/adaptive/lmadagrad.py +0 -241
- torchzero-0.4.0.dist-info/RECORD +0 -191
- /torchzero/modules/{functional.py → opt_utils.py} +0 -0
- {torchzero-0.4.0.dist-info → torchzero-0.4.1.dist-info}/WHEEL +0 -0
- {torchzero-0.4.0.dist-info → torchzero-0.4.1.dist-info}/top_level.txt +0 -0
torchzero/optim/mbs.py
ADDED
@@ -0,0 +1,291 @@
+from typing import NamedTuple
+import math
+from collections.abc import Iterable
+from decimal import ROUND_HALF_UP, Decimal
+
+import numpy as np
+
+
+def format_number(number, n):
+    """Rounds to n significant digits after the decimal point."""
+    if number == 0: return 0
+    if math.isnan(number) or math.isinf(number) or (not math.isfinite(number)): return number
+    if n <= 0: raise ValueError("n must be positive")
+
+    dec = Decimal(str(number))
+    if dec.is_zero(): return 0
+    if number > 10**n or dec % 1 == 0: return int(dec)
+
+    if abs(dec) >= 1:
+        places = n
+    else:
+        frac_str = format(abs(dec), 'f').split('.')[1]
+        leading_zeros = len(frac_str) - len(frac_str.lstrip('0'))
+        places = leading_zeros + n
+
+    quantizer = Decimal('1e-' + str(places))
+    rounded_dec = dec.quantize(quantizer, rounding=ROUND_HALF_UP)
+
+    if rounded_dec % 1 == 0: return int(rounded_dec)
+    return float(rounded_dec)
+
+def _nonfinite_to_inf(x):
+    if not math.isfinite(x): return math.inf
+    return x
+
+def _tofloatlist(x) -> list[float]:
+    if isinstance(x, (int,float)): return [x]
+    if isinstance(x, np.ndarray) and x.size == 1: return [float(x.item())]
+    return [float(i) for i in x]
+
+class Trial(NamedTuple):
+    x: float
+    f: tuple[float, ...]
+
+class Solution(NamedTuple):
+    x: float
+    f: tuple[float, ...]
+    trials: list[Trial]
+
+class MBS:
+    """Univariate minimization via grid search followed by refining, supports multi-objective functions.
+
+    This tends to outperform bayesian optimization for learning rate tuning, it is also good for plotting.
+
+    First it evaluates all points defined in ``grid``. The grid doesn't have to be dense and the solution doesn't
+    have to be between the endpoints.
+
+    Then it picks ``num_candidates`` best points per each objective. If any of those points are endpoints,
+    it expands the search space by ``step`` in that direction and evaluates the new endpoint.
+
+    Otherwise it keeps picking points between best points and evaluating them, until ``num_binary`` evaluations
+    have been performed.
+
+    Args:
+        grid (Iterable[float], optional): values for initial grid search. If ``log_scale=True``, should be in log10 scale.
+        step (float, optional): expansion step size. Defaults to 1.
+        num_candidates (int, optional): number of best points to sample new points around on each iteration. Defaults to 2.
+        num_binary (int, optional): maximum number of new points sampled via binary search. Defaults to 7.
+        num_expansions (int, optional): maximum number of expansions (not counted towards binary search points). Defaults to 7.
+        rounding (int, optional): rounding is to significant digits, avoids evaluating points that are too close.
+        lb (float | None, optional): lower bound. If ``log_scale=True``, should be in log10 scale.
+        ub (float | None, optional): upper bound. If ``log_scale=True``, should be in log10 scale.
+        log_scale (bool, optional):
+            whether to minimize in log10 scale. If true, it is assumed that
+            ``grid``, ``lb`` and ``ub`` are given in log10 scale.
+
+    Example:
+
+    ```python
+    def objective(x: float):
+        x = x * 4
+        return -(np.sin(x) * (x / 3) + np.cos(x*2.5) * 2 - 0.05 * (x-5)**2)
+
+    mbs = MBS(grid=[-1, 0, 1, 2, 3, 4], step=1, num_binary=10, num_expansions=10)
+
+    x, f, trials = mbs.run(objective)
+    # x - solution
+    # f - value at solution x
+    # trials - list of trials, each trial is a named tuple: Trial(x, f)
+    """
+
+    def __init__(
+        self,
+        grid: Iterable[float],
+        step: float,
+        num_candidates: int = 3,
+        num_binary: int = 20,
+        num_expansions: int = 20,
+        rounding: int| None = 2,
+        lb = None,
+        ub = None,
+        log_scale: bool = False,
+    ):
+        self.objectives: dict[int, dict[float,float]] = {}
+        """dictionary of objectives, each maps point (x) to value (v)"""
+
+        self.evaluated: set[float] = set()
+        """set of evaluated points (x)"""
+
+        grid = tuple(grid)
+        if len(grid) == 0: raise ValueError("At least one grid search point must be specified")
+        self.grid = sorted(grid)
+
+        self.step = step
+        self.num_candidates = num_candidates
+        self.num_binary = num_binary
+        self.num_expansions = num_expansions
+        self.rounding = rounding
+        self.log_scale = log_scale
+        self.lb = lb
+        self.ub = ub
+
+    def _get_best_x(self, n: int, objective: int):
+        """n best points"""
+        obj = self.objectives[objective]
+        v_to_x = [(v,x) for x,v in obj.items()]
+        v_to_x.sort(key = lambda vx: vx[0])
+        xs = [x for v,x in v_to_x]
+        return xs[:n]
+
+    def _suggest_points_around(self, x: float, objective: int):
+        """suggests points around x"""
+        points = list(self.objectives[objective].keys())
+        points.sort()
+        if x not in points: raise RuntimeError(f"{x} not in {points}")
+
+        expansions = []
+        if x == points[0]:
+            expansions.append((x-self.step, 'expansion'))
+
+        if x == points[-1]:
+            expansions.append((x+self.step, 'expansion'))
+
+        if len(expansions) != 0: return expansions
+
+        idx = points.index(x)
+        xm = points[idx-1]
+        xp = points[idx+1]
+
+        x1 = (x - (x - xm)/2)
+        x2 = (x + (xp - x)/2)
+
+        return [(x1, 'binary'), (x2, 'binary')]
+
+    def _out_of_bounds(self, x):
+        if self.lb is not None and x < self.lb: return True
+        if self.ub is not None and x > self.ub: return True
+        return False
+
+    def _evaluate(self, fn, x):
+        """Evaluate a point, returns False if point is already in history"""
+        if self.rounding is not None: x = format_number(x, self.rounding)
+        if x in self.evaluated: return False
+        if self._out_of_bounds(x): return False
+
+        self.evaluated.add(x)
+
+        if self.log_scale: vals = _tofloatlist(fn(10 ** x))
+        else: vals = _tofloatlist(fn(x))
+        vals = [_nonfinite_to_inf(v) for v in vals]
+
+        for idx, v in enumerate(vals):
+            if idx not in self.objectives: self.objectives[idx] = {}
+            self.objectives[idx][x] = v
+
+        return True
+
+    def run(self, fn) -> Solution:
+        # step 1 - grid search
+        for x in self.grid:
+            self._evaluate(fn, x)
+
+        # step 2 - binary search
+        while True:
+            if (self.num_candidates <= 0) or (self.num_expansions <= 0 and self.num_binary <= 0): break
+
+            # suggest candidates
+            candidates: list[tuple[float, str]] = []
+
+            # sample around best points
+            for objective in self.objectives:
+                best_points = self._get_best_x(self.num_candidates, objective)
+                for p in best_points:
+                    candidates.extend(self._suggest_points_around(p, objective=objective))
+
+            # filter
+            if self.num_expansions <= 0:
+                candidates = [(x,t) for x,t in candidates if t != 'expansion']
+
+            if self.num_candidates <= 0:
+                candidates = [(x,t) for x,t in candidates if t != 'binary']
+
+            # if expansion was suggested, discard anything else
+            types = [t for x, t in candidates]
+            if any(t == 'expansion' for t in types):
+                candidates = [(x,t) for x,t in candidates if t == 'expansion']
+
+            # evaluate candidates
+            terminate = False
+            at_least_one_evaluated = False
+            for x, t in candidates:
+                evaluated = self._evaluate(fn, x)
+                if not evaluated: continue
+                at_least_one_evaluated = True
+
+                if t == 'expansion': self.num_expansions -= 1
+                elif t == 'binary': self.num_binary -= 1
+
+                if self.num_binary < 0:
+                    terminate = True
+                    break
+
+            if terminate: break
+            if not at_least_one_evaluated:
+                if self.rounding is None: break
+                self.rounding += 1
+                if self.rounding == 100: break
+
+        # create dict[float, tuple[float,...]]
+        ret = {}
+        for i, objective in enumerate(self.objectives.values()):
+            for x, v in objective.items():
+                if self.log_scale: x = 10 ** x
+                if x not in ret: ret[x] = [None for _ in self.objectives]
+                ret[x][i] = v
+
+        for v in ret.values():
+            assert len(v) == len(self.objectives), v
+            assert all(i is not None for i in v), v
+
+        # ret maps x to list of per-objective values, e.g. {1: [0.1, 0.3], ...}
+        # now make a list of trials as they are easier to work with
+        trials: list[Trial] = []
+        for x, values in ret.items():
+            trials.append(Trial(x=x, f=values))
+
+        # sort trials by sum of values
+        trials.sort(key = lambda trial: sum(trial.f))
+        return Solution(x=trials[0].x, f=trials[0].f, trials=trials)
+
+def mbs_minimize(
+    fn,
+    grid: Iterable[float],
+    step: float,
+    num_candidates: int = 3,
+    num_binary: int = 20,
+    num_expansions: int = 20,
+    rounding=2,
+    lb:float | None = None,
+    ub:float | None = None,
+    log_scale=False,
+) -> Solution:
+    """minimize univariate function via MBS.
+
+    Args:
+        fn (function): objective function that accepts a float and returns a float or a sequence of floats to minimize.
+        step (float, optional): expansion step size. Defaults to 1.
+        num_candidates (int, optional): number of best points to sample new points around on each iteration. Defaults to 2.
+        num_binary (int, optional): maximum number of new points sampled via binary search. Defaults to 7.
+        num_expansions (int, optional): maximum number of expansions (not counted towards binary search points). Defaults to 7.
+        rounding (int, optional): rounding is to significant digits, avoids evaluating points that are too close.
+        lb (float | None, optional): lower bound. If ``log_scale=True``, should be in log10 scale.
+        ub (float | None, optional): upper bound. If ``log_scale=True``, should be in log10 scale.
+        log_scale (bool, optional):
+            whether to minimize in log10 scale. If true, it is assumed that
+            ``grid``, ``lb`` and ``ub`` are given in log10 scale.
+
+    Example:
+
+    ```python
+    def objective(x: float):
+        x = x * 4
+        return -(np.sin(x) * (x / 3) + np.cos(x*2.5) * 2 - 0.05 * (x-5)**2)
+
+    x, f, trials = mbs_minimize(objective, grid=[-1, 0, 1, 2, 3, 4], step=1, num_binary=10, num_expansions=10)
+    # x - solution
+    # f - value at solution x
+    # trials - list of trials, each trial is a named tuple: Trial(x, f)
+    """
+    mbs = MBS(grid, step=step, num_candidates=num_candidates, num_binary=num_binary, num_expansions=num_expansions, rounding=rounding, lb=lb, ub=ub, log_scale=log_scale)
+    return mbs.run(fn)
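For context, a minimal sketch (not part of the diff) of how the new ``mbs_minimize`` helper could be used to tune a learning rate on a log10 scale; the objective below is a hypothetical stand-in and the grid values are illustrative assumptions:

```python
import numpy as np
from torchzero.optim.mbs import mbs_minimize

# Hypothetical stand-in objective: "train with this learning rate and return the final loss".
def final_loss(lr: float) -> float:
    return float((np.log10(lr) + 2.5) ** 2)

solution = mbs_minimize(
    final_loss,
    grid=[-4, -3, -2, -1],  # initial grid, given as log10(lr) because log_scale=True
    step=1,                 # expand the range by one decade if the best point is an endpoint
    num_binary=10,
    num_expansions=5,
    log_scale=True,
)
print(solution.x, solution.f)   # best learning rate (reported in original scale) and its value(s)
print(len(solution.trials))     # every evaluated Trial(x, f), convenient for plotting
```

With ``log_scale=True`` the grid and bounds are log10 values, ``fn`` receives the actual learning rate ``10**x``, and the returned trials are mapped back to the original scale.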
torchzero/optim/wrappers/nevergrad.py
CHANGED
@@ -55,15 +55,6 @@ class NevergradWrapper(WrapperBase):
         mutable_sigma = False,
         use_init = True,
     ):
-        """_summary_
-
-        Args:
-            params (_type_): _description_
-            opt_cls (type[ng.optimizers.base.Optimizer] | abc.Callable[..., ng.optimizers.base.Optimizer]): _description_
-            budget (int | None, optional): _description_. Defaults to None.
-            mutable_sigma (bool, optional): _description_. Defaults to False.
-            use_init (bool, optional): _description_. Defaults to True.
-        """
         defaults = dict(lb=lb, ub=ub, use_init=use_init, mutable_sigma=mutable_sigma)
         super().__init__(params, defaults)
         self.opt_cls = opt_cls
torchzero/optim/wrappers/optuna.py
CHANGED
@@ -45,6 +45,7 @@ class OptunaSampler(WrapperBase):
         self.study = optuna.create_study(sampler=self.sampler)

         # some optuna samplers use torch
+        # and require torch.enable_grad
         with torch.enable_grad():
             trial = self.study.ask()

@@ -58,6 +59,7 @@ class OptunaSampler(WrapperBase):
         params.from_vec_(vec)

         loss = closure()
+
         with torch.enable_grad(): self.study.tell(trial, tofloat(torch.nan_to_num(totensor(loss), 1e32)))

         return loss
torchzero/utils/benchmarks/__init__.py
File without changes

torchzero/utils/benchmarks/logistic.py
ADDED
@@ -0,0 +1,122 @@
+from functools import partial
+from typing import Any, cast
+
+import numpy as np
+import torch
+import tqdm
+
+
+def generate_correlated_logistic_data(n_samples=2000, n_features=32, n_correlated_pairs=512, correlation=0.99, seed=0):
+    """Hard logistic regression dataset with correlated features"""
+    generator = np.random.default_rng(seed)
+
+    # ------------------------------------- X ------------------------------------ #
+    X = generator.standard_normal(size=(n_samples, n_features))
+    weights = generator.uniform(-2, 2, n_features)
+
+    used_pairs = []
+    for i in range(n_correlated_pairs):
+        idxs = None
+        while idxs is None or idxs in used_pairs:
+            idxs = tuple(generator.choice(n_features, size=2, replace=False).tolist())
+
+        used_pairs.append(idxs)
+        idx1, idx2 = idxs
+
+        noise = generator.standard_normal(n_samples) * np.sqrt(1 - correlation**2)
+        X[:, idx2] = correlation * X[:, idx1] + noise
+
+        w = generator.integers(1, 51)
+        weights[idx1] = w
+        weights[idx2] = -w
+
+    # ---------------------------------- logits ---------------------------------- #
+    logits = X @ weights
+    probabilities = 1 / (1 + np.exp(-logits))
+    y = generator.binomial(1, probabilities).astype(np.float32)
+
+    X = X - X.mean(0, keepdims=True)
+    X = X / X.std(0, keepdims=True)
+    return X, y
+
+
+# if __name__ == '__main__':
+#     X, y = generate_correlated_logistic_data()
+
+#     plt.figure(figsize=(10, 8))
+#     sns.heatmap(pl.DataFrame(X).corr(), annot=True, cmap='coolwarm', fmt=".2f")
+#     plt.show()
+
+
+
+
+def _tensorlist_equal(t1, t2):
+    return all(a == b for a, b in zip(t1, t2))
+
+_placeholder = cast(Any, ...)
+
+def run_logistic_regression(X: torch.Tensor, y: torch.Tensor, opt_fn, max_steps: int, tol:float=0, l1:float=0, l2:float=0, pbar:bool=False, *, _assert_on_evaluated_same_params: bool = False):
+    # ------------------------------- verify inputs ------------------------------ #
+    n_samples, n_features = X.size()
+
+    if y.ndim != 1: raise ValueError(f"y should be 1d, got {y.shape}")
+    if y.size(0) != n_samples: raise ValueError(f"y should have {n_samples} elements, got {y.shape}")
+    if y.device != X.device: raise ValueError(f"X and y should be on same device, got {X.device = }, {y.device = }")
+    device = X.device
+    dtype = X.dtype
+
+    # ---------------------------- model and criterion --------------------------- #
+    n_targets = int(y.amax()) + 1
+    binary = n_targets == 2
+
+    if binary:
+        criterion = torch.nn.functional.binary_cross_entropy_with_logits
+        model = torch.nn.Linear(n_features, 1).to(device=device, dtype=dtype)
+        y = y.to(dtype=dtype)
+    else:
+        model = torch.nn.Linear(n_features, n_targets).to(device=device, dtype=dtype)
+        criterion = torch.nn.functional.cross_entropy
+        y = y.long()
+
+    optimizer = opt_fn(list(model.parameters()))
+
+    # ---------------------------------- closure --------------------------------- #
+    def _l1_penalty():
+        return sum(p.abs().sum() for p in model.parameters())
+    def _l2_penalty():
+        return sum(p.square().sum() for p in model.parameters())
+
+    def closure(backward=True, evaluated_params: list = _placeholder, epoch: int = _placeholder):
+        y_hat = model(X)
+        loss = criterion(y_hat.squeeze(), y)
+
+        if l1 > 0: loss += _l1_penalty() * l1
+        if l2 > 0: loss += _l2_penalty() * l2
+
+        if backward:
+            optimizer.zero_grad()
+            loss.backward()
+
+        # here I also test to make sure the optimizer doesn't evaluate same parameters twice per step
+        # this is for tests
+        if _assert_on_evaluated_same_params:
+            for p in evaluated_params:
+                assert not _tensorlist_equal(p, model.parameters()), f"evaluated same parameters on epoch {epoch}"
+
+            evaluated_params.append([p.clone() for p in model.parameters()])
+
+        return loss
+
+    # --------------------------------- optimize --------------------------------- #
+    losses = []
+    epochs = tqdm.trange(max_steps, disable=not pbar)
+    for epoch in epochs:
+        evaluated_params = []
+        loss = float(optimizer.step(partial(closure, evaluated_params=evaluated_params, epoch=epoch)))
+
+        losses.append(loss)
+        epochs.set_postfix_str(f"{loss:.5f}")
+        if loss <= tol:
+            break
+
+    return losses
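A rough usage sketch (not part of the diff) of how the new benchmark helpers might be wired together; the optimizer choice and hyperparameters are assumptions, and any optimizer whose ``step`` accepts a closure and returns the loss should work:

```python
import torch
from torchzero.utils.benchmarks.logistic import (
    generate_correlated_logistic_data,
    run_logistic_regression,
)

# Build the synthetic ill-conditioned dataset (numpy arrays) and move it to torch.
X_np, y_np = generate_correlated_logistic_data(n_samples=1000, n_features=16, n_correlated_pairs=64)
X = torch.as_tensor(X_np, dtype=torch.float32)
y = torch.as_tensor(y_np)

# opt_fn receives the model's parameter list and must return an optimizer whose
# step() accepts a closure and returns the loss (torch.optim.SGD does).
losses = run_logistic_regression(
    X, y,
    opt_fn=lambda params: torch.optim.SGD(params, lr=1e-2),
    max_steps=200,
    l2=1e-4,
)
print(losses[-1])  # final training loss
```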
torchzero/utils/derivatives.py
CHANGED
@@ -7,7 +7,7 @@ from .torch_tools import swap_tensors_no_use_count_check, vec_to_tensors
 from .tensorlist import TensorList

 def _jacobian(outputs: Sequence[torch.Tensor], wrt: Sequence[torch.Tensor], create_graph=False):
-    flat_outputs = torch.cat([i.
+    flat_outputs = torch.cat([i.ravel() for i in outputs])
     grad_ouputs = torch.eye(len(flat_outputs), device=outputs[0].device, dtype=outputs[0].dtype)
     jac = []
     for i in range(flat_outputs.numel()):
@@ -24,7 +24,7 @@ def _jacobian(outputs: Sequence[torch.Tensor], wrt: Sequence[torch.Tensor], crea
 
 
 def _jacobian_batched(outputs: Sequence[torch.Tensor], wrt: Sequence[torch.Tensor], create_graph=False):
-    flat_outputs = torch.cat([i.
+    flat_outputs = torch.cat([i.ravel() for i in outputs])
     return torch.autograd.grad(
         flat_outputs,
         wrt,
@@ -40,10 +40,10 @@ def flatten_jacobian(jacs: Sequence[torch.Tensor]) -> torch.Tensor:
 
     Args:
         jacs (Sequence[torch.Tensor]):
-            output from jacobian_wrt where ach tensor has the shape
+            output from jacobian_wrt where ach tensor has the shape ``(*output.shape, *wrt[i].shape)``.
 
     Returns:
-        torch.Tensor: has the shape
+        torch.Tensor: has the shape ``(output.ndim, wrt.ndim)``.
     """
     if not jacs:
         return torch.empty(0, 0)