junshan-kit 2.2.8__py2.py3-none-any.whl → 2.7.3__py2.py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,286 @@
+ """
+ ----------------------------------------------------------------------
+ >>> Author       : Junshan Yin
+ >>> Last Updated : 2025-11-14
+ ----------------------------------------------------------------------
+ """
+ import math, os
+ import matplotlib.pyplot as plt
+ import numpy as np
+ import matplotlib as mpl
+ from collections import defaultdict
+ from junshan_kit import kit, ParametersHub
+
+ def marker_schedule(marker_schedule=None):
+
+     if marker_schedule == "SPBM":
+         based_marker = {
+             "ADAM": "s",      # square
+             "ALR-SMAG": "h",  # hexagon
+             "Bundle": "o",    # circle
+             "SGD": "p",       # pentagon
+             "SPSmax": "4",    # tri-right
+             "SPBM-PF": "*",   # star
+             "SPBM-TR": "s",   # square
+         }
+
+     else:
+         based_marker = {
+             "point": ".",           # point marker
+             "pixel": ",",           # pixel marker
+             "circle": "o",          # circle
+             "triangle_down": "v",   # down triangle
+             "triangle_up": "^",     # up triangle
+             "triangle_left": "<",   # left triangle
+             "triangle_right": ">",  # right triangle
+             "tri_down": "1",        # tri-down
+             "tri_up": "2",          # tri-up
+             "tri_left": "3",        # tri-left
+             "tri_right": "4",       # tri-right
+             "square": "s",          # square
+             "pentagon": "p",        # pentagon
+             "star": "*",            # star
+             "hexagon1": "h",        # hexagon 1
+             "hexagon2": "H",        # hexagon 2
+             "plus": "+",            # plus
+             "x": "x",               # x
+             "diamond": "D",         # diamond
+             "thin_diamond": "d",    # thin diamond
+             "vline": "|",           # vertical line
+             "hline": "_",           # horizontal line
+         }
+
+     return based_marker
+
+
+ def colors_schedule(colors_schedule=None):
+
+     if colors_schedule == "SPBM":
+         based_color = {
+             "ADAM": "#7f7f7f",
+             "ALR-SMAG": "#796378",
+             "Bundle": "#17becf",
+             "SGD": "#2ca02c",
+             "SPSmax": "#BA6262",
+             "SPBM-PF": "#1f77b4",
+             "SPBM-TR": "#d62728",
+         }
+
+     else:
+         based_color = {
+             "ADAM": "#1f77b4",
+             "ALR-SMAG": "#ff7f0e",
+             "Bundle": "#2ca02c",
+             "SGD": "#d62728",
+             "SPSmax": "#9467bd",
+             "SPBM-PF": "#8c564b",
+             "SPBM-TR": "#e377c2",
+             "dddd": "#7f7f7f",
+             "xxx": "#bcbd22",
+             "ED": "#17becf",
+         }
+     return based_color
+
+
+ def Search_Paras(Paras, args, model_name, data_name, optimizer_name, metric_key="training_loss"):
+
+     param_dict = Paras["Results_dict"][model_name][data_name][optimizer_name]
+
+     num_plots = len(param_dict)
+     cols = 3
+     rows = math.ceil(num_plots / cols)
+
+     fig, axes = plt.subplots(rows, cols, figsize=(5 * cols, 4 * rows))
+     axes = axes.flatten()
+
+     for idx, (param_str, info) in enumerate(param_dict.items()):
+         ax = axes[idx]
+         metric_list = info.get(metric_key, [])
+         ax.plot(metric_list)
+         ax.set_title(f'time = {info["train_time"]:.2f}, seed: {Paras["seed"]}, ID: {Paras["time_str"]} \n params = {param_str}', fontsize=10)
+         ax.set_xlabel("epochs")
+         ax.set_ylabel(ParametersHub.fig_ylabel(metric_key))
+         ax.grid(True)
+         if Paras.get('use_log_scale', False) and any(k in metric_key for k in ['loss', 'grad']):
+             ax.set_yscale("log")
+
+     # Delete the redundant subplots
+     for i in range(len(param_dict), len(axes)):
+         fig.delaxes(axes[i])
+
+     plt.suptitle(f'{model_name} on {data_name} - {optimizer_name} (training/test samples: {Paras["train_data_num"]}/{Paras["test_data_num"]}), {Paras["device"]}', fontsize=16)
+     plt.tight_layout(rect=(0, 0, 1, 0.9))
+
+     filename = f'{Paras["Results_folder"]}/{metric_key}_{ParametersHub.model_abbr(model_name)}_{data_name}_{optimizer_name}.pdf'
+     fig.savefig(filename)
+     print(f"✅ Saved: {filename}")
+     plt.close('all')
+
+
+ def Read_Results_from_pkl(info_dict, Exp_name, model_name):
+     draw_data = defaultdict(dict)
+     for data_name, info in info_dict.items():
+         for optimizer_name, info_opt in info["optimizer"].items():
+
+             pkl_path = f'{Exp_name}/seed_{info["seed"]}/{model_name}/{data_name}/{optimizer_name}/train_{info["train_test"][0]}_test_{info["train_test"][1]}/Batch_size_{info["batch_size"]}/epoch_{info["epochs"]}/{info_opt["ID"]}/Results_{ParametersHub.model_abbr(model_name)}_{data_name}_{optimizer_name}.pkl'
+
+             data_ = kit.read_pkl_data(pkl_path)
+
+             param_str = ParametersHub.opt_paras_str(info["optimizer"][optimizer_name])
+
+             # Store both the metric list and the parameter string
+             draw_data[data_name][optimizer_name] = {
+                 "metrics": data_[param_str][info["metric_key"]],
+                 "param_str": param_str
+             }
+
+     return draw_data
+
+
+ def Mul_Plot(model_name, info_dict, Exp_name="SPBM", cols=3, save_path=None, save_name=None, fig_show=False):
+     # matplotlib settings: serif fonts (Times New Roman) for text and STIX for math
+     mpl.rcParams["font.family"] = "serif"
+     mpl.rcParams["font.serif"] = ["Times New Roman"]
+     mpl.rcParams["mathtext.fontset"] = "stix"
+     mpl.rcParams["axes.unicode_minus"] = False
+     mpl.rcParams["font.size"] = 12
+
+     # Read data
+     draw_data = defaultdict(dict)
+     for data_name, info in info_dict.items():
+         for optimizer_name, info_opt in info["optimizer"].items():
+
+             pkl_path = f'{Exp_name}/seed_{info["seed"]}/{model_name}/{data_name}/{optimizer_name}/train_{info["train_test"][0]}_test_{info["train_test"][1]}/Batch_size_{info["batch_size"]}/epoch_{info["epochs"]}/{info_opt["ID"]}/Results_{ParametersHub.model_abbr(model_name)}_{data_name}_{optimizer_name}.pkl'
+
+             data_ = kit.read_pkl_data(pkl_path)
+
+             param_str = ParametersHub.opt_paras_str(info["optimizer"][optimizer_name])
+
+             draw_data[data_name][optimizer_name] = data_[param_str][info["metric_key"]]
+
+     # Draw figures
+     num_datasets = len(draw_data)
+
+     nrows = math.ceil(num_datasets / cols)
+
+     fig, axes = plt.subplots(nrows, cols, figsize=(5 * cols, 4 * nrows), squeeze=False)
+     axes = axes.flatten()
+
+     for idx, (data_name, info) in enumerate(draw_data.items()):
+         ax = axes[idx]
+         for optimizer_name, metric_list in info.items():
+             ax.plot(metric_list, label=optimizer_name, color=colors_schedule("SPBM")[optimizer_name])
+
+             # marker
+             if info_dict[data_name]["marker"] is not None:
+                 x = np.array(info_dict[data_name]["marker"])
+
+                 metric_list_arr = np.array(metric_list)
+
+                 ax.scatter(x, metric_list_arr[x], marker=marker_schedule("SPBM")[optimizer_name], color=colors_schedule("SPBM")[optimizer_name])
+
+         ax.set_title(f'{data_name}', fontsize=12)
+         ax.set_xlabel("epochs", fontsize=12)
+         ax.set_ylabel(ParametersHub.fig_ylabel(info_dict[data_name]["metric_key"]), fontsize=12)
+         if any(k in info_dict[data_name]["metric_key"] for k in ['loss', 'grad']):
+             ax.set_yscale("log")
+         ax.grid(True)
+
+     # Hide redundant axes
+     for ax in axes[num_datasets:]:
+         ax.axis('off')
+
+     # legend
+     all_handles, all_labels = [], []
+     for ax in axes[:num_datasets]:
+         h, l = ax.get_legend_handles_labels()
+         all_handles.extend(h)
+         all_labels.extend(l)
+
+     # duplicate removal
+     unique = dict(zip(all_labels, all_handles))
+     handles = list(unique.values())
+     labels = list(unique.keys())
+
+     fig.legend(
+         handles,
+         labels,
+         loc="lower center",
+         bbox_to_anchor=(0.5, -0.08),
+         ncol=len(handles),
+         fontsize=12
+     )
+
+     plt.tight_layout()
+     if save_path is None:
+         if save_name is None:
+             save_path = f'{model_name}.pdf'
+         else:
+             os.makedirs(save_name, exist_ok=True)
+             save_path = f'{save_name}/{save_name}.pdf'
+     plt.savefig(save_path, bbox_inches="tight")
+     if fig_show:
+         plt.show()
+     plt.close()  # Close the figure
+
+
+ def Opt_Paras_Plot(model_name, info_dict, Exp_name="SPBM", save_path=None, save_name=None, fig_show=False):
+
+     mpl.rcParams["font.family"] = "serif"
+     mpl.rcParams["font.serif"] = ["Times New Roman"]
+     mpl.rcParams["mathtext.fontset"] = "stix"
+     mpl.rcParams["axes.unicode_minus"] = False
+     mpl.rcParams["font.size"] = 12
+
+     # Read data
+     draw_data = Read_Results_from_pkl(info_dict, Exp_name, model_name)
+
+     if len(draw_data) > 1:
+         print('*' * 40)
+         print("Only one dataset can be drawn at a time.")
+         print(info_dict.keys())
+         print('*' * 40)
+         raise AssertionError("Opt_Paras_Plot expects a single dataset.")
+
+     plt.figure(figsize=(9, 6))  # Optional: set figure size
+
+     data_name = None
+
+     for data_name, _info in draw_data.items():
+         for optimizer_name, metric_dict in _info.items():
+             plt.plot(metric_dict["metrics"], label=f'{optimizer_name}_{metric_dict["param_str"]}',
+                      color=colors_schedule("SPBM")[optimizer_name])
+
+     if data_name is not None:
+         plt.title(f'{data_name}')
+
+     plt.legend(loc='upper center', bbox_to_anchor=(0.5, -0.15), ncol=1)
+     plt.grid(True)
+
+     if any(k in info_dict[data_name]["metric_key"] for k in ['loss', 'grad']):
+         plt.yscale("log")
+
+     plt.tight_layout()  # Adjust layout so the legend fits
+     plt.xlabel("epochs")
+     plt.ylabel(f'{ParametersHub.fig_ylabel(info_dict[data_name]["metric_key"])}')
+     if save_path is None:
+         if save_name is None:
+             save_path = f'{model_name}.pdf'
+         else:
+             os.makedirs(save_name, exist_ok=True)
+             save_path = f'{save_name}/{save_name}.pdf'
+     plt.savefig(save_path, bbox_inches="tight")
+
+     if fig_show:
+         plt.show()
+
+     plt.close()
+
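The plotting helpers above all rebuild a results path from a nested info_dict, but the expected schema is only implied by the keys the code reads. The sketch below shows one plausible layout; the module name PlottingHub is a guess (this diff does not show file names), and every dataset name, optimizer name, and value is illustrative rather than taken from the package.

```python
# Hypothetical usage of Mul_Plot; only the dict keys are taken from the
# code above. Names, values, and the module path are assumptions.
from junshan_kit import PlottingHub  # assumed module name for this file

info_dict = {
    "MNIST": {                          # one subplot per dataset
        "seed": 42,                     # -> seed_42/ in the pkl path
        "train_test": (60000, 10000),   # -> train_60000_test_10000/
        "batch_size": 128,              # -> Batch_size_128/
        "epochs": 50,                   # -> epoch_50/
        "metric_key": "training_loss",  # which metric series to plot
        "marker": None,                 # or a list of epochs to mark
        "optimizer": {
            "SGD": {"ID": "2025-11-14_0001", "lr": 0.1},
            "SPBM-TR": {"ID": "2025-11-14_0002", "delta": 1.0},
        },
    },
}

PlottingHub.Mul_Plot("LeNet", info_dict, Exp_name="SPBM",
                     cols=3, save_name="figs", fig_show=False)
```

Each optimizer sub-dict is passed through ParametersHub.opt_paras_str to form the key used inside the pkl file, so it presumably has to match the hyper-parameters recorded at training time.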
@@ -0,0 +1,239 @@
+ import torchvision, torch, random
+ import numpy as np
+ from torchvision.models import resnet18, resnet34, ResNet18_Weights, ResNet34_Weights
+ import torch.nn as nn
+
+
+ # ---------------- Build ResNet18 - Caltech101 -----------------------
+ def Build_ResNet18_Caltech101_Resize_32():
+
+     """
+     1. Modify the first convolutional layer for smaller input (e.g., 32x32 instead of 224x224)
+        Original: kernel_size=7, stride=2, padding=3 → changed to 3x3 kernel, stride=1, padding=1
+
+     2. Adjust the final fully connected layer to match the number of Caltech101 classes (101)
+     """
+     model = resnet18(weights=None)
+     model.conv1 = nn.Conv2d(3, 64, kernel_size=3, stride=1, padding=1, bias=False)  # 1
+     model.fc = nn.Linear(model.fc.in_features, 101)  # 2
+
+     return model
+
+
+ # ---------------- Build ResNet18 - CIFAR100 -----------------------
+ def Build_ResNet18_CIFAR100():
+     """
+     1. Modify the first convolutional layer for smaller input (e.g., 32x32 instead of 224x224)
+        Original: kernel_size=7, stride=2, padding=3 → changed to 3x3 kernel, stride=1, padding=1
+
+     2. Adjust the final fully connected layer to match the number of CIFAR-100 classes (100)
+     """
+
+     model = resnet18(weights=None)
+     # model = resnet18(weights=ResNet18_Weights.DEFAULT)
+     model.conv1 = nn.Conv2d(3, 64, kernel_size=3, stride=1, padding=1, bias=False)  # 1
+     model.fc = nn.Linear(model.fc.in_features, 100)  # 2
+
+     return model
+
+
+ # ---------------- Build ResNet18 - MNIST ----------------------------
+ def Build_ResNet18_MNIST():
+     """
+     1. Modify the first convolutional layer to accept grayscale input (1 channel instead of 3)
+        Original: in_channels=3 → changed to in_channels=1
+
+     2. Adjust the final fully connected layer to match the number of MNIST classes (10)
+     """
+
+     model = resnet18(weights=None)
+     model.conv1 = nn.Conv2d(1, 64, kernel_size=7, stride=2, padding=3, bias=False)  # 1
+     model.fc = nn.Linear(model.fc.in_features, 10)  # 2
+
+     return model
+
+
+ # ---------------- Build ResNet34 - CIFAR100 -----------------------
+ def Build_ResNet34_CIFAR100():
+
+     model = resnet34(weights=None)
+     model.conv1 = nn.Conv2d(3, 64, kernel_size=3, stride=1, padding=1, bias=False)
+     model.fc = nn.Linear(model.fc.in_features, 100)
+     return model
+
+ # ---------------- Build ResNet34 - MNIST ----------------------------
+ def Build_ResNet34_MNIST():
+     # Do not load the pre-trained weights
+     model = resnet34(weights=None)
+
+     model.conv1 = nn.Conv2d(1, 64, kernel_size=7, stride=2, padding=3, bias=False)
+     model.fc = nn.Linear(model.fc.in_features, 10)
+
+     return model
+
+ # ---------------- Build ResNet34 - Caltech101 -----------------------
+ def Build_ResNet34_Caltech101_Resize_32():
+
+     model = resnet34(weights=None)
+     model.conv1 = nn.Conv2d(3, 64, kernel_size=3, stride=1, padding=1, bias=False)
+     model.fc = nn.Linear(model.fc.in_features, 101)
+     return model
+
+
+ #**************************************************************
+ # ---------------------- LeastSquares -------------------------
+ #**************************************************************
+ # ---------------- LeastSquares - MNIST -----------------------
+ def Build_LeastSquares_MNIST():
+     """
+     1. Flatten MNIST images (1x28x28 → 784)
+     2. Use a linear layer for multi-class classification
+     """
+     return nn.Sequential(
+         nn.Flatten(),
+         nn.Linear(28 * 28, 10))
+
+ # ---------------- LeastSquares - CIFAR100 --------------------
+ def Build_LeastSquares_CIFAR100():
+     """
+     1. Flatten CIFAR-100 images (3x32x32 → 3072)
+     2. Use a linear layer for multi-class classification
+     """
+     return nn.Sequential(
+         nn.Flatten(),
+         nn.Linear(3 * 32 * 32, 100))
+
+ # ---------------- LeastSquares - Caltech101 ------------------
+ def Build_LeastSquares_Caltech101_Resize_32():
+     return nn.Sequential(
+         nn.Flatten(),
+         nn.Linear(3 * 32 * 32, 101)
+     )
+
+
+ #*************************************************************
+ # --------------- LogRegressionBinary ------------------------
+ #*************************************************************
+ # -------------- LogRegressionBinary - MNIST ------------------
+ def Build_LogRegressionBinary_MNIST():
+     """
+     1. Flatten MNIST images (1x28x28 → 784)
+     2. Use a linear layer for binary classification
+     """
+     return nn.Sequential(
+         nn.Flatten(),
+         nn.Linear(28 * 28, 1))
+
+
+ # --------------- LogRegressionBinary - CIFAR100 --------------
+ def Build_LogRegressionBinary_CIFAR100():
+     """
+     1. Flatten CIFAR-100 images (3x32x32 → 3072)
+     2. Use a linear layer for binary classification
+     """
+     return nn.Sequential(
+         nn.Flatten(),
+         nn.Linear(3 * 32 * 32, 1))
+
+ # -------------- LogRegressionBinary - RCV1 ------------------
+ def Build_LogRegressionBinary_RCV1():
+     """
+     Use a linear layer for binary classification (RCV1: 47,236 features)
+     """
+     return nn.Sequential(
+         nn.Linear(47236, 1))
+
+ # <LogRegressionBinaryL2>
+ #**************************************************************
+ # ------------- LogRegressionBinaryL2 -------------------------
+ #**************************************************************
+ def Build_LogRegressionBinaryL2_RCV1():
+     """
+     Use a linear layer for binary classification (RCV1: 47,236 features)
+     """
+     return nn.Sequential(
+         nn.Linear(47236, 1))
+ # <LogRegressionBinaryL2>
+
+ # ---------------------------------------------------------
+ def Build_LogRegressionBinaryL2_MNIST():
+     """
+     1. Flatten MNIST images (1x28x28 -> 784)
+     2. Use a linear layer for binary classification
+     """
+     return nn.Sequential(
+         nn.Flatten(),
+         nn.Linear(28 * 28, 1))
+
+ # ---------------------------------------------------------
+ def Build_LogRegressionBinaryL2_CIFAR100():
+     """
+     1. Flatten CIFAR-100 images (3x32x32 -> 3072)
+     2. Use a linear layer for binary classification
+     """
+     return nn.Sequential(
+         nn.Flatten(),
+         nn.Linear(3 * 32 * 32, 1))
+
+ # ---------------------------------------------------------
+ def Build_LogRegressionBinaryL2_Duke():
+     """
+     Use a linear layer for binary classification
+     """
+     return nn.Sequential(
+         nn.Flatten(),
+         nn.Linear(7129, 1))
+
+ # ---------------------------------------------------------
+ def Build_LogRegressionBinaryL2_Ijcnn():
+     """
+     Use a linear layer for binary classification
+     """
+     return nn.Sequential(
+         nn.Flatten(),
+         nn.Linear(22, 1))
+
+ # ---------------------------------------------------------
+ def Build_LogRegressionBinaryL2_w8a():
+     """
+     Use a linear layer for binary classification
+     """
+     return nn.Sequential(
+         nn.Flatten(),
+         nn.Linear(300, 1))
+
+ # ---------------------------------------------------------
+ def Build_LogRegressionBinaryL2_Adult_Income_Prediction():
+     return nn.Sequential(
+         nn.Linear(108, 1))
+
+ def Build_LogRegressionBinaryL2_Credit_Card_Fraud_Detection():
+     return nn.Sequential(
+         nn.Linear(30, 1))
+
+ def Build_LogRegressionBinaryL2_Diabetes_Health_Indicators():
+     return nn.Sequential(
+         nn.Linear(52, 1))
+
+ def Build_LogRegressionBinaryL2_Electric_Vehicle_Population():
+     return nn.Sequential(
+         nn.Linear(835, 1))
+
+ def Build_LogRegressionBinaryL2_Global_House_Purchase():
+     return nn.Sequential(
+         nn.Linear(81, 1))
+
+ def Build_LogRegressionBinaryL2_Health_Lifestyle():
+     return nn.Sequential(
+         nn.Linear(15, 1))
+
+ def Build_LogRegressionBinaryL2_Homesite_Quote_Conversion():
+     return nn.Sequential(
+         nn.Linear(655, 1))
+
+ def Build_LogRegressionBinaryL2_TN_Weather_2020_2025():
+     return nn.Sequential(
+         nn.Linear(121, 1))
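Each builder above adapts a stock architecture to a fixed input shape, so a quick forward pass makes the expected tensor shapes concrete. A minimal sketch, assuming the builders live in a module named ModelsHub (the file name is not shown in this diff):

```python
# Shape check for the CIFAR-100 builders; the module path is an assumption.
import torch
from junshan_kit.ModelsHub import Build_ResNet18_CIFAR100, Build_LeastSquares_CIFAR100

x = torch.randn(8, 3, 32, 32)        # a dummy batch of CIFAR-100 images

resnet = Build_ResNet18_CIFAR100()   # 3x3 stem keeps the 32x32 resolution
linear = Build_LeastSquares_CIFAR100()

print(resnet(x).shape)               # torch.Size([8, 100])
print(linear(x).shape)               # torch.Size([8, 100])
```

The binary builders follow the same pattern but end in nn.Linear(d, 1), so they emit a single raw logit per sample; a sigmoid is presumably applied downstream, e.g. via BCEWithLogitsLoss.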
@@ -0,0 +1,130 @@
+ from junshan_kit.OptimizerHup import SPBM, SPBM_func
+ import torch, time, os
+ from torch.optim.optimizer import Optimizer
+ from torch.nn.utils import parameters_to_vector, vector_to_parameters
+
+
+ class SPSmax(Optimizer):
+     def __init__(self, params, model, hyperparams, Paras):
+         defaults = dict()
+         super().__init__(params, defaults)
+         self.model = model
+         self.c = hyperparams['c']
+         self.gamma = hyperparams['gamma']
+         if 'f_star' not in Paras or Paras['f_star'] is None:
+             self.f_star = 0
+         else:
+             self.f_star = Paras['f_star']
+         self.step_size = []
+
+     def step(self, closure=None):
+         if closure is None:
+             raise RuntimeError("Closure required for SPSmax")
+
+         # Reset the gradients and perform the forward/backward computation
+         loss = closure()
+
+         with torch.no_grad():
+             xk = parameters_to_vector(self.model.parameters())
+             g_k = parameters_to_vector([p.grad if p.grad is not None else torch.zeros_like(p) for p in self.model.parameters()])
+
+             # Step size: min((f(x_k) - f_star) / (c * ||g_k||^2), gamma)
+             step_size = (loss - self.f_star) / ((self.c * torch.norm(g_k, p=2) ** 2) + 1e-8)
+             step_size = min(step_size, self.gamma)
+             self.step_size.append(step_size)
+
+             # Update
+             xk = xk - step_size * g_k
+
+             vector_to_parameters(xk, self.model.parameters())
+
+         # Temporarily return the loss (tensor type)
+         return loss
+
+
+ class ALR_SMAG(Optimizer):
+     def __init__(self, params, model, hyperparams, Paras):
+         defaults = dict()
+         super().__init__(params, defaults)
+         self.model = model
+         self.c = hyperparams['c']
+         self.eta_max = hyperparams['eta_max']
+         self.beta = hyperparams['beta']
+         if 'f_star' not in Paras or Paras['f_star'] is None:
+             self.f_star = 0
+         else:
+             self.f_star = Paras['f_star']
+         self.step_size = []
+         self.d_k = torch.zeros_like(parameters_to_vector(self.model.parameters()))
+
+     def step(self, closure=None):
+         if closure is None:
+             raise RuntimeError("Closure required for ALR_SMAG")
+
+         # Reset the gradients and perform the forward/backward computation
+         loss = closure()
+
+         with torch.no_grad():
+             xk = parameters_to_vector(self.model.parameters())
+             g_k = parameters_to_vector([p.grad if p.grad is not None else torch.zeros_like(p) for p in self.model.parameters()])
+
+             # Momentum direction: d_k = beta * d_{k-1} + g_k
+             self.d_k = self.beta * self.d_k + g_k
+             # Step size: min((f(x_k) - f_star) / (c * ||d_k||^2), eta_max)
+             step_size = (loss - self.f_star) / ((self.c * torch.norm(self.d_k, p=2) ** 2) + 1e-8)
+             step_size = min(step_size, self.eta_max)
+             self.step_size.append(step_size)
+
+             # Update
+             xk = xk - step_size * g_k
+
+             vector_to_parameters(xk, self.model.parameters())
+
+         # Temporarily return the loss (tensor type)
+         return loss
+
+
+ class Bundle(Optimizer):
+     def __init__(self, params, model, hyperparams, Paras):
+         defaults = dict()
+         super().__init__(params, defaults)
+         self.model = model
+         self.cutting_num = hyperparams['cutting_number']
+         self.delta = hyperparams['delta']
+         self.Paras = Paras
+
+         self.x_his, self.g_his, self.f_his = [], [], []
+
+     def step(self, closure=None):
+         if closure is None:
+             raise RuntimeError("Closure required for Bundle")
+
+         # Reset the gradients and perform the forward/backward computation
+         loss = closure()
+
+         with torch.no_grad():
+             xk = parameters_to_vector(self.model.parameters())
+             g_k = parameters_to_vector([p.grad if p.grad is not None else torch.zeros_like(p) for p in self.model.parameters()])
+
+             # Add a cutting plane to the bundle (bounded by cutting_num)
+             x_his, f_his, g_his = SPBM_func.add_cutting(self.x_his, self.f_his, self.g_his, xk.detach().clone(), g_k.detach().clone(), loss.detach().clone(), self.cutting_num)
+
+             # Coefficients of the dual problem
+             Gk, rk, ek = SPBM_func.get_var(x_his, f_his, g_his, self.delta)
+
+             # Solve the dual problem
+             xk = SPBM_func.bundle(Gk, ek, xk, self.delta, self.Paras)
+
+             vector_to_parameters(xk, self.model.parameters())
+
+         # Return the loss (tensor type)
+         return loss
+
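All three optimizers require a closure that re-evaluates the loss and populates the gradients, unlike the usual argument-free opt.step() call. A hedged usage sketch, assuming the classes defined above are in scope; the model, data, and hyper-parameter values are illustrative:

```python
# Minimal closure-based training step with SPSmax; values are illustrative.
import torch

model = torch.nn.Linear(10, 1)
criterion = torch.nn.MSELoss()
opt = SPSmax(model.parameters(), model,
             hyperparams={"c": 0.5, "gamma": 2.0},
             Paras={"f_star": 0.0})

X, y = torch.randn(32, 10), torch.randn(32, 1)

def closure():
    opt.zero_grad()                     # reset gradients
    loss = criterion(model(X), y)
    loss.backward()                     # populate p.grad for parameters_to_vector
    return loss

loss = opt.step(closure)                # applies min((f - f*) / (c * ||g||^2), gamma)
```

ALR_SMAG and Bundle are driven the same way; only the hyperparams dict changes ({'c', 'eta_max', 'beta'} and {'cutting_number', 'delta'}, respectively).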