deepliif 1.1.11__py3-none-any.whl → 1.1.12__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between the two package versions as they appear in their respective public registries.
deepliif/data/__init__.py CHANGED
@@ -55,28 +55,28 @@ def get_option_setter(dataset_name):
55
55
  return dataset_class.modify_commandline_options
56
56
 
57
57
 
58
- def create_dataset(opt):
58
+ def create_dataset(opt, phase=None, batch_size=None):
59
59
  """Create a dataset given the option.
60
60
 
61
61
  This function wraps the class CustomDatasetDataLoader.
62
62
  This is the main interface between this package and 'train.py'/'test.py'
63
63
  """
64
- return CustomDatasetDataLoader(opt)
64
+ return CustomDatasetDataLoader(opt, phase=phase if phase else opt.phase, batch_size=batch_size if batch_size else opt.batch_size)
65
65
 
66
66
 
67
67
  class CustomDatasetDataLoader(object):
68
68
  """Wrapper class of Dataset class that performs multi-threaded data loading"""
69
69
 
70
- def __init__(self, opt):
70
+ def __init__(self, opt, phase=None, batch_size=None):
71
71
  """Initialize this class
72
72
 
73
73
  Step 1: create a dataset instance given the name [dataset_mode]
74
74
  Step 2: create a multi-threaded data loader.
75
75
  """
76
- self.batch_size = opt.batch_size
76
+ self.batch_size = batch_size if batch_size else opt.batch_size
77
77
  self.max_dataset_size = opt.max_dataset_size
78
78
  dataset_class = find_dataset_using_name(opt.dataset_mode)
79
- self.dataset = dataset_class(opt)
79
+ self.dataset = dataset_class(opt, phase=phase if phase else opt.phase)
80
80
  print("dataset [%s] was created" % type(self.dataset).__name__)
81
81
 
82
82
  sampler = None
@@ -95,7 +95,7 @@ class CustomDatasetDataLoader(object):
95
95
  self.dataloader = torch.utils.data.DataLoader(
96
96
  self.dataset,
97
97
  sampler=sampler,
98
- batch_size=opt.batch_size,
98
+ batch_size=batch_size,
99
99
  shuffle=not opt.serial_batches if sampler is None else False,
100
100
  num_workers=int(opt.num_threads)
101
101
  )
@@ -106,7 +106,7 @@ class CustomDatasetDataLoader(object):
106
106
  self.dataloader = torch.utils.data.DataLoader(
107
107
  self.dataset,
108
108
  sampler=sampler,
109
- batch_size=opt.batch_size,
109
+ batch_size=batch_size,
110
110
  shuffle=not opt.serial_batches if sampler is None else False,
111
111
  num_workers=int(opt.num_threads),
112
112
  worker_init_fn=seed_worker,
@@ -11,7 +11,7 @@ class AlignedDataset(BaseDataset):
11
11
  During test time, you need to prepare a directory '/path/to/data/test'.
12
12
  """
13
13
 
14
- def __init__(self, opt):
14
+ def __init__(self, opt, phase='train'):
15
15
  """Initialize this dataset class.
16
16
 
17
17
  Parameters:
@@ -19,7 +19,7 @@ class AlignedDataset(BaseDataset):
19
19
  """
20
20
  BaseDataset.__init__(self, opt.dataroot)
21
21
  self.preprocess = opt.preprocess
22
- self.dir_AB = os.path.join(opt.dataroot, opt.phase) # get the image directory
22
+ self.dir_AB = os.path.join(opt.dataroot, phase) # get the image directory
23
23
  self.AB_paths = sorted(make_dataset(self.dir_AB, opt.max_dataset_size)) # get image paths
24
24
  assert(opt.load_size >= opt.crop_size) # crop_size should be smaller than the size of loaded image
25
25
  self.input_nc = opt.output_nc if opt.direction == 'BtoA' else opt.input_nc
@@ -95,7 +95,6 @@ class AlignedDataset(BaseDataset):
95
95
  A = AB.crop((w2 * i, 0, w2 * (i+1), h))
96
96
  A = A_transform(A)
97
97
  A_Array.append(A)
98
-
99
98
  for i in range(self.input_no, self.input_no + self.modalities_no + 1):
100
99
  B = AB.crop((w2 * i, 0, w2 * (i + 1), h))
101
100
  B = B_transform(B)
@@ -1,5 +1,5 @@
1
1
  import os.path
2
- from deepliif.data.base_dataset import BaseDataset, get_transform
2
+ from deepliif.data.base_dataset import BaseDataset, get_params, get_transform
3
3
  from deepliif.data.image_folder import make_dataset
4
4
  from PIL import Image
5
5
  import random
@@ -16,25 +16,39 @@ class UnalignedDataset(BaseDataset):
16
16
  '/path/to/data/testA' and '/path/to/data/testB' during test time.
17
17
  """
18
18
 
19
- def __init__(self, opt):
19
+ def __init__(self, opt, phase='train'):
20
20
  """Initialize this dataset class.
21
21
 
22
22
  Parameters:
23
23
  opt (Option class) -- stores all the experiment flags; needs to be a subclass of BaseOptions
24
24
  """
25
25
  BaseDataset.__init__(self, opt)
26
- self.dir_A = os.path.join(opt.dataroot, opt.phase + 'A') # create a path '/path/to/data/trainA'
27
- self.dir_B = os.path.join(opt.dataroot, opt.phase + 'B') # create a path '/path/to/data/trainB'
26
+ self.opt = opt
27
+ self.input_nc = opt.output_nc if opt.direction == 'BtoA' else opt.input_nc
28
+ self.output_nc = opt.input_nc if opt.direction == 'BtoA' else opt.output_nc
29
+ self.preprocess = opt.preprocess
30
+ self.no_flip = opt.no_flip
31
+ self.modalities_no = opt.modalities_no
32
+ self.seg_no = opt.seg_no
33
+ self.input_no = opt.input_no
34
+ self.seg_gen = opt.seg_gen
35
+ self.load_size = opt.load_size
36
+ self.crop_size = opt.crop_size
37
+ self.model = opt.model
38
+
39
+ self.dir_A = os.path.join(opt.dataroot, phase + 'A') # create a path '/path/to/data/trainA'
40
+ # trainB1/trainB2/trainB3... are organized as elements of DATASET B which is a list
41
+ self.dirs_B = [os.path.join(opt.dataroot, phase + f'B{i}') for i in range(1,self.modalities_no+1)] # create a list of paths ['/path/to/data/trainB',...]
28
42
 
29
43
  self.A_paths = sorted(make_dataset(self.dir_A, opt.max_dataset_size)) # load images from '/path/to/data/trainA'
30
- self.B_paths = sorted(make_dataset(self.dir_B, opt.max_dataset_size)) # load images from '/path/to/data/trainB'
44
+ self.B_paths = [sorted(make_dataset(dir_B, opt.max_dataset_size)) for dir_B in self.dirs_B] # load images from '/path/to/data/trainB', '/path/to/data/trainC', ...
31
45
  self.A_size = len(self.A_paths) # get the size of dataset A
32
- self.B_size = len(self.B_paths) # get the size of dataset B
46
+ self.B_sizes = [len(B_paths) for B_paths in self.B_paths] # get the size of dataset B1, B2, B3, ...
33
47
  btoA = self.opt.direction == 'BtoA'
34
48
  input_nc = self.opt.output_nc if btoA else self.opt.input_nc # get the number of channels of input image
35
49
  output_nc = self.opt.input_nc if btoA else self.opt.output_nc # get the number of channels of output image
36
- self.transform_A = get_transform(self.opt, grayscale=(input_nc == 1))
37
- self.transform_B = get_transform(self.opt, grayscale=(output_nc == 1))
50
+
51
+
38
52
 
39
53
  def __getitem__(self, index):
40
54
  """Return a data point and its metadata information.
@@ -50,22 +64,27 @@ class UnalignedDataset(BaseDataset):
50
64
  """
51
65
  A_path = self.A_paths[index % self.A_size] # make sure index is within then range
52
66
  if self.opt.serial_batches: # make sure index is within then range
53
- index_B = index % self.B_size
67
+ indice_B = [index % B_size for B_size in self.B_sizes]
54
68
  else: # randomize the index for domain B to avoid fixed pairs.
55
- index_B = random.randint(0, self.B_size - 1)
56
- B_path = self.B_paths[index_B]
69
+ indice_B = [random.randint(0, B_size - 1) for B_size in self.B_sizes]
70
+ B_paths = [B_paths[index_B] for B_paths, index_B in zip(self.B_paths, indice_B)]
71
+
57
72
  A_img = Image.open(A_path).convert('RGB')
58
- B_img = Image.open(B_path).convert('RGB')
73
+ B_imgs = [Image.open(B_path).convert('RGB') for B_path in B_paths]
74
+
59
75
  # apply image transformation
60
- A = self.transform_A(A_img)
61
- B = self.transform_B(B_img)
62
-
63
- return {'A': A, 'B': B, 'A_paths': A_path, 'B_paths': B_path}
76
+ transform_params = get_params(self.preprocess, self.load_size, self.crop_size, A_img.size)
77
+ A_transform = get_transform(self.preprocess, self.load_size, self.crop_size, self.no_flip, transform_params, grayscale=(self.input_nc == 1))
78
+ B_transform = get_transform(self.preprocess, self.load_size, self.crop_size, self.no_flip, transform_params, grayscale=(self.output_nc == 1))
79
+ A = A_transform(A_img)
80
+ Bs = [B_transform(B_img) for B_img in B_imgs]
81
+
82
+ return {'A': A, 'Bs': Bs, 'A_paths': A_path, 'B_paths': B_paths}
64
83
 
65
84
  def __len__(self):
66
85
  """Return the total number of images in the dataset.
67
86
 
68
- As we have two datasets with potentially different number of images,
69
- we take a maximum of
87
+
88
+ The effective size of this dataset will be the size of datasetA through which we loop and grab a random/matching image B1/B2/B3... for
70
89
  """
71
- return max(self.A_size, self.B_size)
90
+ return self.A_size #max(self.A_size, self.B_size)
@@ -0,0 +1,282 @@
1
+ import torch
2
+ from packaging import version
3
+ from torch import nn
4
+ import itertools
5
+ from ..util.image_pool import ImagePool
6
+ from .base_model import BaseModel
7
+ from . import networks
8
+ from .networks import get_optimizer
9
+
10
+
11
+ class CycleGANModel(BaseModel):
12
+ """
13
+ This class implements the CycleGAN model, for learning image-to-image translation without paired data.
14
+
15
+ The model training requires '--dataset_mode unaligned' dataset.
16
+ By default, it uses a '--netG resnet_9blocks' ResNet generator,
17
+ a '--netD basic' discriminator (PatchGAN introduced by pix2pix),
18
+ and a least-square GANs objective ('--gan_mode lsgan').
19
+
20
+ CycleGAN paper: https://arxiv.org/pdf/1703.10593.pdf
21
+ """
22
+
23
+ def __init__(self, opt):
24
+ """Initialize the CycleGAN class.
25
+
26
+ Parameters:
27
+ opt (Option class)-- stores all the experiment flags; needs to be a subclass of BaseOptions
28
+ """
29
+ BaseModel.__init__(self, opt)
30
+ self.mod_gen_no = self.opt.modalities_no
31
+ if not hasattr(self.opt,'upsample'):
32
+ self.opt.upsample = 'convtranspose'
33
+ if not hasattr(self.opt,'label_smoothing'):
34
+ self.opt.label_smoothing = 0
35
+
36
+ use_spectral_norm = self.opt.norm == 'spectral'
37
+
38
+ self.loss_G_weights = opt.loss_G_weights
39
+ self.loss_D_weights = opt.loss_D_weights
40
+ self.loss_cyc_weights = [1 / self.mod_gen_no] * self.mod_gen_no
41
+
42
+ self.opt.lambda_identity = 0 # do not use lambda identity for the first trial
43
+ # specify the training losses you want to print out. The training/test scripts will call <BaseModel.get_current_losses>
44
+ self.loss_names = ['D_A', 'G_A', 'cycle_A', 'idt_A', 'D_B', 'G_B', 'cycle_B', 'idt_B']
45
+ # specify the images you want to save/display. The training/test scripts will call <BaseModel.get_current_visuals>
46
+ l_suffix = range(1, self.opt.modalities_no + 1)
47
+ visual_names_A = [f'real_As_{i}' for i in l_suffix] + [f'fake_Bs_{i}' for i in l_suffix] + [f'rec_As_{i}' for i in l_suffix]
48
+ visual_names_B = [f'real_Bs_{i}' for i in l_suffix] + [f'fake_As_{i}' for i in l_suffix] + [f'rec_Bs_{i}' for i in l_suffix]
49
+
50
+ # if self.is_train and self.opt.lambda_identity > 0.0: # if identity loss is used, we also visualize idt_B=G_A(B) ad idt_A=G_A(B)
51
+ # visual_names_A.append('idt_B')
52
+ # visual_names_B.append('idt_A')
53
+
54
+ self.visual_names = visual_names_A + visual_names_B # combine visualizations for A and B
55
+ # specify the models you want to save to the disk. The training/test scripts will call <BaseModel.save_networks> and <BaseModel.load_networks>.
56
+ if self.is_train:
57
+ self.model_names = [f'GA_{i}' for i in l_suffix] + [f'GB_{i}' for i in l_suffix] + [f'DA_{i}' for i in l_suffix] + [f'DB_{i}' for i in l_suffix]
58
+ else: # during test time, only load Gs
59
+ if self.opt.BtoA:
60
+ self.model_names = [f'GB_{i}' for i in l_suffix]
61
+ else:
62
+ self.model_names = [f'GA_{i}' for i in l_suffix]
63
+
64
+ # define networks (both Generators and discriminators)
65
+ # The naming is different from those used in the paper.
66
+ # Code (vs. paper): G_A (G), G_B (F), D_A (D_Y), D_B (D_X)
67
+ if isinstance(opt.net_g, str):
68
+ self.opt.net_g = [self.opt.net_g] * self.mod_gen_no
69
+
70
+ if version.parse(torch.__version__) < version.parse('1.11.0'):
71
+ self.netGA = list()
72
+ self.netGB = list()
73
+ else:
74
+ self.netGA = nn.ModuleList()
75
+ self.netGB = nn.ModuleList()
76
+
77
+ for i in range(self.mod_gen_no):
78
+ if self.is_train or not self.opt.BtoA:
79
+ self.netGA.append(networks.define_G(self.opt.input_nc, self.opt.output_nc, self.opt.ngf, self.opt.net_g[i], self.opt.norm,
80
+ not self.opt.no_dropout, self.opt.init_type, self.opt.init_gain, self.gpu_ids, self.opt.padding,
81
+ upsample=self.opt.upsample))
82
+ if self.is_train or self.opt.BtoA:
83
+ self.netGB.append(networks.define_G(self.opt.output_nc, self.opt.input_nc, self.opt.ngf, self.opt.net_g[i], self.opt.norm,
84
+ not self.opt.no_dropout, self.opt.init_type, self.opt.init_gain, self.gpu_ids, self.opt.padding,
85
+ upsample=self.opt.upsample))
86
+
87
+ if self.is_train: # define a discriminator; conditional GANs need to take both input and output images; Therefore, #channels for D is input_nc + output_nc
88
+ if version.parse(torch.__version__) < version.parse('1.11.0'):
89
+ self.netDA = list()
90
+ self.netDB = list()
91
+ else:
92
+ self.netDA = nn.ModuleList()
93
+ self.netDB = nn.ModuleList()
94
+
95
+ for i in range(self.mod_gen_no):
96
+ self.netDA.append(networks.define_D(self.opt.output_nc, self.opt.ndf, self.opt.net_d,
97
+ self.opt.n_layers_D, self.opt.norm, self.opt.init_type, self.opt.init_gain,
98
+ self.gpu_ids))
99
+ self.netDB.append(networks.define_D(self.opt.input_nc, self.opt.ndf, self.opt.net_d,
100
+ self.opt.n_layers_D, self.opt.norm, self.opt.init_type, self.opt.init_gain,
101
+ self.gpu_ids))
102
+
103
+
104
+
105
+ if self.is_train:
106
+ if opt.lambda_identity > 0.0: # only works when input and output images have the same number of channels
107
+ assert(opt.input_nc == opt.output_nc)
108
+ self.fake_A_pools = [ImagePool(opt.pool_size) for _ in range(self.opt.modalities_no)] # create image buffer to store previously generated images
109
+ self.fake_B_pools = [ImagePool(opt.pool_size) for _ in range(self.opt.modalities_no)] # create image buffer to store previously generated images
110
+
111
+ # define loss functions
112
+ # label smoothing currently only applies to discriminator losses & generatoe of lsgan/vanilla
113
+ self.criterionGAN = networks.GANLoss(opt.gan_mode, label_smoothing=self.opt.label_smoothing).to(self.device) # define GAN loss.
114
+ self.criterionCycle = torch.nn.L1Loss()
115
+ self.criterionIdt = torch.nn.L1Loss()
116
+
117
+ self.criterionSmoothL1 = torch.nn.SmoothL1Loss()
118
+ self.criterionVGG = networks.VGGLoss().to(self.device)
119
+
120
+
121
+ # initialize optimizers
122
+ params = []
123
+ for i in range(len(self.netGA)):
124
+ params += list(self.netGA[i].parameters())
125
+ for i in range(len(self.netGB)):
126
+ params += list(self.netGB[i].parameters())
127
+ try:
128
+ self.optimizer_G = get_optimizer(opt.optimizer)(params, lr=opt.lr_g, betas=(opt.beta1, 0.999))
129
+ except:
130
+ print(f'betas are not used for optimizer torch.optim.{opt.optimizer} in generators')
131
+ self.optimizer_G = get_optimizer(opt.optimizer)(params, lr=opt.lr_g)
132
+
133
+ params = []
134
+ for i in range(len(self.netDA)):
135
+ params += list(self.netDA[i].parameters())
136
+ for i in range(len(self.netDB)):
137
+ params += list(self.netDB[i].parameters())
138
+
139
+ # a smaller learning rate for discriminators to postpone training failure due to discriminators quickly become too strong
140
+ try:
141
+ self.optimizer_D = get_optimizer(opt.optimizer)(params, lr=opt.lr_d, betas=(opt.beta1, 0.999))
142
+ except:
143
+ print(f'betas are not used for optimizer torch.optim.{opt.optimizer} in generators')
144
+ self.optimizer_D = get_optimizer(opt.optimizer)(params, lr=opt.lr_d)
145
+
146
+
147
+ self.optimizers.append(self.optimizer_G)
148
+ self.optimizers.append(self.optimizer_D)
149
+
150
+ def set_input(self, input):
151
+ """Unpack input data from the dataloader and perform necessary pre-processing steps.
152
+
153
+ Parameters:
154
+ input (dict): include the data itself and its metadata information.
155
+
156
+ The option 'direction' can be used to swap domain A and domain B.
157
+ """
158
+ self.real_As = [input['A'].to(self.device) for _ in range(self.opt.modalities_no)]
159
+ self.real_Bs = [x.to(self.device) for x in input['Bs']]
160
+ self.image_paths = input['A_paths']
161
+
162
+ def forward(self):
163
+ """
164
+ Run forward pass; called by both functions <optimize_parameters> and <test>.
165
+ During inference, some output list could be empty. For example, if only netGAs are loaded,
166
+ there will not be valid elements in self.rec_As and self.fake_As.
167
+ """
168
+ self.fake_Bs = [netGA(real_A) for netGA, real_A in zip(self.netGA, self.real_As)] # G_A(A)
169
+ self.rec_As = [netGB(fake_B) for netGB, fake_B in zip(self.netGB, self.fake_Bs)] # G_B(G_A(A))
170
+
171
+ self.fake_As = [netGB(real_B) for netGB, real_B in zip(self.netGB, self.real_Bs)] # G_B(B)
172
+ self.rec_Bs = [netGA(fake_A) for netGA, fake_A in zip(self.netGA, self.fake_As)] # G_A(G_B(B))
173
+
174
+
175
+ def backward_D_basic(self, netD, real, fake, scale_factor=1):
176
+ """Calculate GAN loss for the discriminator
177
+
178
+ Parameters:
179
+ netD (network) -- the discriminator D
180
+ real (tensor array) -- real images
181
+ fake (tensor array) -- images generated by a generator
182
+
183
+ Return the discriminator loss.
184
+ We also call loss_D.backward() to calculate the gradients.
185
+ """
186
+ # Real
187
+ pred_real = netD(real)
188
+ loss_D_real = self.criterionGAN(pred_real, True)
189
+ # Fake
190
+ pred_fake = netD(fake.detach())
191
+ loss_D_fake = self.criterionGAN(pred_fake, False)
192
+ # Combined loss and calculate gradients
193
+ loss_D = (loss_D_real + loss_D_fake) * 0.5 * scale_factor
194
+ loss_D.backward()
195
+ return loss_D
196
+
197
+ def backward_D_A(self):
198
+ """Calculate GAN loss for discriminator D_A"""
199
+ fake_Bs = [fake_B_pool.query(fake_B) for fake_B_pool, fake_B in zip(self.fake_B_pools, self.fake_Bs)]
200
+ real_Bs = self.real_Bs
201
+
202
+ self.loss_D_A = 0
203
+ for i, (netDA, real_B, fake_B) in enumerate(zip(self.netDA, real_Bs, fake_Bs)):
204
+ self.loss_D_A += self.backward_D_basic(netDA, real_B, fake_B, scale_factor=self.loss_D_weights[i])
205
+ #self.loss_D_A.backward()
206
+
207
+ def backward_D_B(self):
208
+ """Calculate GAN loss for discriminator D_B"""
209
+ fake_As = [fake_A_pool.query(fake_A) for fake_A_pool, fake_A in zip(self.fake_A_pools, self.fake_As)]
210
+ real_As = self.real_As
211
+
212
+ self.loss_D_B = 0
213
+ for i, (netDB, real_A, fake_A) in enumerate(zip(self.netDB, real_As, fake_As)):
214
+ self.loss_D_B += self.backward_D_basic(netDB, real_A, fake_A, scale_factor=self.loss_D_weights[i])
215
+ #self.loss_D_B.backward()
216
+
217
+ def backward_G(self):
218
+ """Calculate the loss for generators G_A and G_B"""
219
+ # default lambda values from cyclegan implementation:
220
+ # https://github.com/junyanz/pytorch-CycleGAN-and-pix2pix/blob/c3268edd50ec37a81600c9b981841f48929671b8/models/cycle_gan_model.py#L41
221
+ lambda_idt = 0#self.opt.lambda_identity # identity loss is used to preserve color consistency between input and output images, which we do not want to encourage
222
+ lambda_A = 10#self.opt.lambda_A
223
+ lambda_B = 10#self.opt.lambda_B
224
+ # Identity loss
225
+ if lambda_idt > 0:
226
+ # G_A should be identity if real_B is fed: ||G_A(B) - B||
227
+ self.idt_A = self.netG_A(self.real_B)
228
+ self.loss_idt_A = self.criterionIdt(self.idt_A, self.real_B) * lambda_B * lambda_idt
229
+ # G_B should be identity if real_A is fed: ||G_B(A) - A||
230
+ self.idt_B = self.netG_B(self.real_A)
231
+ self.loss_idt_B = self.criterionIdt(self.idt_B, self.real_A) * lambda_A * lambda_idt
232
+ else:
233
+ self.loss_idt_A = 0
234
+ self.loss_idt_B = 0
235
+
236
+ # GAN loss D_A(G_A(A))
237
+ self.loss_G_A = 0
238
+ for i, (netDA, fake_B, real_B) in enumerate(zip(self.netDA, self.fake_Bs, self.real_Bs)):
239
+ self.loss_G_A += self.criterionGAN(netDA(fake_B), True) * self.loss_G_weights[i]
240
+ self.loss_G_A += self.criterionVGG(fake_B, real_B) * self.loss_G_weights[i]
241
+
242
+ # GAN loss D_B(G_B(B))
243
+ self.loss_G_B = 0
244
+ for i, (netDB, fake_A, real_A) in enumerate(zip(self.netDB, self.fake_As, self.real_As)):
245
+ self.loss_G_B += self.criterionGAN(netDB(fake_A), True) * self.loss_G_weights[i]
246
+ self.loss_G_B += self.criterionVGG(fake_A, real_A) * self.loss_G_weights[i]
247
+
248
+ # Forward cycle loss || G_B(G_A(A)) - A||
249
+ self.loss_cycle_A = 0
250
+ for i, (rec_A, real_A) in enumerate(zip(self.rec_As, self.real_As)):
251
+ self.loss_cycle_A += self.criterionCycle(rec_A, real_A) * lambda_A * self.loss_cyc_weights[i]
252
+ # Backward cycle loss || G_A(G_B(B)) - B||
253
+ self.loss_cycle_B = 0
254
+ for i, (rec_B, real_B) in enumerate(zip(self.rec_Bs, self.real_Bs)):
255
+ self.loss_cycle_B += self.criterionCycle(rec_B, real_B) * lambda_B * self.loss_cyc_weights[i]
256
+
257
+ # VGG loss
258
+ # self.loss_G_VGG = self.criterionVGG(self.fake_B_1, self.real_B_1) * self.opt.lambda_feat
259
+
260
+ # smooth L1
261
+ # self.loss_G_A_L1 = self.criterionSmoothL1(self.fake_B_1, self.real_B_1) * self.opt.lambda_L1
262
+
263
+ # combined loss and calculate gradients
264
+ self.loss_G = self.loss_G_A + self.loss_G_B + self.loss_cycle_A + self.loss_cycle_B + self.loss_idt_A + self.loss_idt_B
265
+ self.loss_G.backward()
266
+
267
+ def optimize_parameters(self):
268
+ """Calculate losses, gradients, and update network weights; called in every training iteration"""
269
+ # forward
270
+ self.forward() # compute fake images and reconstruction images.
271
+ # G_A and G_B
272
+ self.set_requires_grad(self.netDA + self.netDB, False) # Ds require no gradients when optimizing Gs
273
+ self.optimizer_G.zero_grad() # set G_A and G_B's gradients to zero
274
+ self.backward_G() # calculate gradients for G_A and G_B
275
+ self.optimizer_G.step() # update G_A and G_B's weights
276
+
277
+ # D_A and D_B
278
+ self.set_requires_grad(self.netDA + self.netDB, True)
279
+ self.optimizer_D.zero_grad() # set D_A and D_B's gradients to zero
280
+ self.backward_D_A() # calculate gradients for D_A
281
+ self.backward_D_B() # calculate graidents for D_B
282
+ self.optimizer_D.step() # update D_A and D_B's weights
@@ -1,6 +1,7 @@
1
1
  import torch
2
2
  from .base_model import BaseModel
3
3
  from . import networks
4
+ from .networks import get_optimizer
4
5
 
5
6
 
6
7
  class DeepLIIFExtModel(BaseModel):
@@ -18,19 +19,16 @@ class DeepLIIFExtModel(BaseModel):
18
19
  # self.seg_gen_no = self.opt.modalities_no + 1
19
20
 
20
21
  # weights of the modalities in generating segmentation mask
21
- self.seg_weights = [0, 0, 0]
22
- if opt.seg_gen:
23
- self.seg_weights = [0.3] * self.mod_gen_no
24
- self.seg_weights[1] = 0.4
22
+ self.seg_weights = opt.seg_weights
25
23
 
26
24
  # self.seg_weights = opt.seg_weights
27
25
  # assert len(self.seg_weights) == self.seg_gen_no, 'The number of the segmentation weights (seg_weights) is not equal to the number of target images (modalities_no)!'
28
26
  # print(self.seg_weights)
29
27
  # loss weights in calculating the final loss
30
- self.loss_G_weights = [1 / self.mod_gen_no] * self.mod_gen_no
28
+ self.loss_G_weights = opt.loss_G_weights
31
29
  self.loss_GS_weights = [1 / self.mod_gen_no] * self.mod_gen_no
32
30
 
33
- self.loss_D_weights = [1 / self.mod_gen_no] * self.mod_gen_no
31
+ self.loss_D_weights = opt.loss_D_weights
34
32
  self.loss_DS_weights = [1 / self.mod_gen_no] * self.mod_gen_no
35
33
 
36
34
  # self.gpu_ids is a possibly modifed one for model initialization
@@ -72,22 +70,19 @@ class DeepLIIFExtModel(BaseModel):
72
70
  self.model_names.extend(['GS_' + str(i)])
73
71
 
74
72
  # define networks (both generator and discriminator)
73
+ if isinstance(opt.net_g, str):
74
+ self.opt.net_g = [self.opt.net_g] * self.mod_gen_no
75
+ if isinstance(opt.net_gs, str):
76
+ self.opt.net_gs = [self.opt.net_gs]*self.mod_gen_no
75
77
  self.netG = [None for _ in range(self.mod_gen_no)]
76
78
  self.netGS = [None for _ in range(self.mod_gen_no)]
77
79
  for i in range(self.mod_gen_no):
78
- self.netG[i] = networks.define_G(self.opt.input_nc, self.opt.output_nc, self.opt.ngf, self.opt.net_g, self.opt.norm,
80
+ self.netG[i] = networks.define_G(self.opt.input_nc, self.opt.output_nc, self.opt.ngf, self.opt.net_g[i], self.opt.norm,
79
81
  not self.opt.no_dropout, self.opt.init_type, self.opt.init_gain, self.gpu_ids, self.opt.padding)
80
- print('***************************************')
81
- print(self.opt.input_nc, self.opt.output_nc, self.opt.ngf, self.opt.net_g, self.opt.norm,
82
- not self.opt.no_dropout, self.opt.init_type, self.opt.init_gain, self.gpu_ids, self.opt.padding)
83
- print('***************************************')
82
+
84
83
  for i in range(self.mod_gen_no):
85
84
  if self.opt.seg_gen:
86
- # if i == 0:
87
- # self.netGS[i] = networks.define_G(self.opt.input_nc, self.opt.output_nc, self.opt.ngf, self.opt.net_gs, self.opt.norm,
88
- # not self.opt.no_dropout, self.opt.init_type, self.opt.init_gain, self.gpu_ids)
89
- # else:
90
- self.netGS[i] = networks.define_G(self.opt.input_nc * 3, self.opt.output_nc, self.opt.ngf, self.opt.net_gs, self.opt.norm,
85
+ self.netGS[i] = networks.define_G(self.opt.input_nc * 3, self.opt.output_nc, self.opt.ngf, self.opt.net_gs[i], self.opt.norm,
91
86
  not self.opt.no_dropout, self.opt.init_type, self.opt.init_gain, self.gpu_ids)
92
87
 
93
88
  if self.is_train: # define a discriminator; conditional GANs need to take both input and output images; Therefore, #channels for D is input_nc + output_nc
@@ -99,11 +94,6 @@ class DeepLIIFExtModel(BaseModel):
99
94
  self.gpu_ids)
100
95
  for i in range(self.mod_gen_no):
101
96
  if self.opt.seg_gen:
102
- # if i == 0:
103
- # self.netDS[i] = networks.define_D(self.opt.input_nc + self.opt.output_nc, self.opt.ndf, self.opt.net_ds,
104
- # self.opt.n_layers_D, self.opt.norm, self.opt.init_type, self.opt.init_gain,
105
- # self.gpu_ids)
106
- # else:
107
97
  self.netDS[i] = networks.define_D(self.opt.input_nc * 3 + self.opt.output_nc, self.opt.ndf, self.opt.net_ds,
108
98
  self.opt.n_layers_D, self.opt.norm, self.opt.init_type, self.opt.init_gain,
109
99
  self.gpu_ids)
@@ -113,9 +103,7 @@ class DeepLIIFExtModel(BaseModel):
113
103
  # define loss functions
114
104
  self.criterionGAN_mod = networks.GANLoss(self.opt.gan_mode).to(self.device)
115
105
  self.criterionGAN_seg = networks.GANLoss(self.opt.gan_mode_s).to(self.device)
116
-
117
106
  self.criterionSmoothL1 = torch.nn.SmoothL1Loss()
118
-
119
107
  self.criterionVGG = networks.VGGLoss().to(self.device)
120
108
 
121
109
  # initialize optimizers; schedulers will be automatically created by function <BaseModel.setup>.
@@ -125,7 +113,11 @@ class DeepLIIFExtModel(BaseModel):
125
113
  for i in range(len(self.netGS)):
126
114
  if self.netGS[i]:
127
115
  params += list(self.netGS[i].parameters())
128
- self.optimizer_G = torch.optim.Adam(params, lr=opt.lr, betas=(opt.beta1, 0.999))
116
+ try:
117
+ self.optimizer_G = get_optimizer(opt.optimizer)(params, lr=opt.lr_g, betas=(opt.beta1, 0.999))
118
+ except:
119
+ print(f'betas are not used for optimizer torch.optim.{opt.optimizer} in generators')
120
+ self.optimizer_G = get_optimizer(opt.optimizer)(params, lr=opt.lr_g)
129
121
 
130
122
  params = []
131
123
  for i in range(len(self.netD)):
@@ -133,7 +125,11 @@ class DeepLIIFExtModel(BaseModel):
133
125
  for i in range(len(self.netDS)):
134
126
  if self.netDS[i]:
135
127
  params += list(self.netDS[i].parameters())
136
- self.optimizer_D = torch.optim.Adam(params, lr=opt.lr, betas=(opt.beta1, 0.999))
128
+ try:
129
+ self.optimizer_D = get_optimizer(opt.optimizer)(params, lr=opt.lr_d, betas=(opt.beta1, 0.999))
130
+ except:
131
+ print(f'betas are not used for optimizer torch.optim.{opt.optimizer} in discriminators')
132
+ self.optimizer_D = get_optimizer(opt.optimizer)(params, lr=opt.lr_d)
137
133
 
138
134
  self.optimizers.append(self.optimizer_G)
139
135
  self.optimizers.append(self.optimizer_D)
@@ -295,3 +291,29 @@ class DeepLIIFExtModel(BaseModel):
295
291
  self.optimizer_G.zero_grad() # set G's gradients to zero
296
292
  self.backward_G() # calculate graidents for G
297
293
  self.optimizer_G.step() # udpate G's weights
294
+
295
+ def calculate_losses(self):
296
+ """
297
+ Calculate losses but do not optimize parameters. Used in validation loss calculation during training.
298
+ """
299
+ self.forward() # compute fake images: G(A)
300
+ # update D
301
+ for i in range(self.mod_gen_no):
302
+ self.set_requires_grad(self.netD[i], True) # enable backprop for D1
303
+ for i in range(self.mod_gen_no):
304
+ if self.netDS[i]:
305
+ self.set_requires_grad(self.netDS[i], True)
306
+
307
+ self.optimizer_D.zero_grad() # set D's gradients to zero
308
+ self.backward_D() # calculate gradients for D
309
+
310
+ # update G
311
+ for i in range(self.mod_gen_no):
312
+ self.set_requires_grad(self.netD[i], False)
313
+ for i in range(self.mod_gen_no):
314
+ if self.netDS[i]:
315
+ self.set_requires_grad(self.netDS[i], False)
316
+
317
+ self.optimizer_G.zero_grad() # set G's gradients to zero
318
+ self.backward_G() # calculate graidents for G
319
+