PyPI - hcpdiff - Versions diffs - 0.9.1__py3-none-any.whl → 2.2__py3-none-any.whl - Mend

hcpdiff 0.9.1py3-none-any.whl → 2.2py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (211) hide show

hcpdiff/__init__.py +4 -4
hcpdiff/ckpt_manager/__init__.py +4 -5
hcpdiff/ckpt_manager/ckpt.py +24 -0
hcpdiff/ckpt_manager/format/__init__.py +4 -0
hcpdiff/ckpt_manager/format/diffusers.py +59 -0
hcpdiff/ckpt_manager/format/emb.py +21 -0
hcpdiff/ckpt_manager/format/lora_webui.py +252 -0
hcpdiff/ckpt_manager/format/sd_single.py +41 -0
hcpdiff/ckpt_manager/loader.py +64 -0
hcpdiff/data/__init__.py +4 -28
hcpdiff/data/cache/__init__.py +1 -0
hcpdiff/data/cache/vae.py +102 -0
hcpdiff/data/dataset.py +20 -0
hcpdiff/data/handler/__init__.py +3 -0
hcpdiff/data/handler/controlnet.py +18 -0
hcpdiff/data/handler/diffusion.py +90 -0
hcpdiff/data/handler/text.py +111 -0
hcpdiff/data/source/__init__.py +3 -3
hcpdiff/data/source/folder_class.py +12 -29
hcpdiff/data/source/text.py +40 -0
hcpdiff/data/source/text2img.py +36 -74
hcpdiff/data/source/text2img_cond.py +9 -15
hcpdiff/diffusion/__init__.py +0 -0
hcpdiff/diffusion/noise/__init__.py +2 -0
hcpdiff/diffusion/noise/pyramid_noise.py +42 -0
hcpdiff/diffusion/noise/zero_terminal.py +39 -0
hcpdiff/diffusion/sampler/__init__.py +5 -0
hcpdiff/diffusion/sampler/base.py +72 -0
hcpdiff/diffusion/sampler/ddpm.py +20 -0
hcpdiff/diffusion/sampler/diffusers.py +66 -0
hcpdiff/diffusion/sampler/edm.py +22 -0
hcpdiff/diffusion/sampler/sigma_scheduler/__init__.py +3 -0
hcpdiff/diffusion/sampler/sigma_scheduler/base.py +14 -0
hcpdiff/diffusion/sampler/sigma_scheduler/ddpm.py +197 -0
hcpdiff/diffusion/sampler/sigma_scheduler/edm.py +48 -0
hcpdiff/easy/__init__.py +2 -0
hcpdiff/easy/cfg/__init__.py +3 -0
hcpdiff/easy/cfg/sd15_train.py +207 -0
hcpdiff/easy/cfg/sdxl_train.py +147 -0
hcpdiff/easy/cfg/t2i.py +228 -0
hcpdiff/easy/model/__init__.py +2 -0
hcpdiff/easy/model/cnet.py +31 -0
hcpdiff/easy/model/loader.py +79 -0
hcpdiff/easy/sampler.py +46 -0
hcpdiff/evaluate/__init__.py +1 -0
hcpdiff/evaluate/previewer.py +60 -0
hcpdiff/loss/__init__.py +4 -1
hcpdiff/loss/base.py +41 -0
hcpdiff/loss/gw.py +35 -0
hcpdiff/loss/ssim.py +37 -0
hcpdiff/loss/vlb.py +79 -0
hcpdiff/loss/weighting.py +66 -0
hcpdiff/models/__init__.py +2 -2
hcpdiff/models/cfg_context.py +17 -14
hcpdiff/models/compose/compose_hook.py +44 -23
hcpdiff/models/compose/compose_tokenizer.py +21 -8
hcpdiff/models/compose/sdxl_composer.py +4 -4
hcpdiff/models/controlnet.py +16 -16
hcpdiff/models/lora_base_patch.py +14 -25
hcpdiff/models/lora_layers.py +3 -9
hcpdiff/models/lora_layers_patch.py +14 -24
hcpdiff/models/text_emb_ex.py +84 -6
hcpdiff/models/textencoder_ex.py +54 -18
hcpdiff/models/wrapper/__init__.py +3 -0
hcpdiff/models/wrapper/pixart.py +19 -0
hcpdiff/models/wrapper/sd.py +218 -0
hcpdiff/models/wrapper/utils.py +20 -0
hcpdiff/parser/__init__.py +1 -0
hcpdiff/parser/embpt.py +32 -0
hcpdiff/tools/convert_caption_txt2json.py +1 -1
hcpdiff/tools/dataset_generator.py +94 -0
hcpdiff/tools/download_hf_model.py +24 -0
hcpdiff/tools/init_proj.py +3 -21
hcpdiff/tools/lora_convert.py +18 -17
hcpdiff/tools/save_model.py +12 -0
hcpdiff/tools/sd2diffusers.py +1 -1
hcpdiff/train_colo.py +1 -1
hcpdiff/train_deepspeed.py +1 -1
hcpdiff/trainer_ac.py +79 -0
hcpdiff/trainer_ac_single.py +31 -0
hcpdiff/utils/__init__.py +0 -2
hcpdiff/utils/inpaint_pipe.py +7 -2
hcpdiff/utils/net_utils.py +29 -6
hcpdiff/utils/pipe_hook.py +24 -7
hcpdiff/utils/utils.py +21 -4
hcpdiff/workflow/__init__.py +15 -10
hcpdiff/workflow/daam/__init__.py +1 -0
hcpdiff/workflow/daam/act.py +66 -0
hcpdiff/workflow/daam/hook.py +109 -0
hcpdiff/workflow/diffusion.py +118 -128
hcpdiff/workflow/fast.py +31 -0
hcpdiff/workflow/flow.py +67 -0
hcpdiff/workflow/io.py +36 -130
hcpdiff/workflow/model.py +46 -43
hcpdiff/workflow/text.py +60 -47
hcpdiff/workflow/utils.py +32 -12
hcpdiff/workflow/vae.py +37 -38
hcpdiff-2.2.dist-info/METADATA +299 -0
hcpdiff-2.2.dist-info/RECORD +115 -0
{hcpdiff-0.9.1.dist-info → hcpdiff-2.2.dist-info}/WHEEL +1 -1
hcpdiff-2.2.dist-info/entry_points.txt +5 -0
hcpdiff/ckpt_manager/base.py +0 -16
hcpdiff/ckpt_manager/ckpt_diffusers.py +0 -45
hcpdiff/ckpt_manager/ckpt_pkl.py +0 -138
hcpdiff/ckpt_manager/ckpt_safetensor.py +0 -64
hcpdiff/ckpt_manager/ckpt_webui.py +0 -54
hcpdiff/data/bucket.py +0 -358
hcpdiff/data/caption_loader.py +0 -80
hcpdiff/data/cond_dataset.py +0 -40
hcpdiff/data/crop_info_dataset.py +0 -40
hcpdiff/data/data_processor.py +0 -33
hcpdiff/data/pair_dataset.py +0 -146
hcpdiff/data/sampler.py +0 -54
hcpdiff/data/source/base.py +0 -30
hcpdiff/data/utils.py +0 -80
hcpdiff/deprecated/__init__.py +0 -1
hcpdiff/deprecated/cfg_converter.py +0 -81
hcpdiff/deprecated/lora_convert.py +0 -31
hcpdiff/infer_workflow.py +0 -57
hcpdiff/loggers/__init__.py +0 -13
hcpdiff/loggers/base_logger.py +0 -76
hcpdiff/loggers/cli_logger.py +0 -40
hcpdiff/loggers/preview/__init__.py +0 -1
hcpdiff/loggers/preview/image_previewer.py +0 -149
hcpdiff/loggers/tensorboard_logger.py +0 -30
hcpdiff/loggers/wandb_logger.py +0 -31
hcpdiff/loggers/webui_logger.py +0 -9
hcpdiff/loss/min_snr_loss.py +0 -52
hcpdiff/models/layers.py +0 -81
hcpdiff/models/plugin.py +0 -348
hcpdiff/models/wrapper.py +0 -75
hcpdiff/noise/__init__.py +0 -3
hcpdiff/noise/noise_base.py +0 -16
hcpdiff/noise/pyramid_noise.py +0 -50
hcpdiff/noise/zero_terminal.py +0 -44
hcpdiff/train_ac.py +0 -566
hcpdiff/train_ac_single.py +0 -39
hcpdiff/utils/caption_tools.py +0 -105
hcpdiff/utils/cfg_net_tools.py +0 -321
hcpdiff/utils/cfg_resolvers.py +0 -16
hcpdiff/utils/ema.py +0 -52
hcpdiff/utils/img_size_tool.py +0 -248
hcpdiff/vis/__init__.py +0 -3
hcpdiff/vis/base_interface.py +0 -12
hcpdiff/vis/disk_interface.py +0 -48
hcpdiff/vis/webui_interface.py +0 -17
hcpdiff/viser_fast.py +0 -138
hcpdiff/visualizer.py +0 -265
hcpdiff/visualizer_reloadable.py +0 -237
hcpdiff/workflow/base.py +0 -59
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/anime/text2img_anime.yaml +0 -21
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/anime/text2img_anime_lora.yaml +0 -58
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/change_vae.yaml +0 -6
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/euler_a.yaml +0 -8
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/img2img.yaml +0 -10
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/img2img_controlnet.yaml +0 -19
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/inpaint.yaml +0 -11
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/load_lora.yaml +0 -26
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/load_unet_part.yaml +0 -18
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/offload_2GB.yaml +0 -6
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/save_model.yaml +0 -44
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/text2img.yaml +0 -53
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/text2img_DA++.yaml +0 -34
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/text2img_sdxl.yaml +0 -9
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/plugins/plugin_controlnet.yaml +0 -17
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/te_struct.txt +0 -193
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/dataset/base_dataset.yaml +0 -29
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/dataset/regularization_dataset.yaml +0 -31
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/CustomDiffusion.yaml +0 -74
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/DreamArtist++.yaml +0 -135
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/DreamArtist.yaml +0 -45
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/DreamBooth.yaml +0 -62
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/FT_sdxl.yaml +0 -33
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/Lion_optimizer.yaml +0 -17
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/TextualInversion.yaml +0 -41
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/add_logger_tensorboard_wandb.yaml +0 -15
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/controlnet.yaml +0 -53
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/ema.yaml +0 -10
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/fine-tuning.yaml +0 -53
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/locon.yaml +0 -24
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/lora_anime_character.yaml +0 -77
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/lora_conventional.yaml +0 -56
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/lora_sdxl.yaml +0 -41
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/min_snr.yaml +0 -7
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/preview_in_training.yaml +0 -6
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples_noob/DreamBooth.yaml +0 -70
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples_noob/TextualInversion.yaml +0 -45
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples_noob/fine-tuning.yaml +0 -45
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples_noob/lora.yaml +0 -63
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/train_base.yaml +0 -81
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/tuning_base.yaml +0 -42
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/unet_struct.txt +0 -932
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/workflow/highres_fix_latent.yaml +0 -86
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/workflow/highres_fix_pixel.yaml +0 -99
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/workflow/text2img.yaml +0 -59
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/workflow/text2img_lora.yaml +0 -70
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/zero2.json +0 -32
hcpdiff-0.9.1.data/data/hcpdiff/cfgs/zero3.json +0 -39
hcpdiff-0.9.1.data/data/hcpdiff/prompt_tuning_template/caption.txt +0 -1
hcpdiff-0.9.1.data/data/hcpdiff/prompt_tuning_template/name.txt +0 -1
hcpdiff-0.9.1.data/data/hcpdiff/prompt_tuning_template/name_2pt_caption.txt +0 -1
hcpdiff-0.9.1.data/data/hcpdiff/prompt_tuning_template/name_caption.txt +0 -1
hcpdiff-0.9.1.data/data/hcpdiff/prompt_tuning_template/object.txt +0 -27
hcpdiff-0.9.1.data/data/hcpdiff/prompt_tuning_template/object_caption.txt +0 -27
hcpdiff-0.9.1.data/data/hcpdiff/prompt_tuning_template/style.txt +0 -19
hcpdiff-0.9.1.data/data/hcpdiff/prompt_tuning_template/style_caption.txt +0 -19
hcpdiff-0.9.1.dist-info/METADATA +0 -199
hcpdiff-0.9.1.dist-info/RECORD +0 -160
hcpdiff-0.9.1.dist-info/entry_points.txt +0 -2
{hcpdiff-0.9.1.dist-info → hcpdiff-2.2.dist-info/licenses}/LICENSE +0 -0
{hcpdiff-0.9.1.dist-info → hcpdiff-2.2.dist-info}/top_level.txt +0 -0

hcpdiff/data/pair_dataset.py DELETED Viewed

@@ -1,146 +0,0 @@
-"""
-pair_dataset.py
-====================
-    :Name:        text-image pair dataset
-    :Author:      Dong Ziyi
-    :Affiliation: HCP Lab, SYSU
-    :Created:     10/03/2023
-    :Licence:     Apache-2.0
-"""
-import os.path
-from argparse import Namespace
-import cv2
-import torch
-from PIL import Image
-from torch.utils.data import Dataset
-from tqdm.auto import tqdm
-from typing import Tuple
-from hcpdiff.utils.caption_tools import *
-from hcpdiff.utils.utils import get_file_name, get_file_ext
-from .bucket import BaseBucket
-from .source import DataSource, ComposeDataSource
-class TextImagePairDataset(Dataset):
-    """
-    A dataset to prepare the instance and class images with the prompts for fine-tuning the model.
-    It pre-processes the images and the tokenizes prompts.
-    """
-    def __init__(self, tokenizer, tokenizer_repeats: int = 1, att_mask_encode: bool = False,
-                 bucket: BaseBucket = None, source: Dict[str, DataSource] = None, return_path: bool = False,
-                 cache_path:str=None, encoder_attention_mask=False, **kwargs):
-        self.return_path = return_path
-        self.tokenizer = tokenizer
-        self.tokenizer_repeats = tokenizer_repeats
-        self.bucket: BaseBucket = bucket
-        self.att_mask_encode = att_mask_encode
-        self.source = ComposeDataSource(source)
-        self.latents = None  # Cache latents for faster training. Works only without image argumentations.
-        self.cache_path = cache_path
-        self.encoder_attention_mask = encoder_attention_mask
-    def load_data(self, path:str, data_source:DataSource, size:Tuple[int]):
-        image_dict = data_source.load_image(path)
-        image = image_dict['image']
-        att_mask = image_dict.get('att_mask', None)
-        if att_mask is None:
-            data, crop_coord = self.bucket.crop_resize({"img":image}, size)
-            image = data_source.procees_image(data['img'])  # resize to bucket size
-            att_mask = torch.ones((size[1]//8, size[0]//8))
-        else:
-            data, crop_coord = self.bucket.crop_resize({"img":image, "mask":att_mask}, size)
-            image = data_source.procees_image(data['img'])
-            att_mask = torch.tensor(cv2.resize(data['mask'], (size[0]//8, size[1]//8), interpolation=cv2.INTER_LINEAR))
-        return {'img':image, 'mask':att_mask}
-    @torch.no_grad()
-    def cache_latents(self, vae, weight_dtype, device, show_prog=True):
-        if self.cache_path and os.path.exists(self.cache_path):
-            self.latents = torch.load(self.cache_path)
-            return
-        self.latents = {}
-        self.bucket.rest(0)
-        for (path, data_source), size in tqdm(self.bucket, disable=not show_prog):
-            img_name = data_source.get_image_name(path)
-            if img_name not in self.latents:
-                data = self.load_data(path, data_source, size)
-                image = data['img'].unsqueeze(0).to(device, dtype=weight_dtype)
-                latents = vae.encode(image).latent_dist.sample().squeeze(0)
-                data['img'] = (latents*vae.config.scaling_factor).cpu()
-                self.latents[img_name] = data
-        if self.cache_path:
-            torch.save(self.latents, self.cache_path)
-    def __len__(self):
-        return len(self.bucket)
-    def __getitem__(self, index):
-        (path, data_source), size = self.bucket[index]
-        img_name = data_source.get_image_name(path)
-        if self.latents is None:
-            data = self.load_data(path, data_source, size)
-        else:
-            data = self.latents[img_name].copy()
-        prompt_ist = data_source.load_caption(img_name)
-        # tokenize Sp or (Sn, Sp)
-        tokens = self.tokenizer(prompt_ist, truncation=True, padding="max_length", return_tensors="pt",
-                                    max_length=self.tokenizer.model_max_length*self.tokenizer_repeats)
-        data['prompt'] = tokens.input_ids.squeeze()
-        if self.encoder_attention_mask and 'attention_mask' in tokens:
-            data['attn_mask'] = tokens.attention_mask.squeeze()
-        if 'position_ids' in tokens:
-            data['position_ids'] = tokens.position_ids.squeeze()
-        if self.return_path:
-            return data, path
-        else:
-            return data
-    @staticmethod
-    def collate_fn(batch):
-        '''
-        batch: [{img:tensor, prompt:str, ..., plugin_input:{...}},{}]
-        '''
-        has_plugin_input = 'plugin_input' in batch[0]
-        if has_plugin_input:
-            plugin_input = {k:[] for k in batch[0]['plugin_input'].keys()}
-        datas = {k:[] for k in batch[0].keys() if k != 'plugin_input' and k != 'prompt'}
-        sn_list, sp_list = [], []
-        for data in batch:
-            if has_plugin_input:
-                for k, v in data.pop('plugin_input').items():
-                    plugin_input[k].append(v)
-            prompt = data.pop('prompt')
-            if len(prompt.shape) == 2:
-                sn_list.append(prompt[0])
-                sp_list.append(prompt[1])
-            else:
-                sp_list.append(prompt)
-            for k, v in data.items():
-                datas[k].append(v)
-        for k, v in datas.items():
-            datas[k] = torch.stack(v)
-            if k == 'mask':
-                datas[k] = datas[k].unsqueeze(1)
-        sn_list += sp_list
-        datas['prompt'] = torch.stack(sn_list)
-        if has_plugin_input:
-            datas['plugin_input'] = {k:torch.stack(v) for k, v in plugin_input.items()}
-        return datas

hcpdiff/data/sampler.py DELETED Viewed

@@ -1,54 +0,0 @@
-import torch
-from torch.utils.data.distributed import DistributedSampler
-from typing import Iterator
-import platform
-import math
-class DistributedCycleSampler(DistributedSampler):
-    _cycle = 1000
-    def __iter__(self) -> Iterator:
-        def _iter():
-            while True:
-                if self.shuffle:
-                    # deterministically shuffle based on epoch and seed
-                    g = torch.Generator()
-                    g.manual_seed(self.seed + self.epoch)
-                    indices = torch.randperm(len(self.dataset), generator=g).tolist()  # type: ignore[arg-type]
-                else:
-                    indices = list(range(len(self.dataset)))  # type: ignore[arg-type]
-                if not self.drop_last:
-                    # add extra samples to make it evenly divisible
-                    padding_size = self.total_size - len(indices)
-                    if padding_size <= len(indices):
-                        indices += indices[:padding_size]
-                    else:
-                        indices += (indices * math.ceil(padding_size / len(indices)))[:padding_size]
-                else:
-                    # remove tail of data to make it evenly divisible.
-                    indices = indices[:self.total_size]
-                assert len(indices) == self.total_size
-                # subsample
-                indices = indices[self.rank:self.total_size:self.num_replicas]
-                assert len(indices) == self.num_samples
-                for idx in indices:
-                    yield idx
-                self.epoch+=1
-                if self.epoch>=self._cycle:
-                    break
-        return _iter()
-    def __len__(self) -> int:
-        return self.num_samples #*self._cycle
-def get_sampler():
-    # Fix DataLoader frequently reload bugs in windows
-    if platform.system().lower() == 'windows':
-        return DistributedCycleSampler
-    else:
-        return DistributedSampler

hcpdiff/data/source/base.py DELETED Viewed

@@ -1,30 +0,0 @@
-import os
-from typing import Dict, List, Tuple, Any
-class DataSource:
-    def __init__(self, img_root, repeat=1, **kwargs):
-        self.img_root = img_root
-        self.repeat = repeat
-    def get_image_list(self) -> List[Tuple[str, "DataSource"]]:
-        raise NotImplementedError()
-    def procees_image(self, image):
-        raise NotImplementedError()
-    def load_image(self, path) -> Dict[str, Any]:
-        raise NotImplementedError()
-    def get_image_name(self, path: str) -> str:
-        img_root, img_name = os.path.split(path)
-        return img_name.rsplit('.')[0]
-class ComposeDataSource(DataSource):
-    def __init__(self, source_dict: Dict[str, DataSource]):
-        self.source_dict = source_dict
-    def get_image_list(self) -> List[Tuple[str, DataSource]]:
-        img_list = []
-        for source in self.source_dict.values():
-            img_list.extend(source.get_image_list())
-        return img_list

hcpdiff/data/utils.py DELETED Viewed

@@ -1,80 +0,0 @@
-import cv2
-import numpy as np
-from PIL import Image
-from torchvision import transforms as T
-from torchvision.transforms import functional as F
-class DualRandomCrop:
-    def __init__(self, size):
-        self.size = size
-    def __call__(self, img):
-        crop_params = T.RandomCrop.get_params(img['img'], self.size)
-        img['img'] = F.crop(img['img'], *crop_params)
-        if "mask" in img:
-            img['mask'] = self.crop(img['mask'], *crop_params)
-        if "cond" in img:
-            img['cond'] = F.crop(img['cond'], *crop_params)
-        return img, crop_params[:2]
-    @staticmethod
-    def crop(img: np.ndarray, top: int, left: int, height: int, width: int) -> np.ndarray:
-        right = left+width
-        bottom = top+height
-        return img[top:bottom, left:right, ...]
-def resize_crop_fix(img, target_size, mask_interp=cv2.INTER_CUBIC):
-    w, h = img['img'].size
-    if w == target_size[0] and h == target_size[1]:
-        return img, [h,w,0,0,h,w]
-    ratio_img = w/h
-    if ratio_img>target_size[0]/target_size[1]:
-        new_size = (round(ratio_img*target_size[1]), target_size[1])
-        interp_type = Image.LANCZOS if h>target_size[1] else Image.BICUBIC
-    else:
-        new_size = (target_size[0], round(target_size[0]/ratio_img))
-        interp_type = Image.LANCZOS if w>target_size[0] else Image.BICUBIC
-    img['img'] = img['img'].resize(new_size, interp_type)
-    if "mask" in img:
-        img['mask'] = cv2.resize(img['mask'], new_size, interpolation=mask_interp)
-    if "cond" in img:
-        img['cond'] = img['cond'].resize(new_size, interp_type)
-    img, crop_coord = DualRandomCrop(target_size[::-1])(img)
-    return img, [*new_size, *crop_coord[::-1], *target_size]
-def pad_crop_fix(img, target_size):
-    w, h = img['img'].size
-    if w == target_size[0] and h == target_size[1]:
-        return img, (h,w,0,0,h,w)
-    pad_size = [0, 0, max(target_size[0]-w, 0), max(target_size[1]-h, 0)]
-    if pad_size[2]>0 or pad_size[3]>0:
-        img['img'] = F.pad(img['img'], pad_size)
-        if "mask" in img:
-            img['mask'] = np.pad(img['mask'], ((0, pad_size[3]), (0, pad_size[2])), 'constant', constant_values=(0, 0))
-        if "cond" in img:
-            img['cond'] = F.pad(img['cond'], pad_size)
-    if pad_size[2]>0 and pad_size[3]>0:
-        return img, (h,w,0,0,h,w)  # No need to crop
-    else:
-        img, crop_coord = DualRandomCrop(target_size[::-1])(img)
-        return img, crop_coord
-class CycleData():
-    def __init__(self, data_loader):
-        self.data_loader = data_loader
-    def __iter__(self):
-        self.epoch = 0
-        def cycle():
-            while True:
-                self.data_loader.dataset.bucket.rest(self.epoch)
-                for data in self.data_loader:
-                    yield data
-                self.epoch += 1
-        return cycle()

hcpdiff/deprecated/__init__.py DELETED Viewed

	@@ -1 +0,0 @@
1	- from .lora_convert import convert_to_webui_maybe_old, convert_to_webui_xl_maybe_old

hcpdiff/deprecated/cfg_converter.py DELETED Viewed

@@ -1,81 +0,0 @@
-"""
-train_ac.py
-====================
-    :Name:        convert old cfg format to new format
-    :Author:      Dong Ziyi
-    :Affiliation: HCP Lab, SYSU
-    :Created:     10/03/2023
-    :Licence:     Apache-2.0
-"""
-from omegaconf import ListConfig, DictConfig, OmegaConf
-class DatasetCFGConverter:
-    def convert_source(self, cfg_source:DictConfig):
-        if '_target_' not in cfg_source:
-            cfg_source['_target_'] = 'hcpdiff.data.source.Text2ImageAttMapSource'
-        if 'tag_transforms' in cfg_source:
-            cfg_source['text_transforms'] = cfg_source.pop('tag_transforms')
-    def convert(self, cfg:DictConfig):
-        for dataset in cfg['data'].values():
-            for source in dataset['source'].values():
-                self.convert_source(source)
-        return cfg
-class TrainCFGConverter:
-    def __init__(self):
-        self.dataset_converter = DatasetCFGConverter()
-    def convert_model(self, cfg_model:DictConfig):
-        if 'ema_unet' in cfg_model and 'ema' not in cfg_model:
-            if cfg_model['ema_unet']==0: # no ema
-                cfg_model['ema'] = None
-            else:
-                cfg_model['ema'] = OmegaConf.create({
-                    '_target_': 'hcpdiff.utils.ema.ModelEMA',
-                    '_partial_': True,
-                    'decay_max': cfg_model['ema_unet'],
-                    'power': 0.85
-                })
-        if 'tokenizer' not in cfg_model:
-            cfg_model['tokenizer'] = None
-        if 'noise_scheduler' not in cfg_model:
-            cfg_model['noise_scheduler'] = None
-        if 'unet' not in cfg_model:
-            cfg_model['unet'] = None
-        if 'text_encoder' not in cfg_model:
-            cfg_model['text_encoder'] = None
-        if 'vae' not in cfg_model:
-            cfg_model['vae'] = None
-    def convert_loss(self, cfg_train:DictConfig):
-        if cfg_train['loss']['criterion']['_target_']=='hcpdiff.loss.MSELoss':
-            cfg_train['loss']['criterion']['_target_'] = 'torch.nn.MSELoss'
-    def convert(self, cfg:DictConfig):
-        self.convert_model(cfg['model'])
-        self.convert_loss(cfg['train'])
-        if 'previewer' not in cfg:
-            cfg['previewer'] = None
-        cfg = self.dataset_converter.convert(cfg)
-        return cfg
-class InferCFGConverter:
-    def convert(self, cfg:DictConfig):
-        if 'encoder_attention_mask' not in cfg:
-            cfg['encoder_attention_mask'] = False
-        if 'amp' not in cfg:
-            if cfg['dtype']=='amp':
-                cfg['dtype'] = 'fp32'
-                cfg['amp'] = True
-            else:
-                cfg['amp'] = False
-        return cfg

hcpdiff/deprecated/lora_convert.py DELETED Viewed

@@ -1,31 +0,0 @@
-def convert_to_webui_maybe_old(new_func):
-    def convert_to_webui_(self, state, prefix):
-        sd_covert = {}
-        for k, v in state.items():
-            # new lora format
-            if k.endswith('W_down'):
-                return new_func(self, state, prefix)
-            # old lora format
-            model_k, lora_k = k.split('.___.' if ('alpha' in k or 'scale' in k) else '.___.layer.', 1)
-            sd_covert[f"{prefix}{model_k.replace('.', '_')}.{lora_k}"] = v
-        return sd_covert
-    return convert_to_webui_
-def convert_to_webui_xl_maybe_old(new_func):
-    def convert_to_webui_xl_(self, state, prefix):
-        sd_convert = {}
-        for k, v in state.items():
-            # new lora format
-            if k.endswith('W_down'):
-                return new_func(self, state, prefix)
-            # old lora format
-            model_k, lora_k = k.split('.___.' if ('alpha' in k or 'scale' in k) else '.___.layer.', 1)
-            new_k = f"{prefix}{model_k.replace('.', '_')}.{lora_k}"
-            if 'clip' in new_k:
-                new_k = new_k.replace('_clip_B', '1') if 'clip_B' in new_k else new_k.replace('_clip_bigG', '2')
-            sd_convert[new_k] = v
-        return sd_convert
-    return convert_to_webui_xl_

hcpdiff/infer_workflow.py DELETED Viewed

@@ -1,57 +0,0 @@
-import argparse
-import torch
-import hydra
-from omegaconf import OmegaConf, DictConfig
-from easydict import EasyDict
-from hcpdiff.utils.utils import load_config_with_cli
-from .workflow import MemoryMixin
-from copy import deepcopy
-class WorkflowRunner:
-    def __init__(self, cfgs):
-        self.cfgs_raw = deepcopy(cfgs)
-        self.cfgs = OmegaConf.structured(cfgs, flags={"allow_objects": True})
-        OmegaConf.resolve(self.cfgs)
-        self.memory = EasyDict(**hydra.utils.instantiate(self.cfgs.memory))
-        self.attach_memory(self.cfgs)
-    def start(self):
-        prepare_actions = hydra.utils.instantiate(self.cfgs.prepare)
-        states = self.run(prepare_actions, {'cfgs': self.cfgs_raw})
-        actions = hydra.utils.instantiate(self.cfgs.actions)
-        states = self.run(actions, states)
-    def attach_memory(self, cfgs):
-        if OmegaConf.is_dict(cfgs):
-            if '_target_' in cfgs and cfgs['_target_'].endswith('.from_memory'):
-                cfgs._set_flag('allow_objects', True)
-                cfgs['memory'] = self.memory
-            else:
-                for v in cfgs.values():
-                    self.attach_memory(v)
-        elif OmegaConf.is_list(cfgs):
-            for v in cfgs:
-                self.attach_memory(v)
-    @torch.inference_mode()
-    def run(self, actions, states):
-        N_steps = len(actions)
-        for step, act in enumerate(actions):
-            print(f'[{step+1}/{N_steps}] action: {type(act).__name__}')
-            if isinstance(act, MemoryMixin):
-                states = act(memory=self.memory, **states)
-            else:
-                states = act(**states)
-            print(f'states: {", ".join(states.keys())}')
-        return states
-if __name__ == '__main__':
-    parser = argparse.ArgumentParser(description='HCP-Diffusion workflow')
-    parser.add_argument('--cfg', type=str, default='')
-    args, cfg_args = parser.parse_known_args()
-    cfgs = load_config_with_cli(args.cfg, args_list=cfg_args)  # skip --cfg
-    runner = WorkflowRunner(cfgs)
-    runner.start()

hcpdiff/loggers/__init__.py DELETED Viewed

@@ -1,13 +0,0 @@
-from .base_logger import BaseLogger, LoggerGroup
-from .cli_logger import CLILogger
-from .webui_logger import WebUILogger
-try:
-    from .tensorboard_logger import TBLogger
-except:
-    print('tensorboard is not available')
-try:
-    from .wandb_logger import WanDBLogger
-except:
-    print('wandb is not available')

hcpdiff/loggers/base_logger.py DELETED Viewed

@@ -1,76 +0,0 @@
-from typing import Dict, Any, List
-from PIL import Image
-from .preview import ImagePreviewer
-class BaseLogger:
-    def __init__(self, exp_dir, out_path, enable_log_image=False, log_step=10, image_log_step=200):
-        self.exp_dir = exp_dir
-        self.out_path = out_path
-        self.enable_log_image = enable_log_image
-        self.log_step = log_step
-        self.image_log_step = image_log_step
-        self.enable_log = True
-        self.previewer_list: List[ImagePreviewer] = []
-    def enable(self):
-        self.enable_log = True
-    def disable(self):
-        self.enable_log = False
-    def add_previewer(self, previewer: ImagePreviewer):
-        self.previewer_list.append(previewer)
-    def info(self, info):
-        if self.enable_log:
-            self._info(info)
-    def _info(self, info):
-        raise NotImplementedError()
-    def log(self, datas: Dict[str, Any], step: int = 0):
-        if self.enable_log and step%self.log_step == 0:
-            self._log(datas, step)
-    def _log(self, datas: Dict[str, Any], step: int = 0):
-        raise NotImplementedError()
-    def log_image(self, imgs: Dict[str, Image.Image], step: int = 0):
-        if self.enable_log and self.enable_log_image and step%self.image_log_step == 0:
-            self._log_image(imgs, step)
-    def _log_image(self, imgs: Dict[str, Image.Image], step: int = 0):
-        raise NotImplementedError()
-class LoggerGroup:
-    def __init__(self, logger_list: List[BaseLogger]):
-        self.logger_list = logger_list
-    def enable(self):
-        for logger in self.logger_list:
-            logger.enable()
-    def disable(self):
-        for logger in self.logger_list:
-            logger.disable()
-    def add_previewer(self, previewer):
-        for logger in self.logger_list:
-            logger.add_previewer(previewer)
-    def info(self, info):
-        for logger in self.logger_list:
-            logger.info(info)
-    def log(self, datas: Dict[str, Any], step: int = 0):
-        for logger in self.logger_list:
-            logger.log(datas, step)
-    def log_image(self, imgs: Dict[str, Image.Image], step: int = 0):
-        for logger in self.logger_list:
-            logger.log_image(imgs, step)
-    def __len__(self):
-        return len(self.logger_list)

hcpdiff/loggers/cli_logger.py DELETED Viewed

@@ -1,40 +0,0 @@
-import os
-from typing import Dict, Any
-from PIL import Image
-from loguru import logger
-from .base_logger import BaseLogger
-class CLILogger(BaseLogger):
-    def __init__(self, exp_dir, out_path, enable_log_image=False, log_step=10, image_log_step=200,
-                 img_log_dir='preview', img_ext='png', img_quality=95):
-        super().__init__(exp_dir, out_path, enable_log_image, log_step, image_log_step)
-        if exp_dir is not None:  # exp_dir is only available in local main process
-            logger.add(os.path.join(exp_dir, out_path))
-            if enable_log_image:
-                self.img_log_dir = os.path.join(exp_dir, img_log_dir)
-                os.makedirs(self.img_log_dir, exist_ok=True)
-            self.img_ext = img_ext
-            self.img_quality = img_quality
-        else:
-            self.disable()
-    def enable(self):
-        super(CLILogger, self).enable()
-        logger.enable("__main__")
-    def disable(self):
-        super(CLILogger, self).disable()
-        logger.disable("__main__")
-    def _info(self, info):
-        logger.info(info)
-    def _log(self, datas: Dict[str, Any], step: int = 0):
-        logger.info(', '.join([f"{k} = {v['format'].format(*v['data'])}" for k, v in datas.items()]))
-    def _log_image(self, imgs: Dict[str, Image.Image], step: int = 0):
-        logger.info(f'log {len(imgs)} images')
-        for name, img in imgs.items():
-            img.save(os.path.join(self.img_log_dir, f'{step}-{name}.{self.img_ext}'), quality=self.img_quality)

hcpdiff/loggers/preview/__init__.py DELETED Viewed

	@@ -1 +0,0 @@
1	- from .image_previewer import ImagePreviewer

hcpdiff 0.9.1__py3-none-any.whl → 2.2__py3-none-any.whl

hcpdiff 0.9.1py3-none-any.whl → 2.2py3-none-any.whl