hcpdiff 0.9.1__py3-none-any.whl → 2.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (211)
  1. hcpdiff/__init__.py +4 -4
  2. hcpdiff/ckpt_manager/__init__.py +4 -5
  3. hcpdiff/ckpt_manager/ckpt.py +24 -0
  4. hcpdiff/ckpt_manager/format/__init__.py +4 -0
  5. hcpdiff/ckpt_manager/format/diffusers.py +59 -0
  6. hcpdiff/ckpt_manager/format/emb.py +21 -0
  7. hcpdiff/ckpt_manager/format/lora_webui.py +252 -0
  8. hcpdiff/ckpt_manager/format/sd_single.py +41 -0
  9. hcpdiff/ckpt_manager/loader.py +64 -0
  10. hcpdiff/data/__init__.py +4 -28
  11. hcpdiff/data/cache/__init__.py +1 -0
  12. hcpdiff/data/cache/vae.py +102 -0
  13. hcpdiff/data/dataset.py +20 -0
  14. hcpdiff/data/handler/__init__.py +3 -0
  15. hcpdiff/data/handler/controlnet.py +18 -0
  16. hcpdiff/data/handler/diffusion.py +90 -0
  17. hcpdiff/data/handler/text.py +111 -0
  18. hcpdiff/data/source/__init__.py +3 -3
  19. hcpdiff/data/source/folder_class.py +12 -29
  20. hcpdiff/data/source/text.py +40 -0
  21. hcpdiff/data/source/text2img.py +36 -74
  22. hcpdiff/data/source/text2img_cond.py +9 -15
  23. hcpdiff/diffusion/__init__.py +0 -0
  24. hcpdiff/diffusion/noise/__init__.py +2 -0
  25. hcpdiff/diffusion/noise/pyramid_noise.py +42 -0
  26. hcpdiff/diffusion/noise/zero_terminal.py +39 -0
  27. hcpdiff/diffusion/sampler/__init__.py +5 -0
  28. hcpdiff/diffusion/sampler/base.py +72 -0
  29. hcpdiff/diffusion/sampler/ddpm.py +20 -0
  30. hcpdiff/diffusion/sampler/diffusers.py +66 -0
  31. hcpdiff/diffusion/sampler/edm.py +22 -0
  32. hcpdiff/diffusion/sampler/sigma_scheduler/__init__.py +3 -0
  33. hcpdiff/diffusion/sampler/sigma_scheduler/base.py +14 -0
  34. hcpdiff/diffusion/sampler/sigma_scheduler/ddpm.py +197 -0
  35. hcpdiff/diffusion/sampler/sigma_scheduler/edm.py +48 -0
  36. hcpdiff/easy/__init__.py +2 -0
  37. hcpdiff/easy/cfg/__init__.py +3 -0
  38. hcpdiff/easy/cfg/sd15_train.py +207 -0
  39. hcpdiff/easy/cfg/sdxl_train.py +147 -0
  40. hcpdiff/easy/cfg/t2i.py +228 -0
  41. hcpdiff/easy/model/__init__.py +2 -0
  42. hcpdiff/easy/model/cnet.py +31 -0
  43. hcpdiff/easy/model/loader.py +79 -0
  44. hcpdiff/easy/sampler.py +46 -0
  45. hcpdiff/evaluate/__init__.py +1 -0
  46. hcpdiff/evaluate/previewer.py +60 -0
  47. hcpdiff/loss/__init__.py +4 -1
  48. hcpdiff/loss/base.py +41 -0
  49. hcpdiff/loss/gw.py +35 -0
  50. hcpdiff/loss/ssim.py +37 -0
  51. hcpdiff/loss/vlb.py +79 -0
  52. hcpdiff/loss/weighting.py +66 -0
  53. hcpdiff/models/__init__.py +2 -2
  54. hcpdiff/models/cfg_context.py +17 -14
  55. hcpdiff/models/compose/compose_hook.py +44 -23
  56. hcpdiff/models/compose/compose_tokenizer.py +21 -8
  57. hcpdiff/models/compose/sdxl_composer.py +4 -4
  58. hcpdiff/models/controlnet.py +16 -16
  59. hcpdiff/models/lora_base_patch.py +14 -25
  60. hcpdiff/models/lora_layers.py +3 -9
  61. hcpdiff/models/lora_layers_patch.py +14 -24
  62. hcpdiff/models/text_emb_ex.py +84 -6
  63. hcpdiff/models/textencoder_ex.py +54 -18
  64. hcpdiff/models/wrapper/__init__.py +3 -0
  65. hcpdiff/models/wrapper/pixart.py +19 -0
  66. hcpdiff/models/wrapper/sd.py +218 -0
  67. hcpdiff/models/wrapper/utils.py +20 -0
  68. hcpdiff/parser/__init__.py +1 -0
  69. hcpdiff/parser/embpt.py +32 -0
  70. hcpdiff/tools/convert_caption_txt2json.py +1 -1
  71. hcpdiff/tools/dataset_generator.py +94 -0
  72. hcpdiff/tools/download_hf_model.py +24 -0
  73. hcpdiff/tools/init_proj.py +3 -21
  74. hcpdiff/tools/lora_convert.py +18 -17
  75. hcpdiff/tools/save_model.py +12 -0
  76. hcpdiff/tools/sd2diffusers.py +1 -1
  77. hcpdiff/train_colo.py +1 -1
  78. hcpdiff/train_deepspeed.py +1 -1
  79. hcpdiff/trainer_ac.py +79 -0
  80. hcpdiff/trainer_ac_single.py +31 -0
  81. hcpdiff/utils/__init__.py +0 -2
  82. hcpdiff/utils/inpaint_pipe.py +7 -2
  83. hcpdiff/utils/net_utils.py +29 -6
  84. hcpdiff/utils/pipe_hook.py +24 -7
  85. hcpdiff/utils/utils.py +21 -4
  86. hcpdiff/workflow/__init__.py +15 -10
  87. hcpdiff/workflow/daam/__init__.py +1 -0
  88. hcpdiff/workflow/daam/act.py +66 -0
  89. hcpdiff/workflow/daam/hook.py +109 -0
  90. hcpdiff/workflow/diffusion.py +118 -128
  91. hcpdiff/workflow/fast.py +31 -0
  92. hcpdiff/workflow/flow.py +67 -0
  93. hcpdiff/workflow/io.py +36 -130
  94. hcpdiff/workflow/model.py +46 -43
  95. hcpdiff/workflow/text.py +60 -47
  96. hcpdiff/workflow/utils.py +32 -12
  97. hcpdiff/workflow/vae.py +37 -38
  98. hcpdiff-2.2.dist-info/METADATA +299 -0
  99. hcpdiff-2.2.dist-info/RECORD +115 -0
  100. {hcpdiff-0.9.1.dist-info → hcpdiff-2.2.dist-info}/WHEEL +1 -1
  101. hcpdiff-2.2.dist-info/entry_points.txt +5 -0
  102. hcpdiff/ckpt_manager/base.py +0 -16
  103. hcpdiff/ckpt_manager/ckpt_diffusers.py +0 -45
  104. hcpdiff/ckpt_manager/ckpt_pkl.py +0 -138
  105. hcpdiff/ckpt_manager/ckpt_safetensor.py +0 -64
  106. hcpdiff/ckpt_manager/ckpt_webui.py +0 -54
  107. hcpdiff/data/bucket.py +0 -358
  108. hcpdiff/data/caption_loader.py +0 -80
  109. hcpdiff/data/cond_dataset.py +0 -40
  110. hcpdiff/data/crop_info_dataset.py +0 -40
  111. hcpdiff/data/data_processor.py +0 -33
  112. hcpdiff/data/pair_dataset.py +0 -146
  113. hcpdiff/data/sampler.py +0 -54
  114. hcpdiff/data/source/base.py +0 -30
  115. hcpdiff/data/utils.py +0 -80
  116. hcpdiff/deprecated/__init__.py +0 -1
  117. hcpdiff/deprecated/cfg_converter.py +0 -81
  118. hcpdiff/deprecated/lora_convert.py +0 -31
  119. hcpdiff/infer_workflow.py +0 -57
  120. hcpdiff/loggers/__init__.py +0 -13
  121. hcpdiff/loggers/base_logger.py +0 -76
  122. hcpdiff/loggers/cli_logger.py +0 -40
  123. hcpdiff/loggers/preview/__init__.py +0 -1
  124. hcpdiff/loggers/preview/image_previewer.py +0 -149
  125. hcpdiff/loggers/tensorboard_logger.py +0 -30
  126. hcpdiff/loggers/wandb_logger.py +0 -31
  127. hcpdiff/loggers/webui_logger.py +0 -9
  128. hcpdiff/loss/min_snr_loss.py +0 -52
  129. hcpdiff/models/layers.py +0 -81
  130. hcpdiff/models/plugin.py +0 -348
  131. hcpdiff/models/wrapper.py +0 -75
  132. hcpdiff/noise/__init__.py +0 -3
  133. hcpdiff/noise/noise_base.py +0 -16
  134. hcpdiff/noise/pyramid_noise.py +0 -50
  135. hcpdiff/noise/zero_terminal.py +0 -44
  136. hcpdiff/train_ac.py +0 -566
  137. hcpdiff/train_ac_single.py +0 -39
  138. hcpdiff/utils/caption_tools.py +0 -105
  139. hcpdiff/utils/cfg_net_tools.py +0 -321
  140. hcpdiff/utils/cfg_resolvers.py +0 -16
  141. hcpdiff/utils/ema.py +0 -52
  142. hcpdiff/utils/img_size_tool.py +0 -248
  143. hcpdiff/vis/__init__.py +0 -3
  144. hcpdiff/vis/base_interface.py +0 -12
  145. hcpdiff/vis/disk_interface.py +0 -48
  146. hcpdiff/vis/webui_interface.py +0 -17
  147. hcpdiff/viser_fast.py +0 -138
  148. hcpdiff/visualizer.py +0 -265
  149. hcpdiff/visualizer_reloadable.py +0 -237
  150. hcpdiff/workflow/base.py +0 -59
  151. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/anime/text2img_anime.yaml +0 -21
  152. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/anime/text2img_anime_lora.yaml +0 -58
  153. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/change_vae.yaml +0 -6
  154. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/euler_a.yaml +0 -8
  155. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/img2img.yaml +0 -10
  156. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/img2img_controlnet.yaml +0 -19
  157. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/inpaint.yaml +0 -11
  158. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/load_lora.yaml +0 -26
  159. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/load_unet_part.yaml +0 -18
  160. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/offload_2GB.yaml +0 -6
  161. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/save_model.yaml +0 -44
  162. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/text2img.yaml +0 -53
  163. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/text2img_DA++.yaml +0 -34
  164. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/infer/text2img_sdxl.yaml +0 -9
  165. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/plugins/plugin_controlnet.yaml +0 -17
  166. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/te_struct.txt +0 -193
  167. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/dataset/base_dataset.yaml +0 -29
  168. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/dataset/regularization_dataset.yaml +0 -31
  169. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/CustomDiffusion.yaml +0 -74
  170. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/DreamArtist++.yaml +0 -135
  171. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/DreamArtist.yaml +0 -45
  172. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/DreamBooth.yaml +0 -62
  173. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/FT_sdxl.yaml +0 -33
  174. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/Lion_optimizer.yaml +0 -17
  175. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/TextualInversion.yaml +0 -41
  176. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/add_logger_tensorboard_wandb.yaml +0 -15
  177. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/controlnet.yaml +0 -53
  178. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/ema.yaml +0 -10
  179. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/fine-tuning.yaml +0 -53
  180. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/locon.yaml +0 -24
  181. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/lora_anime_character.yaml +0 -77
  182. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/lora_conventional.yaml +0 -56
  183. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/lora_sdxl.yaml +0 -41
  184. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/min_snr.yaml +0 -7
  185. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples/preview_in_training.yaml +0 -6
  186. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples_noob/DreamBooth.yaml +0 -70
  187. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples_noob/TextualInversion.yaml +0 -45
  188. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples_noob/fine-tuning.yaml +0 -45
  189. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/examples_noob/lora.yaml +0 -63
  190. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/train_base.yaml +0 -81
  191. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/train/tuning_base.yaml +0 -42
  192. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/unet_struct.txt +0 -932
  193. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/workflow/highres_fix_latent.yaml +0 -86
  194. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/workflow/highres_fix_pixel.yaml +0 -99
  195. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/workflow/text2img.yaml +0 -59
  196. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/workflow/text2img_lora.yaml +0 -70
  197. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/zero2.json +0 -32
  198. hcpdiff-0.9.1.data/data/hcpdiff/cfgs/zero3.json +0 -39
  199. hcpdiff-0.9.1.data/data/hcpdiff/prompt_tuning_template/caption.txt +0 -1
  200. hcpdiff-0.9.1.data/data/hcpdiff/prompt_tuning_template/name.txt +0 -1
  201. hcpdiff-0.9.1.data/data/hcpdiff/prompt_tuning_template/name_2pt_caption.txt +0 -1
  202. hcpdiff-0.9.1.data/data/hcpdiff/prompt_tuning_template/name_caption.txt +0 -1
  203. hcpdiff-0.9.1.data/data/hcpdiff/prompt_tuning_template/object.txt +0 -27
  204. hcpdiff-0.9.1.data/data/hcpdiff/prompt_tuning_template/object_caption.txt +0 -27
  205. hcpdiff-0.9.1.data/data/hcpdiff/prompt_tuning_template/style.txt +0 -19
  206. hcpdiff-0.9.1.data/data/hcpdiff/prompt_tuning_template/style_caption.txt +0 -19
  207. hcpdiff-0.9.1.dist-info/METADATA +0 -199
  208. hcpdiff-0.9.1.dist-info/RECORD +0 -160
  209. hcpdiff-0.9.1.dist-info/entry_points.txt +0 -2
  210. {hcpdiff-0.9.1.dist-info → hcpdiff-2.2.dist-info/licenses}/LICENSE +0 -0
  211. {hcpdiff-0.9.1.dist-info → hcpdiff-2.2.dist-info}/top_level.txt +0 -0
hcpdiff/ckpt_manager/ckpt_safetensor.py DELETED
@@ -1,64 +0,0 @@
- """
- ckpt_safetensors.py
- ====================
- :Name: save model with safetensors
- :Author: Dong Ziyi
- :Affiliation: HCP Lab, SYSU
- :Created: 8/04/2023
- :Licence: MIT
- """
-
- import os
- import torch
- from safetensors import safe_open
- from safetensors.torch import save_file
-
- from .ckpt_pkl import CkptManagerPKL
-
- class CkptManagerSafe(CkptManagerPKL):
-
-     def _save_ckpt(self, sd_model, name=None, step=None, save_path=None):
-         if save_path is None:
-             save_path = os.path.join(self.save_dir, f"{name}-{step}.safetensors")
-         sd_unfold = self.unfold_dict(sd_model)
-         for k, v in sd_unfold.items():
-             if not v.is_contiguous():
-                 sd_unfold[k] = v.contiguous()
-         save_file(sd_unfold, save_path)
-
-     def load_ckpt(self, ckpt_path, map_location='cpu'):
-         with safe_open(ckpt_path, framework="pt", device=map_location) as f:
-             sd_fold = self.fold_dict(f)
-         return sd_fold
-
-     @staticmethod
-     def unfold_dict(data, split_key=':'):
-         dict_unfold={}
-
-         def unfold(prefix, dict_fold):
-             for k,v in dict_fold.items():
-                 k_new = k if prefix=='' else f'{prefix}{split_key}{k}'
-                 if isinstance(v, dict):
-                     unfold(k_new, v)
-                 elif isinstance(v, list) or isinstance(v, tuple):
-                     unfold(k_new, {i:d for i,d in enumerate(v)})
-                 else:
-                     dict_unfold[k_new]=v
-
-         unfold('', data)
-         return dict_unfold
-
-     @staticmethod
-     def fold_dict(safe_f, split_key=':'):
-         dict_fold = {}
-
-         for k in safe_f.keys():
-             k_list = k.split(split_key)
-             dict_last = dict_fold
-             for item in k_list[:-1]:
-                 if item not in dict_last:
-                     dict_last[item] = {}
-                 dict_last = dict_last[item]
-             dict_last[k_list[-1]]=safe_f.get_tensor(k)
-
-         return dict_fold
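For context, the removed CkptManagerSafe works around safetensors' flat-dict requirement by flattening nested state dicts into colon-joined keys on save and folding them back on load. Below is a minimal, standalone sketch of that flatten/fold round trip using plain dicts instead of a safetensors file handle; it is illustrative only and not part of the hcpdiff API.

# Sketch of the key-flattening scheme used above (plain values stand in for tensors).
def unfold_dict(data, split_key=':'):
    flat = {}
    def unfold(prefix, node):
        for k, v in node.items():
            key = k if prefix == '' else f'{prefix}{split_key}{k}'
            if isinstance(v, dict):
                unfold(key, v)
            elif isinstance(v, (list, tuple)):
                unfold(key, {i: d for i, d in enumerate(v)})  # lists become index-keyed dicts
            else:
                flat[key] = v
    unfold('', data)
    return flat

def fold_dict(flat, split_key=':'):
    nested = {}
    for k, v in flat.items():
        parts = k.split(split_key)
        node = nested
        for p in parts[:-1]:
            node = node.setdefault(p, {})
        node[parts[-1]] = v
    return nested

state = {'unet': {'lora': [{'w': 1}, {'w': 2}]}}
print(unfold_dict(state))               # {'unet:lora:0:w': 1, 'unet:lora:1:w': 2}
print(fold_dict(unfold_dict(state)))    # note: list indices come back as string dict keys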
hcpdiff/ckpt_manager/ckpt_webui.py DELETED
@@ -1,54 +0,0 @@
- from .base import CkptManagerBase
- import os
- from diffusers import StableDiffusionPipeline, UNet2DConditionModel
- from hcpdiff.models.plugin import BasePluginBlock
- from hcpdiff.tools.sd2diffusers import load_sd_ckpt, patch_method
-
- class CkptManagerWebui(CkptManagerBase):
-
-     def set_save_dir(self, save_dir, emb_dir=None):
-         os.makedirs(save_dir, exist_ok=True)
-         self.save_dir = save_dir
-         self.emb_dir = emb_dir
-
-     def save(self, step, unet, TE, lora_unet, lora_TE, all_plugin_unet, all_plugin_TE, embs, pipe: StableDiffusionPipeline, **kwargs):
-         def state_dict_unet(*args, model=unet, **kwargs):
-             plugin_names = {k for k, v in model.named_modules() if isinstance(v, BasePluginBlock)}
-             model_sd = {}
-             for k, v in model.state_dict_().items():
-                 for name in plugin_names:
-                     if k.startswith(name):
-                         break
-                 else:
-                     model_sd[k] = v
-             return model_sd
-         unet.state_dict_ = unet.state_dict
-         unet.state_dict = state_dict_unet
-
-         def state_dict_TE(*args, model=TE, **kwargs):
-             plugin_names = {k for k, v in model.named_modules() if isinstance(v, BasePluginBlock)}
-             model_sd = {}
-             for k, v in model.state_dict_().items():
-                 for name in plugin_names:
-                     if k.startswith(name):
-                         break
-                 else:
-                     model_sd[k] = v
-             return model_sd
-         TE.state_dict_ = TE.state_dict
-         TE.state_dict = state_dict_TE
-
-         pipe.save_pretrained(os.path.join(self.save_dir, f"model-{step}"), **kwargs)
-
-     @classmethod
-     def load(cls, pretrained_model, original_config_file, from_safetensors=False, device='cpu', ema=True, **kwargs) -> StableDiffusionPipeline:
-         patch_method()
-         pipe = load_sd_ckpt(
-             checkpoint_path=pretrained_model,
-             original_config_file=original_config_file,
-             extract_ema=ema,
-             scheduler_type='pndm',
-             from_safetensors=from_safetensors,
-             device=device,
-         )
-         return pipe
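The save() method above relies on temporarily monkey-patching state_dict so that plugin parameters are not written into the serialized pipeline. A minimal sketch of that filtering idea follows, using a stand-in plugin class rather than hcpdiff's BasePluginBlock; it is illustrative only.

import torch.nn as nn

class Plugin(nn.Linear):  # stand-in for BasePluginBlock
    pass

model = nn.Sequential(nn.Linear(4, 4), Plugin(4, 4))
plugin_names = {k for k, v in model.named_modules() if isinstance(v, Plugin)}

model.state_dict_ = model.state_dict  # keep a handle on the original method
def state_dict_filtered(*args, **kwargs):
    # drop every key that lives under a plugin submodule
    return {k: v for k, v in model.state_dict_().items()
            if not any(k.startswith(name) for name in plugin_names)}
model.state_dict = state_dict_filtered  # a later save_pretrained-style call now skips plugin weights

print(sorted(model.state_dict().keys()))  # only the non-plugin ('0.*') entries remain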
hcpdiff/data/bucket.py DELETED
@@ -1,358 +0,0 @@
- """
- bucket.py
- ====================
- :Name: aspect ratio bucket with k-means
- :Author: Dong Ziyi
- :Affiliation: HCP Lab, SYSU
- :Created: 10/03/2023
- :Licence: Apache-2.0
- """
-
- import math
- import os.path
- import pickle
- from typing import List, Tuple, Union, Any
-
- import cv2
- import numpy as np
- from hcpdiff.utils.img_size_tool import types_support, get_image_size
- from hcpdiff.utils.utils import get_file_ext
- from .source import DataSource
- from loguru import logger
- from sklearn.cluster import KMeans
- from tqdm import tqdm
- from concurrent.futures import ThreadPoolExecutor
-
- from .utils import resize_crop_fix, pad_crop_fix
-
- class BaseBucket:
-     def __getitem__(self, idx):
-         '''
-         :return: (file name of image), (target image size)
-         '''
-         raise NotImplementedError()
-
-     def __len__(self):
-         raise NotImplementedError()
-
-     def build(self, bs: int, img_root_list: List[str]):
-         raise NotImplementedError()
-
-     def rest(self, epoch):
-         pass
-
-     def crop_resize(self, image, size, mask_interp=cv2.INTER_CUBIC) -> Tuple[Any, Tuple]:
-         return image, (*size, 0, 0, *size)
-
- class FixedBucket(BaseBucket):
-     def __init__(self, target_size: Union[Tuple[int, int], int] = 512, **kwargs):
-         self.target_size = (target_size, target_size) if isinstance(target_size, int) else target_size
-
-     def build(self, bs: int, file_names: List[Tuple[str, DataSource]]):
-         self.file_names = file_names
-
-     def crop_resize(self, image, size, mask_interp=cv2.INTER_CUBIC):
-         return resize_crop_fix(image, size, mask_interp=mask_interp)
-
-     def __getitem__(self, idx) -> Tuple[Tuple[str, DataSource], Tuple[int, int]]:
-         return self.file_names[idx], self.target_size
-
-     def __len__(self):
-         return len(self.file_names)
-
- class RatioBucket(BaseBucket):
-     def __init__(self, target_area: int = 640*640, step_size: int = 8, num_bucket: int = 10, pre_build_bucket: str = None):
-         self.target_area = target_area
-         self.step_size = step_size
-         self.num_bucket = num_bucket
-         self.pre_build_bucket = pre_build_bucket
-
-     def load_bucket(self, path):
-         with open(path, 'rb') as f:
-             data = pickle.load(f)
-         self.buckets = data['buckets']
-         self.size_buckets = data['size_buckets']
-         self.idx_bucket_map = data['idx_bucket_map']
-         self.data_len = data['data_len']
-
-     def save_bucket(self, path):
-         with open(path, 'wb') as f:
-             pickle.dump({
-                 'buckets':self.buckets,
-                 'size_buckets':self.size_buckets,
-                 'idx_bucket_map':self.idx_bucket_map,
-                 'data_len':self.data_len,
-             }, f)
-
-     def build_buckets_from_ratios(self):
-         logger.info('build buckets from ratios')
-         size_low = int(math.sqrt(self.target_area/self.ratio_max))
-         size_high = int(self.ratio_max*size_low)
-
-         # SD needs side lengths that are multiples of 8
-         size_low = (size_low//self.step_size)*self.step_size
-         size_high = (size_high//self.step_size)*self.step_size
-
-         data = []
-         for w in range(size_low, size_high+1, self.step_size):
-             for h in range(size_low, size_high+1, self.step_size):
-                 data.append([w*h, np.log2(w/h), w, h])  # take the log of the ratio: closer to human perception, and swapped w/h distribute symmetrically
-         data = np.array(data)
-
-         error_area = np.abs(data[:, 0]-self.target_area)
-         data_use = data[np.argsort(error_area)[:self.num_bucket*3], :]  # keep the num_bucket*3 sizes closest to the target area
-
-         # cluster to pick the specified number of buckets
-         kmeans = KMeans(n_clusters=self.num_bucket, random_state=3407).fit(data_use[:, 1].reshape(-1, 1))
-         labels = kmeans.labels_
-         self.buckets = []  # [bucket_id:[file_idx,...]]
-         ratios_log = []
-         self.size_buckets = []
-         for i in range(self.num_bucket):
-             map_idx = np.where(labels == i)[0]
-             m_idx = map_idx[np.argmin(np.abs(data_use[labels == i, 1]-np.median(data_use[labels == i, 1])))]
-             # self.buckets[wh_hash(*data_use[m_idx, 2:])]=[]
-             self.buckets.append([])
-             ratios_log.append(data_use[m_idx, 1])
-             self.size_buckets.append(data_use[m_idx, 2:].astype(int))
-         ratios_log = np.array(ratios_log)
-         self.size_buckets = np.array(self.size_buckets)
-
-         # fill buckets with images w,h
-         self.idx_bucket_map = np.empty(len(self.file_names), dtype=int)
-         for i, (file, source) in enumerate(self.file_names):
-             w, h = get_image_size(file)
-             bucket_id = np.abs(ratios_log-np.log2(w/h)).argmin()
-             self.buckets[bucket_id].append(i)
-             self.idx_bucket_map[i] = bucket_id
-         logger.info('buckets info: '+', '.join(f'size:{self.size_buckets[i]}, num:{len(b)}' for i, b in enumerate(self.buckets)))
-
-     def build_buckets_from_images(self):
-         logger.info('build buckets from images')
-
-         def get_ratio(data):
-             file, source = data
-             w, h = get_image_size(file)
-             ratio = np.log2(w/h)
-             return ratio
-
-         ratio_list = []
-         with ThreadPoolExecutor() as executor:
-             for ratio in tqdm(executor.map(get_ratio, self.file_names), desc='get image info', total=len(self.file_names)):
-                 ratio_list.append(ratio)
-         ratio_list = np.array(ratio_list)
-
-         # cluster to pick the specified number of buckets
-         kmeans = KMeans(n_clusters=self.num_bucket, random_state=3407, verbose=True, tol=1e-3).fit(ratio_list.reshape(-1, 1))
-         labels = kmeans.labels_
-         ratios = 2**kmeans.cluster_centers_.reshape(-1)
-
-         h_all = np.sqrt(self.target_area/ratios)
-         w_all = h_all*ratios
-
-         # SD needs side lengths that are multiples of 8
-         h_all = (np.round(h_all/self.step_size)*self.step_size).astype(int)
-         w_all = (np.round(w_all/self.step_size)*self.step_size).astype(int)
-         self.size_buckets = list(zip(w_all, h_all))
-         self.size_buckets = np.array(self.size_buckets)
-
-         self.buckets = []  # [bucket_id:[file_idx,...]]
-         self.idx_bucket_map = np.empty(len(self.file_names), dtype=int)
-         for bidx in range(self.num_bucket):
-             bnow = labels == bidx
-             self.buckets.append(np.where(bnow)[0].tolist())
-             self.idx_bucket_map[bnow] = bidx
-         logger.info('buckets info: '+', '.join(f'size:{self.size_buckets[i]}, num:{len(b)}' for i, b in enumerate(self.buckets)))
-
-     def build(self, bs: int, file_names: List[Tuple[str, DataSource]]):
-         '''
-         :param bs: batch_size * n_gpus * accumulation_step
-         :param img_root_list:
-         '''
-         self.file_names = file_names
-         self.bs = bs
-         if self.pre_build_bucket and os.path.exists(self.pre_build_bucket):
-             self.load_bucket(self.pre_build_bucket)
-             return
-
-         self._build()
-
-         rs = np.random.RandomState(42)
-         # make len(bucket)%bs==0
-         self.data_len = 0
-         for bidx, bucket in enumerate(self.buckets):
-             rest = len(bucket)%bs
-             if rest>0:
-                 bucket.extend(rs.choice(bucket, bs-rest))
-             self.data_len += len(bucket)
-             self.buckets[bidx] = np.array(bucket)
-
-         if self.pre_build_bucket:
-             self.save_bucket(self.pre_build_bucket)
-
-     def rest(self, epoch):
-         rs = np.random.RandomState(42+epoch)
-         bucket_list = [x.copy() for x in self.buckets]
-         # shuffle inter bucket
-         for x in bucket_list:
-             rs.shuffle(x)
-
-         # shuffle of batches
-         bucket_list = np.hstack(bucket_list).reshape(-1, self.bs).astype(int)
-         rs.shuffle(bucket_list)
-
-         self.idx_bucket = bucket_list.reshape(-1)
-
-     def crop_resize(self, image, size, mask_interp=cv2.INTER_CUBIC):
-         return resize_crop_fix(image, size, mask_interp=mask_interp)
-
-     def __getitem__(self, idx):
-         file_idx = self.idx_bucket[idx]
-         bucket_idx = self.idx_bucket_map[file_idx]
-         return self.file_names[file_idx], self.size_buckets[bucket_idx]
-
-     def __len__(self):
-         return self.data_len
-
-     @classmethod
-     def from_ratios(cls, target_area: int = 640*640, step_size: int = 8, num_bucket: int = 10, ratio_max: float = 4,
-                     pre_build_bucket: str = None, **kwargs):
-         arb = cls(target_area, step_size, num_bucket, pre_build_bucket=pre_build_bucket)
-         arb.ratio_max = ratio_max
-         arb._build = arb.build_buckets_from_ratios
-         return arb
-
-     @classmethod
-     def from_files(cls, target_area: int = 640*640, step_size: int = 8, num_bucket: int = 10, pre_build_bucket: str = None, **kwargs):
-         arb = cls(target_area, step_size, num_bucket, pre_build_bucket=pre_build_bucket)
-         arb._build = arb.build_buckets_from_images
-         return arb
-
- class SizeBucket(RatioBucket):
-     def __init__(self, step_size: int = 8, num_bucket: int = 10, pre_build_bucket: str = None):
-         super().__init__(step_size=step_size, num_bucket=num_bucket, pre_build_bucket=pre_build_bucket)
-
-     def build_buckets_from_images(self):
-         '''
-         Cluster by image size; images are not resized, only cropped or padded.
-         '''
-         logger.info('build buckets from images size')
-         size_list = []
-         for i, (file, source) in enumerate(self.file_names):
-             w, h = get_image_size(file)
-             size_list.append([w, h])
-         size_list = np.array(size_list)
-
-         # cluster to pick the specified number of buckets
-         kmeans = KMeans(n_clusters=self.num_bucket, random_state=3407).fit(size_list)
-         labels = kmeans.labels_
-         size_buckets = kmeans.cluster_centers_
-
-         # SD needs side lengths that are multiples of 8
-         self.size_buckets = (np.round(size_buckets/self.step_size)*self.step_size).astype(int)
-
-         self.buckets = []  # [bucket_id:[file_idx,...]]
-         self.idx_bucket_map = np.empty(len(self.file_names), dtype=int)
-         for bidx in range(self.num_bucket):
-             bnow = labels == bidx
-             self.buckets.append(np.where(bnow)[0].tolist())
-             self.idx_bucket_map[bnow] = bidx
-         logger.info('buckets info: '+', '.join(f'size:{self.size_buckets[i]}, num:{len(b)}' for i, b in enumerate(self.buckets)))
-
-     def crop_resize(self, image, size):
-         return pad_crop_fix(image, size)
-
-     @classmethod
-     def from_files(cls, step_size: int = 8, num_bucket: int = 10, pre_build_bucket: str = None, **kwargs):
-         arb = cls(step_size, num_bucket, pre_build_bucket=pre_build_bucket)
-         arb._build = arb.build_buckets_from_images
-         return arb
-
- class RatioSizeBucket(RatioBucket):
-     def __init__(self, step_size: int = 8, num_bucket: int = 10, max_area:int=640*640, pre_build_bucket: str = None):
-         super().__init__(step_size=step_size, num_bucket=num_bucket, pre_build_bucket=pre_build_bucket)
-         self.max_area = max_area
-
-     def build_buckets_from_images(self):
-         '''
-         Cluster by image size; images are not resized, only cropped or padded.
-         '''
-         logger.info('build buckets from images')
-         ratio_list = []
-         for i, (file, source) in enumerate(self.file_names):
-             w, h = get_image_size(file)
-             ratio = np.log2(w/h)
-             log_area = np.log2(min(w*h, self.max_area))
-             ratio_list.append([ratio, log_area])
-         ratio_list = np.array(ratio_list)
-
-         # cluster to pick the specified number of buckets
-         kmeans = KMeans(n_clusters=self.num_bucket, random_state=3407).fit(ratio_list)
-         labels = kmeans.labels_
-         ratios = 2**kmeans.cluster_centers_[:, 0]
-         sizes = 2**kmeans.cluster_centers_[:, 1]
-
-         h_all = np.sqrt(sizes/ratios)
-         w_all = h_all*ratios
-
-         # SD needs side lengths that are multiples of 8
-         h_all = (np.round(h_all/self.step_size)*self.step_size).astype(int)
-         w_all = (np.round(w_all/self.step_size)*self.step_size).astype(int)
-         self.size_buckets = list(zip(w_all, h_all))
-         self.size_buckets = np.array(self.size_buckets)
-
-         self.buckets = []  # [bucket_id:[file_idx,...]]
-         self.idx_bucket_map = np.empty(len(self.file_names), dtype=int)
-         for bidx in range(self.num_bucket):
-             bnow = labels == bidx
-             self.buckets.append(np.where(bnow)[0].tolist())
-             self.idx_bucket_map[bnow] = bidx
-         logger.info('buckets info: '+', '.join(f'size:{self.size_buckets[i]}, num:{len(b)}' for i, b in enumerate(self.buckets)))
-
-     @classmethod
-     def from_files(cls, step_size: int = 8, num_bucket: int = 10, max_area:int=640*640, pre_build_bucket: str = None, **kwargs):
-         arb = cls(step_size, num_bucket, max_area=max_area, pre_build_bucket=pre_build_bucket)
-         arb._build = arb.build_buckets_from_images
-         return arb
-
- class LongEdgeBucket(RatioBucket):
-     def __init__(self, target_edge=640, step_size: int = 8, num_bucket: int = 10, pre_build_bucket: str = None):
-         super().__init__(step_size=step_size, num_bucket=num_bucket, pre_build_bucket=pre_build_bucket)
-         self.target_edge = target_edge
-
-     def build_buckets_from_images(self):
-         '''
-         Cluster by image size; images are not resized, only cropped or padded.
-         '''
-         logger.info('build buckets from images size')
-         size_list = []
-         for i, (file, source) in enumerate(self.file_names):
-             w, h = get_image_size(file)
-             scale = self.target_edge/max(w, h)
-             size_list.append([round(w*scale), round(h*scale)])
-         size_list = np.array(size_list)
-
-         # cluster to pick the specified number of buckets
-         kmeans = KMeans(n_clusters=self.num_bucket, random_state=3407, verbose=True).fit(size_list)
-         labels = kmeans.labels_
-         size_buckets = kmeans.cluster_centers_
-
-         # SD needs side lengths that are multiples of 8
-         self.size_buckets = (np.round(size_buckets/self.step_size)*self.step_size).astype(int)
-
-         self.buckets = []  # [bucket_id:[file_idx,...]]
-         self.idx_bucket_map = np.empty(len(self.file_names), dtype=int)
-         for bidx in range(self.num_bucket):
-             bnow = labels == bidx
-             self.buckets.append(np.where(bnow)[0].tolist())
-             self.idx_bucket_map[bnow] = bidx
-         logger.info('buckets info: '+', '.join(f'size:{self.size_buckets[i]}, num:{len(b)}' for i, b in enumerate(self.buckets)))
-
-     def crop_resize(self, image, size):
-         return resize_crop_fix(image, size)
-
-     @classmethod
-     def from_files(cls, target_edge, step_size: int = 8, num_bucket: int = 10, pre_build_bucket: str = None, **kwargs):
-         arb = cls(target_edge, step_size, num_bucket, pre_build_bucket=pre_build_bucket)
-         arb._build = arb.build_buckets_from_images
-         return arb
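The core idea of the removed RatioBucket is to k-means-cluster images by log2 aspect ratio and give each cluster a resolution of roughly constant area whose sides are multiples of step_size. A minimal sketch of that bucketing step follows; the function name and sample values are made up for illustration and are not hcpdiff API.

import numpy as np
from sklearn.cluster import KMeans

def bucket_sizes(wh_list, target_area=640*640, step=8, num_buckets=4):
    ratios = np.log2([w/h for w, h in wh_list]).reshape(-1, 1)  # log ratio: symmetric for w/h swaps
    km = KMeans(n_clusters=num_buckets, random_state=3407).fit(ratios)
    centers = 2**km.cluster_centers_.reshape(-1)                # back from log space
    h = np.sqrt(target_area/centers)
    w = h*centers
    w = (np.round(w/step)*step).astype(int)                     # snap sides to multiples of `step`
    h = (np.round(h/step)*step).astype(int)
    return list(zip(w, h)), km.labels_                          # per-cluster sizes + image-to-bucket map

sizes, labels = bucket_sizes([(512, 768), (768, 512), (640, 640), (1024, 576), (576, 1024)])
print(sizes, labels)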
hcpdiff/data/caption_loader.py DELETED
@@ -1,80 +0,0 @@
- import json
- import os
- import glob
- import yaml
- from typing import Dict
-
- from loguru import logger
- from hcpdiff.utils.img_size_tool import types_support
- import os
-
- class BaseCaptionLoader:
-     def __init__(self, path):
-         self.path = path
-
-     def _load(self):
-         raise NotImplementedError
-
-     def load(self):
-         retval = self._load()
-         logger.info(f'{len(retval)} record(s) loaded with {self.__class__.__name__}, from path {self.path!r}')
-         return retval
-
-     @staticmethod
-     def clean_ext(captions:Dict[str, str]):
-         def rm_ext(path):
-             name, ext = os.path.splitext(path)
-             if len(ext)>0 and ext[1:] in types_support:
-                 return name
-             return path
-         return {rm_ext(k):v for k,v in captions.items()}
-
- class JsonCaptionLoader(BaseCaptionLoader):
-     def _load(self):
-         with open(self.path, 'r', encoding='utf-8') as f:
-             return self.clean_ext(json.loads(f.read()))
-
- class YamlCaptionLoader(BaseCaptionLoader):
-     def _load(self):
-         with open(self.path, 'r', encoding='utf-8') as f:
-             return self.clean_ext(yaml.load(f.read(), Loader=yaml.FullLoader))
-
- class TXTCaptionLoader(BaseCaptionLoader):
-     def _load(self):
-         txt_files = glob.glob(os.path.join(self.path, '*.txt'))
-         captions = {}
-         for file in txt_files:
-             with open(file, 'r', encoding='utf-8') as f:
-                 captions[os.path.basename(file).split('.')[0]] = f.read().strip()
-         return captions
-
- def auto_caption_loader(path):
-     if os.path.isdir(path):
-         json_files = glob.glob(os.path.join(path, '*.json'))
-         if json_files:
-             return JsonCaptionLoader(json_files[0])
-
-         yaml_files = [
-             *glob.glob(os.path.join(path, '*.yaml')),
-             *glob.glob(os.path.join(path, '*.yml')),
-         ]
-         if yaml_files:
-             return YamlCaptionLoader(yaml_files[0])
-
-         txt_files = glob.glob(os.path.join(path, '*.txt'))
-         if txt_files:
-             return TXTCaptionLoader(path)
-
-         raise FileNotFoundError(f'Caption file not found in directory {path!r}.')
-
-     elif os.path.isfile(path):
-         _, ext = os.path.splitext(path)
-         if ext == '.json':
-             return JsonCaptionLoader(path)
-         elif ext in {'.yaml', '.yml'}:
-             return YamlCaptionLoader(path)
-         else:
-             raise FileNotFoundError(f'Unknown caption file {path!r}.')
-
-     else:
-         raise FileNotFoundError(f'Unknown caption file type {path!r}.')
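For reference, these removed loaders were typically driven through auto_caption_loader, which prefers a JSON file, then YAML, then per-image TXT files inside a dataset directory. A hypothetical 0.9.x-era usage follows; the directory path is made up for the example.

from hcpdiff.data.caption_loader import auto_caption_loader  # 0.9.x import path, removed in 2.x

captions = auto_caption_loader('data/train_images').load()   # hypothetical dataset directory
print(list(captions.items())[:3])                            # e.g. [('img_0001', 'a photo of ...'), ...]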
hcpdiff/data/cond_dataset.py DELETED
@@ -1,40 +0,0 @@
- """
- pair_dataset.py
- ====================
- :Name: text-image pair dataset
- :Author: Dong Ziyi
- :Affiliation: HCP Lab, SYSU
- :Created: 10/03/2023
- :Licence: Apache-2.0
- """
-
- import cv2
- import torch
-
- from .pair_dataset import TextImagePairDataset
-
- class TextImageCondPairDataset(TextImagePairDataset):
-     """
-     A dataset to prepare the instance and class images with the prompts for fine-tuning the model.
-     It pre-processes the images and tokenizes the prompts.
-     """
-
-     def load_data(self, path, data_source, size):
-         image_dict = data_source.load_image(path)
-         image = image_dict['image']
-         att_mask = image_dict.get('att_mask', None)
-         img_cond = image_dict.get('cond', None)
-         if img_cond is None:
-             raise FileNotFoundError(f'{self.__class__} need the condition images!')
-
-         if att_mask is None:
-             data, crop_coord = self.bucket.crop_resize({"img":image, "cond":img_cond}, size)
-             image = data_source.procees_image(data['img'])  # resize to bucket size
-             img_cond = data_source.cond_transform(data['cond'])
-             att_mask = torch.ones((size[1]//8, size[0]//8))
-         else:
-             data, crop_coord = self.bucket.crop_resize({"img":image, "mask":att_mask, "cond":img_cond}, size)
-             image = data_source.procees_image(data['img'])
-             img_cond = data_source.cond_transform(data['cond'])
-             att_mask = torch.tensor(cv2.resize(data['mask'], (size[0]//8, size[1]//8), interpolation=cv2.INTER_LINEAR))
-         return {'img':image, 'mask':att_mask, 'plugin_input':{"cond":img_cond}}
hcpdiff/data/crop_info_dataset.py DELETED
@@ -1,40 +0,0 @@
- """
- pair_dataset.py
- ====================
- :Name: text-image pair dataset
- :Author: Dong Ziyi
- :Affiliation: HCP Lab, SYSU
- :Created: 10/03/2023
- :Licence: Apache-2.0
- """
-
- from typing import Callable, Iterable, Dict
- from .bucket import BaseBucket
- import os.path
-
- import torch
- import cv2
- from .pair_dataset import TextImagePairDataset
- from hcpdiff.utils.utils import get_file_name
- from torchvision import transforms
-
- class CropInfoPairDataset(TextImagePairDataset):
-     """
-     A dataset to prepare the instance and class images with the prompts for fine-tuning the model.
-     It pre-processes the images and tokenizes the prompts.
-     """
-
-     def load_data(self, path, data_source, size):
-         image_dict = data_source.load_image(path)
-         image = image_dict['image']
-         att_mask = image_dict.get('att_mask', None)
-         if att_mask is None:
-             data, crop_coord = self.bucket.crop_resize({"img":image}, size)
-             image = data_source.procees_image(data['img'])  # resize to bucket size
-             att_mask = torch.ones((size[1]//8, size[0]//8))
-         else:
-             data, crop_coord = self.bucket.crop_resize({"img":image, "mask":att_mask}, size)
-             image = data_source.procees_image(data['img'])
-             att_mask = torch.tensor(cv2.resize(data['mask'], (size[0]//8, size[1]//8), interpolation=cv2.INTER_LINEAR))
-         crop_info = torch.tensor(crop_coord, dtype=torch.float)  # for sdxl
-         return {'img':image, 'mask':att_mask, 'crop_info':crop_info}
hcpdiff/data/data_processor.py DELETED
@@ -1,33 +0,0 @@
- import numpy as np
- import torch
- from PIL import Image
- from diffusers.utils import PIL_INTERPOLATION
-
- class ControlNetProcessor:
-     def __init__(self, image):
-         self.image_path = image
-
-     def prepare_cond_image(self, image, width, height, batch_size, device):
-         if not isinstance(image, torch.Tensor):
-             if isinstance(image, Image.Image):
-                 image = [image]
-
-             if isinstance(image[0], Image.Image):
-                 image = [
-                     np.array(i.resize((width, height), resample=PIL_INTERPOLATION["lanczos"]))[None, :] for i in image
-                 ]
-                 image = np.concatenate(image, axis=0)
-                 image = np.array(image).astype(np.float32)/255.0
-                 image = image.transpose(0, 3, 1, 2)
-                 image = torch.from_numpy(image)
-             elif isinstance(image[0], torch.Tensor):
-                 image = torch.cat(image, dim=0)
-
-         image = image.repeat_interleave(batch_size, dim=0)
-         image = image.to(device=device)
-
-         return image
-
-     def __call__(self, width, height, batch_size, device, dtype):
-         img = Image.open(self.image_path).convert('RGB')
-         return self.prepare_cond_image(img, width, height, batch_size, 'cuda').to(dtype=dtype)
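For reference, the removed ControlNetProcessor turned an image path into a (batch, 3, H, W) float tensor in [0, 1] for the ControlNet condition input; note that its __call__ passes 'cuda' internally regardless of the device argument. A hypothetical 0.9.x-era usage follows (the file path is made up, and a CUDA device is assumed).

import torch
from hcpdiff.data.data_processor import ControlNetProcessor  # 0.9.x import path, removed in 2.x

proc = ControlNetProcessor('cond/pose.png')                  # hypothetical condition image
cond = proc(width=512, height=512, batch_size=2, device='cuda', dtype=torch.float16)
print(cond.shape)                                            # torch.Size([2, 3, 512, 512])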