PyPI - optimum-rbln - Versions diffs - 0.1.0__py3-none-any.whl → 0.1.1__py3-none-any.whl - Mend

optimum-rbln 0.1.0__py3-none-any.whl → 0.1.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (29) hide show

optimum/rbln/diffusers/pipelines/{stable_diffusion → controlnet}/pipeline_controlnet_img2img.py RENAMED Viewed

@@ -46,28 +46,43 @@ logger = logging.get_logger(__name__)
 class RBLNStableDiffusionControlNetImg2ImgPipeline(StableDiffusionControlNetImg2ImgPipeline):
     @classmethod
     def from_pretrained(cls, model_id, **kwargs):
+        """
+        Pipeline for image-to-image generation using Stable Diffusion with ControlNet.
+        This model inherits from [`StableDiffusionControlNetImg2ImgPipeline`]. Check the superclass documentation for the generic methods
+        implemented for all pipelines (downloading, saving, running on a particular device, etc.).
+        It implements the methods to convert a pre-trained Stable Diffusion Controlnet pipeline into a RBLNStableDiffusionControlNetImg2Img pipeline by:
+        - transferring the checkpoint weights of the original into an optimized RBLN graph,
+        - compiling the resulting graph using the RBLN compiler.
+        Args:
+            model_id (`Union[str, Path]`):
+                Can be either:
+                - A string, the *model id* of a pretrained model hosted inside a model repo on huggingface.co.
+                - A path to a *directory* containing a model saved using [`~OptimizedModel.save_pretrained`],
+        """
         export = kwargs.pop("export", None)
         text_encoder = kwargs.pop("text_encoder", None)
         controlnets = kwargs.pop("controlnet", None)
+        rbln_config_kwargs, rbln_constructor_kwargs = RBLNBaseModel.pop_rbln_kwargs_from_kwargs(kwargs)
         kwargs_dict = {
             "pretrained_model_name_or_path": model_id,
             "text_encoder": text_encoder,
             "controlnet": controlnets,
             **kwargs,
         }
         model = super().from_pretrained(**{k: v for k, v in kwargs_dict.items() if v is not None})
         if export is None or export is False:
             return model
-        rbln_config_kwargs, rbln_constructor_kwargs = RBLNBaseModel.pop_rbln_kwargs_from_kwargs(kwargs)
-        rbln_callback = rbln_config_kwargs.pop("rbln_callback", None)
-        img_width = kwargs.pop("img_width", None)
-        img_height = kwargs.pop("img_height", None)
-        model = rbln_callback(model)
+        do_classifier_free_guidance = (
+            rbln_config_kwargs.pop("rbln_guidance_scale", 5.0) > 1.0 and model.unet.config.time_cond_proj_dim is None
+        )
         save_dir = TemporaryDirectory()
         save_dir_path = Path(save_dir.name)
@@ -80,8 +95,6 @@ class RBLNStableDiffusionControlNetImg2ImgPipeline(StableDiffusionControlNetImg2
             export=True,
             rbln_unet_sample_size=model.unet.config.sample_size,
             rbln_use_encode=True,
-            rbln_img_width=img_width,
-            rbln_img_height=img_height,
             rbln_vae_scale_factor=model.vae_scale_factor,
             **rbln_config_kwargs,
             **rbln_constructor_kwargs,
@@ -95,7 +108,7 @@ class RBLNStableDiffusionControlNetImg2ImgPipeline(StableDiffusionControlNetImg2
         )
         batch_size = rbln_config_kwargs.pop("rbln_batch_size", 1)
-        unet_batch_size = batch_size * 2
+        unet_batch_size = batch_size * 2 if do_classifier_free_guidance else batch_size
         unet = RBLNUNet2DConditionModel.from_pretrained(
             model_id=save_dir_path / "unet",
@@ -103,8 +116,6 @@ class RBLNStableDiffusionControlNetImg2ImgPipeline(StableDiffusionControlNetImg2
             rbln_max_seq_len=text_encoder.config.max_position_embeddings,
             rbln_batch_size=unet_batch_size,
             rbln_use_encode=True,
-            rbln_img_width=img_width,
-            rbln_img_height=img_height,
             rbln_vae_scale_factor=model.vae_scale_factor,
             rbln_is_controlnet=True if "controlnet" in model.config.keys() else False,
             **rbln_config_kwargs,
@@ -116,8 +127,6 @@ class RBLNStableDiffusionControlNetImg2ImgPipeline(StableDiffusionControlNetImg2
                 model_id=str(save_dir_path / "controlnet"),
                 export=True,
                 rbln_batch_size=unet_batch_size,
-                rbln_img_width=img_width,
-                rbln_img_height=img_height,
                 rbln_vae_scale_factor=model.vae_scale_factor,
                 **rbln_config_kwargs,
                 **rbln_constructor_kwargs,
@@ -128,8 +137,6 @@ class RBLNStableDiffusionControlNetImg2ImgPipeline(StableDiffusionControlNetImg2
                 model_id=save_dir_path / "controlnet",
                 export=True,
                 rbln_batch_size=unet_batch_size,
-                rbln_img_width=img_width,
-                rbln_img_height=img_height,
                 rbln_vae_scale_factor=model.vae_scale_factor,
                 **rbln_config_kwargs,
                 **rbln_constructor_kwargs,
@@ -151,6 +158,8 @@ class RBLNStableDiffusionControlNetImg2ImgPipeline(StableDiffusionControlNetImg2
         }
         model.register_to_config(**update_dict)
+        model.models = [vae.model[0], vae.model[1], text_encoder.model[0], unet.model[0], controlnet.model[0]]
         return model
     def check_inputs(

optimum-rbln 0.1.0__py3-none-any.whl → 0.1.1__py3-none-any.whl

optimum-rbln 0.1.0__py3-none-any.whl → 0.1.1__py3-none-any.whl