PyPI - vibe-aigc - Versions diffs - 0.6.1__py3-none-any.whl → 0.6.2__py3-none-any.whl - Mend

vibe-aigc 0.6.1__py3-none-any.whl → 0.6.2__py3-none-any.whl

This diff shows the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (7) hide show

vibe_aigc/vibe_backend.py CHANGED Viewed

@@ -150,6 +150,10 @@ class VibeBackend:
             import random
             request.seed = random.randint(0, 2**32 - 1)
+        # Special handling for TEXT_TO_VIDEO: use I2V pipeline
+        if request.capability == Capability.TEXT_TO_VIDEO:
+            return await self._generate_video_via_i2v(request)
         # Try to get workflow
         workflow = await self._get_workflow(request)
         if not workflow:
@@ -388,6 +392,199 @@ class VibeBackend:
         except Exception as e:
             return GenerationResult(success=False, error=str(e))
+    async def _generate_video_via_i2v(self, request: GenerationRequest) -> GenerationResult:
+        """Generate video via Image-to-Video pipeline.
+        Two-step process:
+        1. Generate base image with TEXT_TO_IMAGE
+        2. Animate with IMAGE_TO_VIDEO
+        """
+        print("\n[1/2] Generating base image...")
+        # Step 1: Generate image
+        image_workflow = self._create_flux_image_workflow(
+            prompt=request.prompt,
+            negative=request.negative_prompt,
+            width=request.width,
+            height=request.height,
+            seed=request.seed
+        )
+        image_result = await self._execute_workflow(image_workflow)
+        if not image_result.success:
+            return GenerationResult(
+                success=False,
+                error=f"Image generation failed: {image_result.error}"
+            )
+        print(f"    Base image: {image_result.output_path}")
+        # Step 2: Upload image and animate
+        print("\n[2/2] Animating with I2V...")
+        # Download image
+        async with aiohttp.ClientSession() as session:
+            async with session.get(image_result.output_url) as resp:
+                image_data = await resp.read()
+            # Upload to ComfyUI
+            form = aiohttp.FormData()
+            form.add_field('image', image_data, filename='input.png', content_type='image/png')
+            async with session.post(f"{self.url}/upload/image", data=form) as resp:
+                upload_result = await resp.json()
+                uploaded_name = upload_result.get("name", "input.png")
+                print(f"    Uploaded: {uploaded_name}")
+        # Create I2V workflow
+        i2v_workflow = self._create_wan_i2v_workflow(
+            uploaded_image=uploaded_name,
+            prompt=request.prompt,
+            negative=request.negative_prompt,
+            width=request.width,
+            height=request.height,
+            frames=request.frames,
+            seed=request.seed
+        )
+        video_result = await self._execute_workflow(i2v_workflow)
+        if not video_result.success:
+            return GenerationResult(
+                success=False,
+                error=f"Animation failed: {video_result.error}"
+            )
+        print(f"    Video: {video_result.output_path}")
+        return video_result
+    def _create_flux_image_workflow(
+        self, prompt: str, negative: str, width: int, height: int, seed: int
+    ) -> Dict[str, Any]:
+        """Create FLUX image generation workflow."""
+        return {
+            "1": {
+                "class_type": "CheckpointLoaderSimple",
+                "inputs": {"ckpt_name": "flux1-dev-fp8.safetensors"}
+            },
+            "2": {
+                "class_type": "CLIPTextEncode",
+                "inputs": {"text": prompt, "clip": ["1", 1]}
+            },
+            "3": {
+                "class_type": "CLIPTextEncode",
+                "inputs": {"text": negative or "blurry, distorted, ugly", "clip": ["1", 1]}
+            },
+            "4": {
+                "class_type": "EmptyLatentImage",
+                "inputs": {"width": width, "height": height, "batch_size": 1}
+            },
+            "5": {
+                "class_type": "KSampler",
+                "inputs": {
+                    "seed": seed,
+                    "steps": 20,
+                    "cfg": 3.5,
+                    "sampler_name": "euler",
+                    "scheduler": "simple",
+                    "denoise": 1.0,
+                    "model": ["1", 0],
+                    "positive": ["2", 0],
+                    "negative": ["3", 0],
+                    "latent_image": ["4", 0]
+                }
+            },
+            "6": {
+                "class_type": "VAEDecode",
+                "inputs": {"samples": ["5", 0], "vae": ["1", 2]}
+            },
+            "7": {
+                "class_type": "SaveImage",
+                "inputs": {"images": ["6", 0], "filename_prefix": "vibe_base"}
+            }
+        }
+    def _create_wan_i2v_workflow(
+        self, uploaded_image: str, prompt: str, negative: str,
+        width: int, height: int, frames: int, seed: int
+    ) -> Dict[str, Any]:
+        """Create Wan 2.1 I2V workflow."""
+        return {
+            "1": {
+                "class_type": "UNETLoader",
+                "inputs": {
+                    "unet_name": "I2V/Wan2_1-I2V-14B-480p_fp8_e4m3fn_scaled_KJ.safetensors",
+                    "weight_dtype": "fp8_e4m3fn"
+                }
+            },
+            "2": {
+                "class_type": "CLIPLoader",
+                "inputs": {
+                    "clip_name": "umt5_xxl_fp8_e4m3fn_scaled.safetensors",
+                    "type": "wan"
+                }
+            },
+            "3": {
+                "class_type": "VAELoader",
+                "inputs": {"vae_name": "wan_2.1_vae.safetensors"}
+            },
+            "4": {
+                "class_type": "LoadImage",
+                "inputs": {"image": uploaded_image}
+            },
+            "5": {
+                "class_type": "CLIPTextEncode",
+                "inputs": {"text": prompt + ", smooth motion, cinematic", "clip": ["2", 0]}
+            },
+            "6": {
+                "class_type": "CLIPTextEncode",
+                "inputs": {"text": negative or "static, frozen, blurry, distorted", "clip": ["2", 0]}
+            },
+            "7": {
+                "class_type": "WanImageToVideo",
+                "inputs": {
+                    "positive": ["5", 0],
+                    "negative": ["6", 0],
+                    "vae": ["3", 0],
+                    "width": width,
+                    "height": height,
+                    "length": frames,
+                    "batch_size": 1,
+                    "start_image": ["4", 0]
+                }
+            },
+            "8": {
+                "class_type": "KSampler",
+                "inputs": {
+                    "seed": seed,
+                    "steps": 30,
+                    "cfg": 5.0,
+                    "sampler_name": "euler",
+                    "scheduler": "normal",
+                    "denoise": 1.0,
+                    "model": ["1", 0],
+                    "positive": ["7", 0],
+                    "negative": ["7", 1],
+                    "latent_image": ["7", 2]
+                }
+            },
+            "9": {
+                "class_type": "VAEDecode",
+                "inputs": {"samples": ["8", 0], "vae": ["3", 0]}
+            },
+            "10": {
+                "class_type": "VHS_VideoCombine",
+                "inputs": {
+                    "images": ["9", 0],
+                    "frame_rate": 16,
+                    "loop_count": 0,
+                    "filename_prefix": "vibe_i2v",
+                    "format": "image/webp",
+                    "pingpong": False,
+                    "save_output": True
+                }
+            }
+        }
     def status(self) -> str:
         """Get backend status."""
         if not self._initialized:

{vibe_aigc-0.6.1.dist-info → vibe_aigc-0.6.2.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: vibe-aigc
-Version: 0.6.1
+Version: 0.6.2
 Summary: A New Paradigm for Content Generation via Agentic Orchestration
 Author: Vibe AIGC Contributors
 License-Expression: MIT

{vibe_aigc-0.6.1.dist-info → vibe_aigc-0.6.2.dist-info}/RECORD RENAMED Viewed

@@ -18,7 +18,7 @@ vibe_aigc/persistence.py,sha256=inrJQjmCK4LighxQSmJorR6c7OvRzx-cmEb5HCQS9PY,1061
 vibe_aigc/planner.py,sha256=hmnASmofpahNuF9ei_0DxzHxm23vYjF67u-SB_G5EcU,33129
 vibe_aigc/tools.py,sha256=Tm_NA53yJjjvCrUuZ7YVtdLAdfUgxOLm5zZzIcJYvHI,15572
 vibe_aigc/tools_multimodal.py,sha256=asSJJqF0hrD9uNiYpuieVY-lbgEXjbK3UjT20nX2Lig,20405
-vibe_aigc/vibe_backend.py,sha256=RhiG7LRU3rvbW4x002tJ_4pYX_i2Nwz4QDmP5RksP0k,16610
+vibe_aigc/vibe_backend.py,sha256=LUm9t3JeGfezJTjau9XAQeRN_DmHrPX2PCjNRhGE4lQ,23808
 vibe_aigc/video.py,sha256=0fg8RUpEsaJqDskAPiGP8yuyQDVCUvIy-uLScq_BOwg,14111
 vibe_aigc/visualization.py,sha256=jDs2f1vj4k8ZnJTA_niKLBH2NMahTgWneiADlNmW24s,7143
 vibe_aigc/vlm_feedback.py,sha256=Da26q5qmJr-vwdsstum8CTAjbedeLWAGxZfla2BS0Ko,10781
@@ -28,9 +28,9 @@ vibe_aigc/workflow_executor.py,sha256=mfYLOTfPmI7Upooxy07nPmlbZ-HZAfC18IaNW80G31
 vibe_aigc/workflow_registry.py,sha256=Z6gB1cA366LXqHcfqBF1od_8ySxAOt5RpKKaaZPqqUo,22359
 vibe_aigc/workflow_strategies.py,sha256=i_qqUrn-2F6lT9dNyFdTdy0NzE8ZnRNxAMl6zrOAtD8,26148
 vibe_aigc/workflows.py,sha256=uk7RjNVow6eimEdqfVQFDtLgHSkg0LUjSoa2N7C47u0,13886
-vibe_aigc-0.6.1.dist-info/licenses/LICENSE,sha256=Ir4dCTvOsbfoiOh9vYbhIKDH59S7J6qhJYZmHHICoKY,1079
-vibe_aigc-0.6.1.dist-info/METADATA,sha256=X3gmW_JWtW65vqnlS5HhM79K1-72Qz0cUxzl3KiFVmg,6604
-vibe_aigc-0.6.1.dist-info/WHEEL,sha256=wUyA8OaulRlbfwMtmQsvNngGrxQHAvkKcvRmdizlJi0,92
-vibe_aigc-0.6.1.dist-info/entry_points.txt,sha256=2htp4yXJMvCAQXTB39XWWwbBPP3MYUYXsqlwMeQsd7o,49
-vibe_aigc-0.6.1.dist-info/top_level.txt,sha256=Cpjz8X0WEhnhaigqxmsZSl9VxduaDspj7WuVUGGLeao,10
-vibe_aigc-0.6.1.dist-info/RECORD,,
+vibe_aigc-0.6.2.dist-info/licenses/LICENSE,sha256=Ir4dCTvOsbfoiOh9vYbhIKDH59S7J6qhJYZmHHICoKY,1079
+vibe_aigc-0.6.2.dist-info/METADATA,sha256=Tdhh5kFrhVvnvWNe3MkcXwrTW7FL_0w4rZ15rtmar34,6604
+vibe_aigc-0.6.2.dist-info/WHEEL,sha256=wUyA8OaulRlbfwMtmQsvNngGrxQHAvkKcvRmdizlJi0,92
+vibe_aigc-0.6.2.dist-info/entry_points.txt,sha256=2htp4yXJMvCAQXTB39XWWwbBPP3MYUYXsqlwMeQsd7o,49
+vibe_aigc-0.6.2.dist-info/top_level.txt,sha256=Cpjz8X0WEhnhaigqxmsZSl9VxduaDspj7WuVUGGLeao,10
+vibe_aigc-0.6.2.dist-info/RECORD,,

{vibe_aigc-0.6.1.dist-info → vibe_aigc-0.6.2.dist-info}/WHEEL RENAMED Viewed

File without changes

{vibe_aigc-0.6.1.dist-info → vibe_aigc-0.6.2.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{vibe_aigc-0.6.1.dist-info → vibe_aigc-0.6.2.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

{vibe_aigc-0.6.1.dist-info → vibe_aigc-0.6.2.dist-info}/top_level.txt RENAMED Viewed

File without changes

vibe-aigc 0.6.1__py3-none-any.whl → 0.6.2__py3-none-any.whl

vibe-aigc 0.6.1__py3-none-any.whl → 0.6.2__py3-none-any.whl