PyPI - vibe-aigc - Versions diffs - 0.6.2__py3-none-any.whl → 0.6.3__py3-none-any.whl - Mend

vibe-aigc 0.6.2__py3-none-any.whl → 0.6.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8)

vibe_aigc/tools.py CHANGED Viewed

@@ -496,8 +496,12 @@ class ToolRegistry:
         return "\n".join(lines)
-def create_default_registry() -> ToolRegistry:
-    """Create a registry with default tools."""
+def create_default_registry(comfyui_url: str = "http://127.0.0.1:8188") -> ToolRegistry:
+    """Create a registry with default tools.
+    Args:
+        comfyui_url: URL for ComfyUI server (for image/video generation)
+    """
     registry = ToolRegistry()
     # Register built-in tools
@@ -505,4 +509,12 @@ def create_default_registry() -> ToolRegistry:
     registry.register(TemplateTool())
     registry.register(CombineTool())
+    # Register ComfyUI-based generation tools (Paper Section 5.4)
+    try:
+        from .tools_comfyui import create_comfyui_tools
+        for tool in create_comfyui_tools(comfyui_url):
+            registry.register(tool)
+    except ImportError:
+        pass  # ComfyUI tools optional
     return registry

vibe_aigc/tools_comfyui.py ADDED Viewed

@@ -0,0 +1,271 @@
+"""
+ComfyUI Generation Tools - Image and Video Generation via VibeBackend.
+Integrates the VibeBackend into the Paper's tool architecture (Section 5.4):
+"The Planner traverses the system's atomic tool library...to select
+the optimal ensemble of components."
+This makes ComfyUI-based generation available to MetaPlanner as atomic tools.
+"""
+from typing import Dict, Any, Optional
+from dataclasses import dataclass
+from .tools import BaseTool, ToolSpec, ToolResult, ToolCategory
+from .vibe_backend import VibeBackend, GenerationRequest, GenerationResult
+from .discovery import Capability
+class ImageGenerationTool(BaseTool):
+    """
+    Image generation tool using local ComfyUI.
+    Maps high-level image requests to VibeBackend execution.
+    MetaPlanner can use this for visual content generation.
+    """
+    def __init__(self, comfyui_url: str = "http://127.0.0.1:8188"):
+        self.comfyui_url = comfyui_url
+        self._backend: Optional[VibeBackend] = None
+    @property
+    def spec(self) -> ToolSpec:
+        return ToolSpec(
+            name="image_generation",
+            description="Generate images using local AI models (FLUX, SD, etc.)",
+            category=ToolCategory.IMAGE,
+            input_schema={
+                "type": "object",
+                "required": ["prompt"],
+                "properties": {
+                    "prompt": {"type": "string", "description": "Image description"},
+                    "negative_prompt": {"type": "string", "description": "What to avoid"},
+                    "style": {"type": "string", "description": "Visual style hints"},
+                    "width": {"type": "integer", "default": 768},
+                    "height": {"type": "integer", "default": 512},
+                    "steps": {"type": "integer", "default": 20},
+                    "cfg": {"type": "number", "default": 7.0}
+                }
+            },
+            output_schema={
+                "type": "object",
+                "properties": {
+                    "image_url": {"type": "string"},
+                    "quality_score": {"type": "number"},
+                    "feedback": {"type": "string"}
+                }
+            },
+            examples=[
+                {
+                    "input": {"prompt": "cyberpunk cityscape at night, neon lights, rain"},
+                    "output": {"image_url": "http://...", "quality_score": 7.5}
+                }
+            ]
+        )
+    async def _ensure_backend(self) -> VibeBackend:
+        """Lazily initialize backend."""
+        if self._backend is None:
+            self._backend = VibeBackend(
+                comfyui_url=self.comfyui_url,
+                enable_vlm=True,
+                max_attempts=2,
+                quality_threshold=6.0
+            )
+            await self._backend.initialize()
+        return self._backend
+    async def execute(
+        self,
+        inputs: Dict[str, Any],
+        context: Optional[Dict[str, Any]] = None
+    ) -> ToolResult:
+        """Generate an image based on inputs."""
+        try:
+            backend = await self._ensure_backend()
+            # Build prompt from inputs + context (knowledge base hints)
+            prompt = inputs.get("prompt", "")
+            style = inputs.get("style", "")
+            # If knowledge base provided style hints, incorporate them
+            if context and "technical_specs" in context:
+                specs = context["technical_specs"]
+                if "lighting" in specs:
+                    prompt += f", {', '.join(specs['lighting'])}"
+                if "color_grading" in specs:
+                    prompt += f", {specs['color_grading']}"
+            if style:
+                prompt = f"{prompt}, {style}"
+            result = await backend.generate(GenerationRequest(
+                prompt=prompt,
+                capability=Capability.TEXT_TO_IMAGE,
+                negative_prompt=inputs.get("negative_prompt", ""),
+                width=inputs.get("width", 768),
+                height=inputs.get("height", 512),
+                steps=inputs.get("steps", 20),
+                cfg=inputs.get("cfg", 7.0)
+            ))
+            if result.success:
+                return ToolResult(
+                    success=True,
+                    output={
+                        "image_url": result.output_url,
+                        "quality_score": result.quality_score,
+                        "feedback": result.feedback,
+                        "strengths": result.strengths,
+                        "weaknesses": result.weaknesses
+                    },
+                    metadata={
+                        "model_used": result.model_used,
+                        "attempts": result.attempts
+                    }
+                )
+            else:
+                return ToolResult(
+                    success=False,
+                    output=None,
+                    error=result.error
+                )
+        except Exception as e:
+            return ToolResult(
+                success=False,
+                output=None,
+                error=str(e)
+            )
+class VideoGenerationTool(BaseTool):
+    """
+    Video generation tool using local ComfyUI.
+    Uses the I2V pipeline: FLUX → Wan I2V animation.
+    MetaPlanner can use this for motion content.
+    """
+    def __init__(self, comfyui_url: str = "http://127.0.0.1:8188"):
+        self.comfyui_url = comfyui_url
+        self._backend: Optional[VibeBackend] = None
+    @property
+    def spec(self) -> ToolSpec:
+        return ToolSpec(
+            name="video_generation",
+            description="Generate videos using local AI models (FLUX + Wan I2V)",
+            category=ToolCategory.VIDEO,
+            input_schema={
+                "type": "object",
+                "required": ["prompt"],
+                "properties": {
+                    "prompt": {"type": "string", "description": "Video description"},
+                    "negative_prompt": {"type": "string", "description": "What to avoid"},
+                    "style": {"type": "string", "description": "Visual style hints"},
+                    "motion": {"type": "string", "description": "Motion description"},
+                    "width": {"type": "integer", "default": 832},
+                    "height": {"type": "integer", "default": 480},
+                    "frames": {"type": "integer", "default": 33},
+                    "fps": {"type": "integer", "default": 16}
+                }
+            },
+            output_schema={
+                "type": "object",
+                "properties": {
+                    "video_url": {"type": "string"},
+                    "duration_seconds": {"type": "number"}
+                }
+            },
+            examples=[
+                {
+                    "input": {"prompt": "samurai walking through rain", "frames": 33},
+                    "output": {"video_url": "http://...", "duration_seconds": 2.0}
+                }
+            ]
+        )
+    async def _ensure_backend(self) -> VibeBackend:
+        """Lazily initialize backend."""
+        if self._backend is None:
+            self._backend = VibeBackend(
+                comfyui_url=self.comfyui_url,
+                enable_vlm=False,  # VLM slower for video
+                max_attempts=1
+            )
+            await self._backend.initialize()
+        return self._backend
+    async def execute(
+        self,
+        inputs: Dict[str, Any],
+        context: Optional[Dict[str, Any]] = None
+    ) -> ToolResult:
+        """Generate a video based on inputs."""
+        try:
+            backend = await self._ensure_backend()
+            # Build prompt
+            prompt = inputs.get("prompt", "")
+            style = inputs.get("style", "")
+            motion = inputs.get("motion", "")
+            # Incorporate knowledge base hints
+            if context and "technical_specs" in context:
+                specs = context["technical_specs"]
+                if "camera" in specs:
+                    prompt += f", {', '.join(specs['camera'][:2])}"
+                if "editing" in specs:
+                    motion = motion or specs["editing"][0] if specs["editing"] else ""
+            if style:
+                prompt = f"{prompt}, {style}"
+            if motion:
+                prompt = f"{prompt}, {motion}"
+            frames = inputs.get("frames", 33)
+            fps = inputs.get("fps", 16)
+            result = await backend.generate(GenerationRequest(
+                prompt=prompt,
+                capability=Capability.TEXT_TO_VIDEO,
+                negative_prompt=inputs.get("negative_prompt", ""),
+                width=inputs.get("width", 832),
+                height=inputs.get("height", 480),
+                frames=frames,
+                steps=20,
+                cfg=5.0
+            ))
+            if result.success:
+                return ToolResult(
+                    success=True,
+                    output={
+                        "video_url": result.output_url,
+                        "duration_seconds": frames / fps
+                    },
+                    metadata={
+                        "frames": frames,
+                        "fps": fps
+                    }
+                )
+            else:
+                return ToolResult(
+                    success=False,
+                    output=None,
+                    error=result.error
+                )
+        except Exception as e:
+            return ToolResult(
+                success=False,
+                output=None,
+                error=str(e)
+            )
+def create_comfyui_tools(comfyui_url: str = "http://127.0.0.1:8188") -> list:
+    """Create ComfyUI-based generation tools."""
+    return [
+        ImageGenerationTool(comfyui_url=comfyui_url),
+        VideoGenerationTool(comfyui_url=comfyui_url)
+    ]

{vibe_aigc-0.6.2.dist-info → vibe_aigc-0.6.3.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: vibe-aigc
-Version: 0.6.2
+Version: 0.6.3
 Summary: A New Paradigm for Content Generation via Agentic Orchestration
 Author: Vibe AIGC Contributors
 License-Expression: MIT

{vibe_aigc-0.6.2.dist-info → vibe_aigc-0.6.3.dist-info}/RECORD RENAMED Viewed

@@ -16,7 +16,8 @@ vibe_aigc/models.py,sha256=wIwlN_NDL_72YXRq3Igi5X5fx1ZFGG7ER6pO5MdL4-I,2408
 vibe_aigc/mv_pipeline.py,sha256=OvVnlSM8iPjrT5qmhE47p6-shKOAxN7_XqsQneuqLkk,25303
 vibe_aigc/persistence.py,sha256=inrJQjmCK4LighxQSmJorR6c7OvRzx-cmEb5HCQS9PY,10614
 vibe_aigc/planner.py,sha256=hmnASmofpahNuF9ei_0DxzHxm23vYjF67u-SB_G5EcU,33129
-vibe_aigc/tools.py,sha256=Tm_NA53yJjjvCrUuZ7YVtdLAdfUgxOLm5zZzIcJYvHI,15572
+vibe_aigc/tools.py,sha256=Ix0JKwCATtcZykG9F3gK0gM9zw9vu_4mO_NHxkUxc-s,15997
+vibe_aigc/tools_comfyui.py,sha256=sHe6bhYegrm2AAPzDuYyL4vcAJe_NG34vqjrLbovVX8,9979
 vibe_aigc/tools_multimodal.py,sha256=asSJJqF0hrD9uNiYpuieVY-lbgEXjbK3UjT20nX2Lig,20405
 vibe_aigc/vibe_backend.py,sha256=LUm9t3JeGfezJTjau9XAQeRN_DmHrPX2PCjNRhGE4lQ,23808
 vibe_aigc/video.py,sha256=0fg8RUpEsaJqDskAPiGP8yuyQDVCUvIy-uLScq_BOwg,14111
@@ -28,9 +29,9 @@ vibe_aigc/workflow_executor.py,sha256=mfYLOTfPmI7Upooxy07nPmlbZ-HZAfC18IaNW80G31
 vibe_aigc/workflow_registry.py,sha256=Z6gB1cA366LXqHcfqBF1od_8ySxAOt5RpKKaaZPqqUo,22359
 vibe_aigc/workflow_strategies.py,sha256=i_qqUrn-2F6lT9dNyFdTdy0NzE8ZnRNxAMl6zrOAtD8,26148
 vibe_aigc/workflows.py,sha256=uk7RjNVow6eimEdqfVQFDtLgHSkg0LUjSoa2N7C47u0,13886
-vibe_aigc-0.6.2.dist-info/licenses/LICENSE,sha256=Ir4dCTvOsbfoiOh9vYbhIKDH59S7J6qhJYZmHHICoKY,1079
-vibe_aigc-0.6.2.dist-info/METADATA,sha256=Tdhh5kFrhVvnvWNe3MkcXwrTW7FL_0w4rZ15rtmar34,6604
-vibe_aigc-0.6.2.dist-info/WHEEL,sha256=wUyA8OaulRlbfwMtmQsvNngGrxQHAvkKcvRmdizlJi0,92
-vibe_aigc-0.6.2.dist-info/entry_points.txt,sha256=2htp4yXJMvCAQXTB39XWWwbBPP3MYUYXsqlwMeQsd7o,49
-vibe_aigc-0.6.2.dist-info/top_level.txt,sha256=Cpjz8X0WEhnhaigqxmsZSl9VxduaDspj7WuVUGGLeao,10
-vibe_aigc-0.6.2.dist-info/RECORD,,
+vibe_aigc-0.6.3.dist-info/licenses/LICENSE,sha256=Ir4dCTvOsbfoiOh9vYbhIKDH59S7J6qhJYZmHHICoKY,1079
+vibe_aigc-0.6.3.dist-info/METADATA,sha256=5TjNBFqxPDHGzXA5N-ihp-ojTmvgGm4Z-aaSmAzLyzk,6604
+vibe_aigc-0.6.3.dist-info/WHEEL,sha256=wUyA8OaulRlbfwMtmQsvNngGrxQHAvkKcvRmdizlJi0,92
+vibe_aigc-0.6.3.dist-info/entry_points.txt,sha256=2htp4yXJMvCAQXTB39XWWwbBPP3MYUYXsqlwMeQsd7o,49
+vibe_aigc-0.6.3.dist-info/top_level.txt,sha256=Cpjz8X0WEhnhaigqxmsZSl9VxduaDspj7WuVUGGLeao,10
+vibe_aigc-0.6.3.dist-info/RECORD,,

{vibe_aigc-0.6.2.dist-info → vibe_aigc-0.6.3.dist-info}/WHEEL RENAMED Viewed

File without changes

{vibe_aigc-0.6.2.dist-info → vibe_aigc-0.6.3.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{vibe_aigc-0.6.2.dist-info → vibe_aigc-0.6.3.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

{vibe_aigc-0.6.2.dist-info → vibe_aigc-0.6.3.dist-info}/top_level.txt RENAMED Viewed

File without changes

vibe-aigc 0.6.2__py3-none-any.whl → 0.6.3__py3-none-any.whl

vibe-aigc 0.6.2__py3-none-any.whl → 0.6.3__py3-none-any.whl