ultimate-gemini-mcp 3.0.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,181 @@
1
+ """
2
+ Batch image generation tool for processing multiple prompts efficiently.
3
+ """
4
+
5
+ import asyncio
6
+ import json
7
+ import logging
8
+ from typing import Any
9
+
10
+ from ..config import MAX_BATCH_SIZE, get_settings
11
+ from ..core import validate_batch_size, validate_prompts_list
12
+ from .generate_image import generate_image_tool
13
+
14
+ logger = logging.getLogger(__name__)
15
+
16
+
17
async def batch_generate_images(
    prompts: list[str],
    model: str | None = None,
    enhance_prompt: bool = True,
    aspect_ratio: str = "1:1",
    output_format: str = "png",
    batch_size: int | None = None,
    **shared_params: Any,
) -> dict[str, Any]:
    """
    Generate multiple images from a list of prompts.

    Prompts are processed in parallel slices of ``batch_size`` using
    ``asyncio.gather``; a failure for one prompt is recorded in the result
    list and does not abort the remaining prompts.

    Args:
        prompts: List of text prompts
        model: Model to use for all images
        enhance_prompt: Enhance all prompts
        aspect_ratio: Aspect ratio for all images
        output_format: Output format for all images
        batch_size: Number of images to process in parallel (default: from config)
        **shared_params: Additional parameters shared across all generations

    Returns:
        Dict with batch results. ``success`` is True only when no prompt
        failed; per-prompt outcomes are listed under ``results``.
    """
    # Validate inputs
    validate_prompts_list(prompts)

    settings = get_settings()
    if batch_size is None:
        batch_size = settings.api.max_batch_size

    validate_batch_size(batch_size, MAX_BATCH_SIZE)

    # Aggregate result structure; counters are updated as prompts complete.
    results: dict[str, Any] = {
        "success": True,
        "total_prompts": len(prompts),
        "batch_size": batch_size,
        "completed": 0,
        "failed": 0,
        "results": [],
    }

    # Process prompts in parallel slices of batch_size.
    for i in range(0, len(prompts), batch_size):
        batch = prompts[i : i + batch_size]
        logger.info(f"Processing batch {i // batch_size + 1}: {len(batch)} prompts")

        # One task per prompt; all share the same generation settings.
        tasks = [
            generate_image_tool(
                prompt=prompt,
                model=model,
                enhance_prompt=enhance_prompt,
                aspect_ratio=aspect_ratio,
                output_format=output_format,
                **shared_params,
            )
            for prompt in batch
        ]

        # return_exceptions=True so one failed prompt cannot cancel the rest.
        batch_results = await asyncio.gather(*tasks, return_exceptions=True)

        for j, result in enumerate(batch_results):
            _record_batch_result(results, i + j, batch[j], result)

    # BUG FIX: "success" previously stayed True unconditionally, so a batch in
    # which every prompt failed still reported overall success. Reflect the
    # actual outcome: success means zero failures.
    results["success"] = results["failed"] == 0

    return results


def _record_batch_result(
    results: dict[str, Any],
    prompt_index: int,
    prompt: str,
    result: Any,
) -> None:
    """Fold a single prompt's outcome (value or exception) into the aggregate."""
    if isinstance(result, Exception):
        logger.error(f"Failed to generate image for prompt {prompt_index}: {result}")
        results["failed"] += 1
        results["results"].append(
            {
                "prompt_index": prompt_index,
                "prompt": prompt,
                "success": False,
                "error": str(result),
            }
        )
    elif not isinstance(result, dict):
        # Defensive: generate_image_tool should always return a dict.
        logger.error(f"Unexpected result type: {type(result)}")
        results["failed"] += 1
        results["results"].append(
            {
                "prompt_index": prompt_index,
                "prompt": prompt,
                "success": False,
                "error": "Unexpected result type",
            }
        )
    else:
        results["completed"] += 1
        results["results"].append(
            {"prompt_index": prompt_index, "prompt": prompt, **result}
        )
116
+
117
+
118
+ def register_batch_generate_tool(mcp_server: Any) -> None:
119
+ """Register batch_generate tool with MCP server."""
120
+
121
+ @mcp_server.tool()
122
+ async def batch_generate(
123
+ prompts: list[str],
124
+ model: str | None = None,
125
+ enhance_prompt: bool = True,
126
+ aspect_ratio: str = "1:1",
127
+ output_format: str = "png",
128
+ batch_size: int | None = None,
129
+ negative_prompt: str | None = None,
130
+ ) -> str:
131
+ """
132
+ Generate multiple images from a list of prompts efficiently.
133
+
134
+ Processes prompts in parallel batches for optimal performance.
135
+ All images share the same generation settings.
136
+
137
+ Args:
138
+ prompts: List of text descriptions for image generation
139
+ model: Model to use for all images (default: gemini-3-pro-image-preview)
140
+ enhance_prompt: Enhance all prompts automatically (default: True)
141
+ aspect_ratio: Aspect ratio for all images (default: 1:1)
142
+ output_format: Image format for all images (default: png)
143
+ batch_size: Parallel batch size (default: from config)
144
+ negative_prompt: Negative prompt for Imagen models (optional)
145
+
146
+ Returns:
147
+ JSON string with batch results including individual image paths
148
+
149
+ IMPORTANT - AI Assistant Instructions:
150
+ After batch generation completes, you MUST:
151
+ 1. Parse the JSON response to extract file paths from result["results"][i]["images"][0]["path"]
152
+ 2. Show the user a summary of all generated images with their file paths
153
+ 3. Optionally display one or more images using the Read tool
154
+ 4. Let the user know the total count of successful vs failed generations
155
+
156
+ Example response to user:
157
+ "Successfully generated 3 images:
158
+ 1. /path/to/image1.png - [description]
159
+ 2. /path/to/image2.png - [description]
160
+ 3. /path/to/image3.png - [description]"
161
+
162
+ DO NOT just say "batch generation completed" without listing the file paths!
163
+ """
164
+ try:
165
+ result = await batch_generate_images(
166
+ prompts=prompts,
167
+ model=model,
168
+ enhance_prompt=enhance_prompt,
169
+ aspect_ratio=aspect_ratio,
170
+ output_format=output_format,
171
+ batch_size=batch_size,
172
+ negative_prompt=negative_prompt,
173
+ )
174
+
175
+ return json.dumps(result, indent=2)
176
+
177
+ except Exception as e:
178
+ logger.error(f"Batch generation error: {e}")
179
+ return json.dumps(
180
+ {"success": False, "error": str(e), "error_type": type(e).__name__}, indent=2
181
+ )
@@ -0,0 +1,240 @@
1
+ """
2
+ Image generation tool supporting both Gemini and Imagen models.
3
+ """
4
+
5
+ import base64
6
+ import json
7
+ import logging
8
+ from pathlib import Path
9
+ from typing import Any
10
+
11
+ from ..config import get_settings
12
+ from ..core import (
13
+ validate_aspect_ratio,
14
+ validate_image_format,
15
+ validate_model,
16
+ validate_prompt,
17
+ )
18
+ from ..services import ImageService
19
+
20
+ logger = logging.getLogger(__name__)
21
+
22
+
23
async def generate_image_tool(
    prompt: str,
    model: str | None = None,
    enhance_prompt: bool = True,
    aspect_ratio: str = "1:1",
    image_size: str = "2K",
    output_format: str = "png",
    # Reference images (up to 14)
    reference_image_paths: list[str] | None = None,
    # Google Search grounding
    enable_google_search: bool = False,
    # Response modalities
    response_modalities: list[str] | None = None,
    # Output options
    save_to_disk: bool = True,
    **kwargs: Any,
) -> dict[str, Any]:
    """
    Generate images using Gemini 3 Pro Image.

    Args:
        prompt: Text description for image generation
        model: Model to use (default: gemini-3-pro-image-preview)
        enhance_prompt: Automatically enhance prompt for better results
        aspect_ratio: Image aspect ratio (1:1, 16:9, 9:16, etc.)
        image_size: Image resolution: 1K, 2K, or 4K (default: 2K)
        output_format: Image format (png, jpeg, webp). Validated, and echoed
            in response metadata; not currently forwarded to the service.
        reference_image_paths: Paths to reference images (up to 14)
        enable_google_search: Use Google Search for real-time data grounding
        response_modalities: Response types (TEXT, IMAGE - default: both)
        save_to_disk: Save images to output directory
        **kwargs: Unsupported extras; logged and ignored (see warning below).

    Returns:
        Dict with generated images and metadata
    """
    # Validate inputs before any network work.
    validate_prompt(prompt)
    if model:
        validate_model(model)
    validate_aspect_ratio(aspect_ratio)
    validate_image_format(output_format)

    # FIX: extra keyword arguments (e.g. negative_prompt forwarded by
    # batch_generate_images) were previously swallowed without a trace.
    # They are still not applied, but now the drop is visible in the log.
    if kwargs:
        logger.warning(f"Ignoring unsupported generation parameters: {sorted(kwargs)}")

    # Get settings
    settings = get_settings()

    # Determine model
    if model is None:
        model = settings.api.default_model

    # Initialize image service
    image_service = ImageService(
        api_key=settings.api.gemini_api_key,
        enable_enhancement=settings.api.enable_prompt_enhancement,
        timeout=settings.api.request_timeout,
    )

    try:
        # Prepare parameters for Gemini 3 Pro Image
        params: dict[str, Any] = {
            "aspect_ratio": aspect_ratio,
            "image_size": image_size,
        }

        # Add reference images if provided (up to 14); missing files are
        # skipped with a warning rather than failing the whole request.
        if reference_image_paths:
            reference_images = []
            for img_path in reference_image_paths[:14]:  # Limit to max 14
                image_path = Path(img_path)
                if image_path.exists():
                    image_data = base64.b64encode(image_path.read_bytes()).decode()
                    reference_images.append(image_data)
                else:
                    logger.warning(f"Reference image not found: {img_path}")

            if reference_images:
                params["reference_images"] = reference_images

        # Add Google Search grounding if enabled
        if enable_google_search:
            params["enable_google_search"] = True

        # Add response modalities
        if response_modalities:
            params["response_modalities"] = response_modalities

        # Generate images; enhancement must be enabled both by the caller and
        # by global settings.
        results = await image_service.generate(
            prompt=prompt,
            model=model,
            enhance_prompt=enhance_prompt and settings.api.enable_prompt_enhancement,
            **params,
        )

        # Prepare response
        response: dict[str, Any] = {
            "success": True,
            "model": model,
            "prompt": prompt,
            "images_generated": len(results),
            "images": [],
            "metadata": {
                "enhance_prompt": enhance_prompt,
                "aspect_ratio": aspect_ratio,
                # NOTE(review): output_format is validated above but never
                # passed to the service or to result.save(); echoed here so
                # callers can at least see the requested value. Confirm
                # whether ImageService should receive it.
                "output_format": output_format,
            },
        }

        # Save images and prepare for MCP response
        for result in results:
            image_info = {
                "index": result.index,
                "size": result.get_size(),
                "timestamp": result.timestamp.isoformat(),
            }

            if save_to_disk:
                # Save to output directory
                file_path = result.save(settings.output_dir)
                image_info["path"] = str(file_path)
                image_info["filename"] = file_path.name

            # Add enhanced prompt info
            if "enhanced_prompt" in result.metadata:
                image_info["enhanced_prompt"] = result.metadata["enhanced_prompt"]

            response["images"].append(image_info)

        return response

    finally:
        # Always release the service's underlying resources.
        await image_service.close()
153
+
154
+
155
+ def register_generate_image_tool(mcp_server: Any) -> None:
156
+ """Register generate_image tool with MCP server."""
157
+
158
+ @mcp_server.tool()
159
+ async def generate_image(
160
+ prompt: str,
161
+ model: str | None = None,
162
+ enhance_prompt: bool = True,
163
+ aspect_ratio: str = "1:1",
164
+ image_size: str = "2K",
165
+ output_format: str = "png",
166
+ reference_image_paths: list[str] | None = None,
167
+ enable_google_search: bool = False,
168
+ response_modalities: list[str] | None = None,
169
+ ) -> str:
170
+ """
171
+ Generate images using Gemini 3 Pro Image - a state-of-the-art image generation model
172
+ optimized for professional asset production with advanced reasoning capabilities.
173
+
174
+ Features:
175
+ - High-resolution output: 1K, 2K, and 4K visuals
176
+ - Advanced text rendering for infographics, menus, diagrams
177
+ - Up to 14 reference images for consistent style/characters
178
+ - Google Search grounding for real-time data (weather, stocks, events)
179
+ - Thinking mode: Uses reasoning to refine composition
180
+
181
+ Args:
182
+ prompt: Text description of the image to generate
183
+ model: Model to use (default: gemini-3-pro-image-preview)
184
+ enhance_prompt: Automatically enhance prompt using AI (default: True)
185
+ aspect_ratio: Image aspect ratio like 1:1, 16:9, 9:16, 3:2, 4:5, etc. (default: 1:1)
186
+ image_size: Image resolution: 1K, 2K, or 4K (default: 2K)
187
+ output_format: Image format: png, jpeg, webp (default: png)
188
+ reference_image_paths: Paths to reference images (up to 14 total, max 6 objects, max 5 humans)
189
+ enable_google_search: Enable Google Search grounding for real-time data
190
+ response_modalities: Response types like ["TEXT", "IMAGE"] (default: both)
191
+
192
+ Available models:
193
+ - gemini-3-pro-image-preview (default and only model)
194
+
195
+ Returns:
196
+ JSON string with generation results, file paths, thoughts, and grounding metadata
197
+
198
+ IMPORTANT - AI Assistant Instructions:
199
+ After generating an image, you MUST:
200
+ 1. Parse the JSON response to extract the file path from result["images"][0]["path"]
201
+ 2. Inform the user of the EXACT file path where the image was saved
202
+ 3. Use the Read tool to load and display the image to the user
203
+ 4. If thoughts were generated, show the thinking process to the user
204
+ 5. Optionally: Use bash to open the image in the default viewer:
205
+ - macOS: `open /path/to/image.png`
206
+ - Linux: `xdg-open /path/to/image.png`
207
+ - Windows: `start /path/to/image.png`
208
+
209
+ Example workflow:
210
+ ```
211
+ 1. Call generate_image tool
212
+ 2. Parse response JSON to get file_path and thoughts
213
+ 3. Tell user: "Image saved to: /Users/name/gemini_images/image.png"
214
+ 4. Show thinking process if present
215
+ 5. Call Read tool with the file_path to display the image
216
+ 6. Optionally call Bash with `open /path/to/image.png` to open in Preview
217
+ ```
218
+
219
+ DO NOT just say "image generated successfully" without showing the path and image!
220
+ """
221
+ try:
222
+ result = await generate_image_tool(
223
+ prompt=prompt,
224
+ model=model,
225
+ enhance_prompt=enhance_prompt,
226
+ aspect_ratio=aspect_ratio,
227
+ image_size=image_size,
228
+ output_format=output_format,
229
+ reference_image_paths=reference_image_paths,
230
+ enable_google_search=enable_google_search,
231
+ response_modalities=response_modalities,
232
+ )
233
+
234
+ return json.dumps(result, indent=2)
235
+
236
+ except Exception as e:
237
+ logger.error(f"Error generating image: {e}")
238
+ return json.dumps(
239
+ {"success": False, "error": str(e), "error_type": type(e).__name__}, indent=2
240
+ )