xinference-1.9.0-py3-none-any.whl → xinference-1.10.0-py3-none-any.whl
This diff compares the contents of the two publicly released package versions as they appear in their public registry; it is provided for informational purposes only.
- xinference/_version.py +3 -3
- xinference/api/restful_api.py +415 -1
- xinference/constants.py +2 -0
- xinference/core/model.py +3 -4
- xinference/core/supervisor.py +29 -1
- xinference/core/worker.py +4 -1
- xinference/deploy/cmdline.py +2 -0
- xinference/deploy/test/test_cmdline.py +1 -1
- xinference/model/audio/core.py +5 -0
- xinference/model/audio/cosyvoice.py +0 -1
- xinference/model/audio/kokoro.py +1 -1
- xinference/model/audio/kokoro_zh.py +124 -0
- xinference/model/audio/model_spec.json +64 -20
- xinference/model/embedding/flag/core.py +5 -0
- xinference/model/embedding/llama_cpp/core.py +22 -19
- xinference/model/embedding/sentence_transformers/core.py +19 -4
- xinference/model/embedding/vllm/core.py +40 -8
- xinference/model/image/cache_manager.py +56 -0
- xinference/model/image/core.py +9 -0
- xinference/model/image/model_spec.json +116 -9
- xinference/model/image/stable_diffusion/core.py +141 -31
- xinference/model/llm/core.py +10 -0
- xinference/model/llm/llama_cpp/core.py +42 -40
- xinference/model/llm/llm_family.json +435 -23
- xinference/model/llm/llm_family.py +1 -0
- xinference/model/llm/mlx/core.py +52 -33
- xinference/model/llm/sglang/core.py +2 -44
- xinference/model/llm/tool_parsers/__init__.py +58 -0
- xinference/model/llm/tool_parsers/abstract_tool_parser.py +33 -0
- xinference/model/llm/tool_parsers/deepseek_r1_tool_parser.py +128 -0
- xinference/model/llm/tool_parsers/deepseek_v3_tool_parser.py +145 -0
- xinference/model/llm/tool_parsers/glm4_tool_parser.py +123 -0
- xinference/model/llm/tool_parsers/llama3_tool_parser.py +77 -0
- xinference/model/llm/tool_parsers/qwen_tool_parser.py +320 -0
- xinference/model/llm/transformers/core.py +6 -12
- xinference/model/llm/utils.py +128 -46
- xinference/model/llm/vllm/core.py +8 -61
- xinference/model/rerank/core.py +3 -0
- xinference/model/rerank/sentence_transformers/core.py +1 -1
- xinference/model/rerank/vllm/core.py +56 -6
- xinference/model/utils.py +1 -2
- xinference/model/video/model_spec.json +95 -1
- xinference/thirdparty/cosyvoice/bin/export_jit.py +3 -4
- xinference/thirdparty/cosyvoice/bin/export_onnx.py +49 -126
- xinference/thirdparty/cosyvoice/bin/{inference.py → inference_deprecated.py} +1 -0
- xinference/thirdparty/cosyvoice/bin/train.py +23 -3
- xinference/thirdparty/cosyvoice/cli/cosyvoice.py +8 -4
- xinference/thirdparty/cosyvoice/cli/frontend.py +4 -4
- xinference/thirdparty/cosyvoice/cli/model.py +53 -75
- xinference/thirdparty/cosyvoice/dataset/dataset.py +5 -18
- xinference/thirdparty/cosyvoice/dataset/processor.py +24 -25
- xinference/thirdparty/cosyvoice/flow/decoder.py +24 -433
- xinference/thirdparty/cosyvoice/flow/flow.py +6 -14
- xinference/thirdparty/cosyvoice/flow/flow_matching.py +33 -145
- xinference/thirdparty/cosyvoice/hifigan/generator.py +169 -1
- xinference/thirdparty/cosyvoice/llm/llm.py +108 -17
- xinference/thirdparty/cosyvoice/transformer/upsample_encoder.py +14 -115
- xinference/thirdparty/cosyvoice/utils/common.py +20 -0
- xinference/thirdparty/cosyvoice/utils/executor.py +8 -4
- xinference/thirdparty/cosyvoice/utils/file_utils.py +45 -1
- xinference/thirdparty/cosyvoice/utils/losses.py +37 -0
- xinference/thirdparty/cosyvoice/utils/mask.py +35 -1
- xinference/thirdparty/cosyvoice/utils/train_utils.py +24 -6
- xinference/thirdparty/cosyvoice/vllm/cosyvoice2.py +103 -0
- xinference/types.py +105 -2
- xinference/ui/gradio/chat_interface.py +2 -0
- xinference/ui/gradio/media_interface.py +353 -7
- xinference/ui/web/ui/build/asset-manifest.json +3 -3
- xinference/ui/web/ui/build/index.html +1 -1
- xinference/ui/web/ui/build/static/js/main.1086c759.js +3 -0
- xinference/ui/web/ui/build/static/js/main.1086c759.js.map +1 -0
- xinference/ui/web/ui/node_modules/.cache/babel-loader/3c5758bd12fa334294b1de0ff6b1a4bac8d963c45472eab9dc3e530d82aa6b3f.json +1 -0
- xinference/ui/web/ui/node_modules/.cache/babel-loader/a3eb18af328280b139693c9092dff2a0ef8c9a967e6c8956ceee0996611f1984.json +1 -0
- xinference/ui/web/ui/node_modules/.cache/babel-loader/d5c224be7081f18cba1678b7874a9782eba895df004874ff8f243f94ba79942a.json +1 -0
- xinference/ui/web/ui/node_modules/.cache/babel-loader/f7f18bfb539b036a6a342176dd98a85df5057a884a8da978d679f2a0264883d0.json +1 -0
- xinference/ui/web/ui/src/locales/en.json +2 -0
- xinference/ui/web/ui/src/locales/ja.json +2 -0
- xinference/ui/web/ui/src/locales/ko.json +2 -0
- xinference/ui/web/ui/src/locales/zh.json +2 -0
- {xinference-1.9.0.dist-info → xinference-1.10.0.dist-info}/METADATA +16 -12
- {xinference-1.9.0.dist-info → xinference-1.10.0.dist-info}/RECORD +86 -77
- xinference/ui/web/ui/build/static/js/main.4918643a.js +0 -3
- xinference/ui/web/ui/build/static/js/main.4918643a.js.map +0 -1
- xinference/ui/web/ui/node_modules/.cache/babel-loader/3d2a89f0eccc1f90fc5036c9a1d587c2120e6a6b128aae31d1db7d6bad52722b.json +0 -1
- xinference/ui/web/ui/node_modules/.cache/babel-loader/89179f8f51887b9167721860a12412549ff04f78162e921a7b6aa6532646deb2.json +0 -1
- xinference/ui/web/ui/node_modules/.cache/babel-loader/8e5cb82c2ff3299c6a44563fe6b1c5515c9750613c51bb63abee0b1d70fc5019.json +0 -1
- xinference/ui/web/ui/node_modules/.cache/babel-loader/9dc5cfc67dd0617b0272aeef8651f1589b2155a4ff1fd72ad3166b217089b619.json +0 -1
- /xinference/ui/web/ui/build/static/js/{main.4918643a.js.LICENSE.txt → main.1086c759.js.LICENSE.txt} +0 -0
- {xinference-1.9.0.dist-info → xinference-1.10.0.dist-info}/WHEEL +0 -0
- {xinference-1.9.0.dist-info → xinference-1.10.0.dist-info}/entry_points.txt +0 -0
- {xinference-1.9.0.dist-info → xinference-1.10.0.dist-info}/licenses/LICENSE +0 -0
- {xinference-1.9.0.dist-info → xinference-1.10.0.dist-info}/top_level.txt +0 -0
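A large share of the new code lands in the xinference/model/llm/tool_parsers/ package listed above, which factors model-specific tool-call extraction (Qwen, GLM4, Llama 3, DeepSeek R1/V3) out of the shared chat utilities. Purely as an illustration of the kind of work such a parser does, and not the package's actual implementation, the sketch below pulls JSON tool calls out of the <tool_call>...</tool_call> tags that Qwen-style chat models emit; the function name and regex are hypothetical.

import json
import re
from typing import Any, Dict, List

# Hypothetical, simplified illustration; the real parsers live in
# xinference/model/llm/tool_parsers/ and handle more formats and edge cases.
TOOL_CALL_RE = re.compile(r"<tool_call>\s*(\{.*?\})\s*</tool_call>", re.DOTALL)

def parse_qwen_style_tool_calls(text: str) -> List[Dict[str, Any]]:
    """Extract JSON bodies wrapped in <tool_call> tags from generated text."""
    calls: List[Dict[str, Any]] = []
    for match in TOOL_CALL_RE.finditer(text):
        try:
            calls.append(json.loads(match.group(1)))
        except json.JSONDecodeError:
            continue  # skip malformed tool calls instead of failing the whole reply
    return calls

print(parse_qwen_style_tool_calls(
    'Sure. <tool_call>{"name": "get_weather", "arguments": {"city": "Paris"}}</tool_call>'
))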
xinference/types.py
CHANGED
@@ -351,6 +351,11 @@ class ModelAndPrompt(BaseModel):
     prompt: str
 
 
+class ModelAndMessages(BaseModel):
+    model: str
+    messages: List[Dict[str, Any]]
+
+
 class CreateCompletionTorch(BaseModel):
     echo: bool = echo_field
     max_tokens: Optional[int] = max_tokens_field
@@ -371,7 +376,6 @@ class CreateCompletionTorch(BaseModel):
 # This type is for openai API compatibility
 CreateCompletionOpenAI: BaseModel
 
-
 from openai.types.completion_create_params import CompletionCreateParamsNonStreaming
 
 CreateCompletionOpenAI = create_model_from_typeddict(
@@ -395,7 +399,6 @@ class CreateChatModel(BaseModel):
 # Currently, chat calls generates, so the params share the same one.
 CreateChatCompletionTorch = CreateCompletionTorch
 
-
 from ._compat import CreateChatCompletionOpenAI
 
 
@@ -462,3 +465,103 @@ class PeftModelConfig:
             image_lora_load_kwargs=data.get("image_lora_load_kwargs"),
             image_lora_fuse_kwargs=data.get("image_lora_fuse_kwargs"),
         )
+
+
+# This type is for Anthropic API compatibility
+ANTHROPIC_AVAILABLE = False
+
+try:
+    from anthropic.types import ContentBlock, Usage
+
+    ANTHROPIC_AVAILABLE = True
+except ImportError:
+    ContentBlock = None
+    Usage = None
+
+# Use TYPE_CHECKING to avoid runtime issues with mypy
+from typing import TYPE_CHECKING
+
+if TYPE_CHECKING:
+    # For type checking, define the types as if Anthropic is available
+    from anthropic.types import ContentBlock as ContentBlock_
+    from anthropic.types import Usage as Usage_
+
+    class AnthropicMessage(TypedDict):
+        id: str
+        type: str
+        role: str
+        content: List[ContentBlock_]
+        model: str
+        stop_reason: str
+        stop_sequence: str
+        usage: Usage_
+        container: Dict[str, Any]
+
+    class MessageCreateParams(TypedDict):
+        model: str
+        messages: List[Dict[str, Any]]
+        max_tokens: int
+        stream: NotRequired[bool]
+        temperature: NotRequired[float]
+        top_p: NotRequired[float]
+        top_k: NotRequired[int]
+        stop_sequences: NotRequired[List[str]]
+        metadata: NotRequired[Dict[str, Any]]
+        tools: NotRequired[List[Dict[str, Any]]]
+        tool_choice: NotRequired[Union[str, Dict[str, Any]]]
+
+    CreateMessageAnthropic: BaseModel
+
+    class CreateMessage(
+        ModelAndMessages,
+    ):
+        pass
+
+else:
+    # Runtime definitions
+    if ANTHROPIC_AVAILABLE:
+
+        class AnthropicMessage(TypedDict):
+            id: str
+            type: str
+            role: str
+            content: List[ContentBlock]
+            model: str
+            stop_reason: str
+            stop_sequence: str
+            usage: Usage
+            container: Dict[str, Any]
+
+        class MessageCreateParams(TypedDict):
+            model: str
+            messages: List[Dict[str, Any]]
+            max_tokens: int
+            stream: NotRequired[bool]
+            temperature: NotRequired[float]
+            top_p: NotRequired[float]
+            top_k: NotRequired[int]
+            stop_sequences: NotRequired[List[str]]
+            metadata: NotRequired[Dict[str, Any]]
+            tools: NotRequired[List[Dict[str, Any]]]
+            tool_choice: NotRequired[Union[str, Dict[str, Any]]]
+
+        CreateMessageAnthropic: BaseModel = create_model_from_typeddict(
+            MessageCreateParams,
+        )
+        CreateMessageAnthropic = fix_forward_ref(CreateMessageAnthropic)
+
+        class CreateMessage(CreateMessageAnthropic):
+            pass
+
+    else:
+        # Define dummy types when Anthropic is not available
+        class AnthropicMessage:
+            pass
+
+        class MessageCreateParams:
+            pass
+
+        CreateMessageAnthropic = None
+
+        class CreateMessage:
+            pass
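The Anthropic-compatibility block added above mirrors the existing OpenAI-compatibility pattern in this file: when the anthropic package is importable, MessageCreateParams is turned into a pydantic model via create_model_from_typeddict and exposed as CreateMessageAnthropic; otherwise the names degrade to placeholders. Below is a minimal validation sketch under the assumption that anthropic is installed; the payload values are placeholders.

from xinference.types import ANTHROPIC_AVAILABLE, CreateMessageAnthropic

payload = {
    "model": "my-model",  # placeholder model name
    "messages": [{"role": "user", "content": "Hello"}],
    "max_tokens": 128,
    "temperature": 0.7,  # optional (NotRequired) field
}

if ANTHROPIC_AVAILABLE and CreateMessageAnthropic is not None:
    # create_model_from_typeddict yields a pydantic model, so this validates the fields
    request = CreateMessageAnthropic(**payload)
    # Support both pydantic v1 and v2 dump methods
    dump = request.model_dump() if hasattr(request, "model_dump") else request.dict()
    print(dump)
else:
    print("anthropic is not installed; CreateMessageAnthropic is None")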
xinference/ui/gradio/media_interface.py
CHANGED
@@ -224,6 +224,7 @@ class MediaInterface:
             guidance_scale: int,
             num_inference_steps: int,
             padding_image_to_multiple: int,
+            strength: float,
             sampler_name: Optional[str] = None,
             progress=gr.Progress(),
         ) -> PIL.Image.Image:
@@ -243,6 +244,10 @@ class MediaInterface:
                 None if num_inference_steps == -1 else num_inference_steps  # type: ignore
             )
             padding_image_to_multiple = None if padding_image_to_multiple == -1 else padding_image_to_multiple  # type: ignore
+            # Initialize kwargs and handle strength parameter
+            kwargs = {}
+            if strength is not None:
+                kwargs["strength"] = strength
             sampler_name = None if sampler_name == "default" else sampler_name
 
             bio = io.BytesIO()
@@ -267,6 +272,7 @@ class MediaInterface:
                         guidance_scale=guidance_scale,
                         padding_image_to_multiple=padding_image_to_multiple,
                         sampler_name=sampler_name,
+                        **kwargs,
                     )
                 except Exception as e:
                     exc = e
@@ -324,6 +330,9 @@ class MediaInterface:
                     padding_image_to_multiple = gr.Number(
                         label="Padding image to multiple", value=-1
                     )
+                    strength = gr.Slider(
+                        label="Strength", value=0.6, step=0.1, minimum=0.0, maximum=1.0
+                    )
                     sampler_name = gr.Dropdown(
                         choices=SAMPLING_METHODS,
                         value="default",
@@ -348,12 +357,311 @@ class MediaInterface:
                     guidance_scale,
                     num_inference_steps,
                     padding_image_to_multiple,
+                    strength,
                     sampler_name,
                 ],
                 outputs=output_gallery,
             )
         return image2image_inteface
 
+    def inpainting_interface(self) -> "gr.Blocks":
+        from ...model.image.stable_diffusion.core import SAMPLING_METHODS
+
+        def preview_mask(
+            image_editor_output: Dict[str, Any],
+        ) -> PIL.Image.Image:
+            """Preview the generated mask without submitting inpainting task"""
+            # Extract original image and mask from ImageEditor output
+            if not image_editor_output or "background" not in image_editor_output:
+                return PIL.Image.new(
+                    "L", (512, 512), 0
+                )  # Return black image if no input
+
+            # Get the original image (background)
+            original_image = image_editor_output["background"]
+
+            # Get the composite image which contains the edits
+            composite_image = image_editor_output.get("composite", original_image)
+
+            # Create mask from the differences between original and composite
+            # White areas in composite indicate regions to inpaint
+            if original_image.mode != "RGB":
+                original_image = original_image.convert("RGB")
+            if composite_image.mode != "RGB":
+                composite_image = composite_image.convert("RGB")
+
+            # Create mask by finding differences (white drawn areas)
+            mask_image = PIL.Image.new("L", original_image.size, 0)
+            orig_data = original_image.load()
+            comp_data = composite_image.load()
+            mask_data = mask_image.load()
+
+            for y in range(original_image.size[1]):
+                for x in range(original_image.size[0]):
+                    orig_pixel = orig_data[x, y]
+                    comp_pixel = comp_data[x, y]
+                    # If pixels are different, assume it's a drawn area (white for inpainting)
+                    if orig_pixel != comp_pixel:
+                        mask_data[x, y] = 255  # White for inpainting
+
+            return mask_image
+
+        def process_inpainting(
+            prompt: str,
+            negative_prompt: str,
+            image_editor_output: Dict[str, Any],
+            uploaded_mask: Optional[PIL.Image.Image],
+            n: int,
+            size_width: int,
+            size_height: int,
+            guidance_scale: int,
+            num_inference_steps: int,
+            padding_image_to_multiple: int,
+            strength: float,
+            sampler_name: Optional[str] = None,
+            progress=gr.Progress(),
+        ) -> List[PIL.Image.Image]:
+            from ...client import RESTfulClient
+
+            client = RESTfulClient(self.endpoint)
+            client._set_token(self.access_token)
+            model = client.get_model(self.model_uid)
+            assert isinstance(model, RESTfulImageModelHandle)
+
+            if size_width > 0 and size_height > 0:
+                size = f"{int(size_width)}*{int(size_height)}"
+            else:
+                size = None
+            guidance_scale = None if guidance_scale == -1 else guidance_scale  # type: ignore
+            num_inference_steps = (
+                None if num_inference_steps == -1 else num_inference_steps  # type: ignore
+            )
+            padding_image_to_multiple = None if padding_image_to_multiple == -1 else padding_image_to_multiple  # type: ignore
+            # Initialize kwargs and handle strength parameter
+            kwargs = {}
+            if strength is not None:
+                kwargs["strength"] = strength
+            sampler_name = None if sampler_name == "default" else sampler_name
+
+            # Get the original image for inpainting
+            if not image_editor_output or "background" not in image_editor_output:
+                raise ValueError("Please upload and edit an image first")
+            original_image = image_editor_output["background"]
+
+            # Convert original image to RGB if needed
+            if original_image.mode == "RGBA":
+                # Create a white background and paste the RGBA image onto it
+                rgb_image = PIL.Image.new("RGB", original_image.size, (255, 255, 255))
+                rgb_image.paste(
+                    original_image, mask=original_image.split()[3]
+                )  # Use alpha channel as mask
+                original_image = rgb_image
+            elif original_image.mode != "RGB":
+                original_image = original_image.convert("RGB")
+
+            # Assert that original image is RGB format
+            assert (
+                original_image.mode == "RGB"
+            ), f"Expected RGB image, got {original_image.mode}"
+
+            # Use uploaded mask if provided, otherwise generate from editor
+            if uploaded_mask is not None:
+                mask_image = uploaded_mask
+
+                # Convert RGBA to RGB if needed
+                if mask_image.mode == "RGBA":
+                    # Create a white background and paste the RGBA image onto it
+                    rgb_mask = PIL.Image.new("RGB", mask_image.size, (255, 255, 255))
+                    rgb_mask.paste(
+                        mask_image, mask=(mask_image.split()[3])
+                    )  # Use alpha channel as mask
+                    mask_image = rgb_mask
+                elif mask_image.mode != "RGB":
+                    mask_image = mask_image.convert("RGB")
+
+                # Ensure mask is the same size as original image
+                if mask_image.size != original_image.size:
+                    mask_image = mask_image.resize(original_image.size)
+
+                # Assert that mask image is RGB format
+                assert (
+                    mask_image.mode == "RGB"
+                ), f"Expected RGB mask, got {mask_image.mode}"
+            else:
+                # Generate mask using the preview function
+                mask_image = preview_mask(image_editor_output)
+                # Assert that generated mask is L format (grayscale)
+                assert mask_image.mode == "L", f"Expected L mask, got {mask_image.mode}"
+
+            bio = io.BytesIO()
+            original_image.save(bio, format="png")
+
+            mask_bio = io.BytesIO()
+            mask_image.save(mask_bio, format="png")
+
+            response = None
+            exc = None
+            request_id = str(uuid.uuid4())
+
+            def run_in_thread():
+                nonlocal exc, response
+                try:
+                    response = model.inpainting(
+                        request_id=request_id,
+                        prompt=prompt,
+                        negative_prompt=negative_prompt,
+                        n=n,
+                        image=bio.getvalue(),
+                        mask_image=mask_bio.getvalue(),
+                        size=size,
+                        response_format="b64_json",
+                        num_inference_steps=num_inference_steps,
+                        guidance_scale=guidance_scale,
+                        padding_image_to_multiple=padding_image_to_multiple,
+                        sampler_name=sampler_name,
+                        **kwargs,
+                    )
+                except Exception as e:
+                    exc = e
+
+            t = threading.Thread(target=run_in_thread)
+            t.start()
+            while t.is_alive():
+                try:
+                    cur_progress = client.get_progress(request_id)["progress"]
+                except (KeyError, RuntimeError):
+                    cur_progress = 0.0
+
+                progress(cur_progress, desc="Inpainting images")
+                time.sleep(1)
+
+            if exc:
+                raise exc
+
+            images = []
+            for image_dict in response["data"]:  # type: ignore
+                assert image_dict["b64_json"] is not None
+                image_data = base64.b64decode(image_dict["b64_json"])
+                image = PIL.Image.open(io.BytesIO(image_data))
+                images.append(image)
+
+            return images
+
+        with gr.Blocks() as inpainting_interface:
+            with gr.Column():
+                with gr.Row():
+                    with gr.Column(scale=10):
+                        prompt = gr.Textbox(
+                            label="Prompt",
+                            show_label=True,
+                            placeholder="Enter prompt here...",
+                        )
+                        negative_prompt = gr.Textbox(
+                            label="Negative Prompt",
+                            show_label=True,
+                            placeholder="Enter negative prompt here...",
+                        )
+                    with gr.Column(scale=1):
+                        generate_button = gr.Button("Generate")
+
+                with gr.Row():
+                    n = gr.Number(label="Number of image", value=1)
+                    size_width = gr.Number(label="Width", value=-1)
+                    size_height = gr.Number(label="Height", value=-1)
+
+                with gr.Row():
+                    guidance_scale = gr.Number(label="Guidance scale", value=-1)
+                    num_inference_steps = gr.Number(
+                        label="Inference Step Number", value=-1
+                    )
+                    padding_image_to_multiple = gr.Number(
+                        label="Padding image to multiple", value=-1
+                    )
+                    strength = gr.Slider(
+                        label="Strength", value=0.6, step=0.1, minimum=0.0, maximum=1.0
+                    )
+                    sampler_name = gr.Dropdown(
+                        choices=SAMPLING_METHODS,
+                        value="default",
+                        label="Sampling method",
+                    )
+
+                with gr.Row():
+                    with gr.Column(scale=2):
+                        image_editor = gr.ImageEditor(
+                            type="pil",
+                            label="Edit Image and Create Mask (Draw white areas to inpaint)",
+                            interactive=True,
+                            height=400,
+                        )
+
+                        # Mask controls below the editor
+                        with gr.Row():
+                            preview_button = gr.Button("Preview Mask", size="sm")
+                            upload_mask = gr.Image(
+                                type="pil",
+                                label="Or upload mask image directly",
+                                interactive=True,
+                            )
+                        with gr.Row():
+                            mask_output = gr.Image(
+                                label="Current Mask Preview",
+                                interactive=False,
+                                height=200,
+                            )
+
+                    with gr.Column(scale=1):
+                        gr.Markdown("### Inpainting Results")
+                        output_gallery = gr.Gallery()
+
+            preview_button.click(
+                preview_mask,
+                inputs=[image_editor],
+                outputs=[mask_output],
+            )
+
+            # When user uploads a mask, display it
+            def process_uploaded_mask(
+                mask: Optional[PIL.Image.Image],
+            ) -> PIL.Image.Image:
+                if mask is None:
+                    return PIL.Image.new("L", (512, 512), 0)
+
+                # Convert RGBA to grayscale for preview
+                if mask.mode == "RGBA":
+                    # Use alpha channel for mask preview
+                    alpha = mask.split()[3]
+                    mask = alpha.convert("L")
+                elif mask.mode != "L":
+                    # Convert to grayscale
+                    mask = mask.convert("L")
+
+                return mask
+
+            upload_mask.change(
+                process_uploaded_mask, inputs=[upload_mask], outputs=[mask_output]
+            )
+
+            generate_button.click(
+                process_inpainting,
+                inputs=[
+                    prompt,
+                    negative_prompt,
+                    image_editor,
+                    upload_mask,
+                    n,
+                    size_width,
+                    size_height,
+                    guidance_scale,
+                    num_inference_steps,
+                    padding_image_to_multiple,
+                    strength,
+                    sampler_name,
+                ],
+                outputs=[output_gallery],
+            )
+        return inpainting_interface
+
     def text2video_interface(self) -> "gr.Blocks":
         def text_generate_video(
             prompt: str,
@@ -797,8 +1105,24 @@ class MediaInterface:
 
             return audio_path
 
+        # Determine model abilities
+        supports_basic_tts = "text2audio" in self.model_ability
+        supports_zero_shot = "text2audio_zero_shot" in self.model_ability
+        supports_voice_cloning = "text2audio_voice_cloning" in self.model_ability
+
+        # Show ability info
+        ability_info = []
+        if supports_basic_tts:
+            ability_info.append("✅ Basic TTS (text-to-speech)")
+        if supports_zero_shot:
+            ability_info.append("✅ Zero-shot TTS (voice selection)")
+        if supports_voice_cloning:
+            ability_info.append("✅ Voice Cloning (requires reference audio)")
+
         # Gradio UI
         with gr.Blocks() as tts_ui:
+            gr.Markdown(f"**Model Abilities:**\n{chr(10).join(ability_info)}")
+
             with gr.Row():
                 with gr.Column():
                     input_text = gr.Textbox(
@@ -811,13 +1135,32 @@ class MediaInterface:
                        label="Speed", minimum=0.5, maximum=2.0, value=1.0, step=0.1
                    )
 
-
-
-
-
-
-
-
+                    # Show voice cloning controls if supported
+                    if supports_voice_cloning:
+                        gr.Markdown("---\n**Voice Cloning Options**")
+                        # Make voice cloning required if model doesn't support zero-shot
+                        if supports_zero_shot:
+                            prompt_speech = gr.Audio(
+                                label="Prompt Speech (for cloning, optional)",
+                                type="filepath",
+                            )
+                            prompt_text = gr.Textbox(
+                                label="Prompt Text (for cloning, optional)",
+                                placeholder="Text of the prompt speech",
+                            )
+                        else:
+                            prompt_speech = gr.Audio(
+                                label="Prompt Speech (for cloning, required)",
+                                type="filepath",
+                            )
+                            prompt_text = gr.Textbox(
+                                label="Prompt Text (for cloning, optional)",
+                                placeholder="Text of the prompt speech (optional)",
+                            )
+                    else:
+                        # Hidden components for API compatibility
+                        prompt_speech = gr.Audio(visible=False)
+                        prompt_text = gr.Textbox(visible=False)
 
                     generate = gr.Button("Generate")
 
@@ -871,6 +1214,9 @@ class MediaInterface:
         if "image2image" in self.model_ability:
             with gr.Tab("Image to Image"):
                 self.image2image_interface()
+        if "inpainting" in self.model_ability:
+            with gr.Tab("Inpainting"):
+                self.inpainting_interface()
         if "text2video" in self.model_ability:
             with gr.Tab("Text to Video"):
                 self.text2video_interface()
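The new Inpainting tab above is a thin Gradio front end over RESTfulImageModelHandle.inpainting: it PNG-encodes the edited image and the generated (or uploaded) mask, then forwards them together with the new strength value, which travels through **kwargs. Below is a condensed sketch of the same call made directly against a running server; the endpoint URL, model UID and file names are placeholders, and parameter defaults may differ from what is shown.

import io
import PIL.Image
from xinference.client import RESTfulClient

client = RESTfulClient("http://127.0.0.1:9997")  # placeholder endpoint
model = client.get_model("my-image-model")       # placeholder model UID

# Encode source image (RGB) and mask (grayscale) as PNG bytes, as the Gradio handler does
image_bio, mask_bio = io.BytesIO(), io.BytesIO()
PIL.Image.open("photo.png").convert("RGB").save(image_bio, format="png")
PIL.Image.open("mask.png").convert("L").save(mask_bio, format="png")

result = model.inpainting(
    prompt="a red scarf",
    negative_prompt="",
    n=1,
    image=image_bio.getvalue(),
    mask_image=mask_bio.getvalue(),
    size=None,
    response_format="b64_json",
    strength=0.6,  # forwarded through **kwargs by the new UI code
)
print(len(result["data"]))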
xinference/ui/web/ui/build/asset-manifest.json
CHANGED
@@ -1,14 +1,14 @@
 {
   "files": {
     "main.css": "./static/css/main.013f296b.css",
-    "main.js": "./static/js/main.4918643a.js",
+    "main.js": "./static/js/main.1086c759.js",
     "static/media/icon.webp": "./static/media/icon.4603d52c63041e5dfbfd.webp",
     "index.html": "./index.html",
     "main.013f296b.css.map": "./static/css/main.013f296b.css.map",
-    "main.4918643a.js.map": "./static/js/main.4918643a.js.map"
+    "main.1086c759.js.map": "./static/js/main.1086c759.js.map"
   },
   "entrypoints": [
     "static/css/main.013f296b.css",
-    "static/js/main.4918643a.js"
+    "static/js/main.1086c759.js"
   ]
 }
xinference/ui/web/ui/build/index.html
CHANGED
@@ -1 +1 @@
-<!doctype html><html lang="en"><head><meta charset="utf-8"/><link rel="icon" href="./favicon.svg"/><meta name="viewport" content="width=device-width,initial-scale=1"/><meta name="theme-color" content="#000000"/><meta name="description" content="Web site created using create-react-app"/><link rel="apple-touch-icon" href="./logo192.png"/><link rel="manifest" href="./manifest.json"/><title>Xinference</title><script defer="defer" src="./static/js/main.4918643a.js"></script><link href="./static/css/main.013f296b.css" rel="stylesheet"></head><body><noscript>You need to enable JavaScript to run this app.</noscript><div id="root"></div></body></html>
+<!doctype html><html lang="en"><head><meta charset="utf-8"/><link rel="icon" href="./favicon.svg"/><meta name="viewport" content="width=device-width,initial-scale=1"/><meta name="theme-color" content="#000000"/><meta name="description" content="Web site created using create-react-app"/><link rel="apple-touch-icon" href="./logo192.png"/><link rel="manifest" href="./manifest.json"/><title>Xinference</title><script defer="defer" src="./static/js/main.1086c759.js"></script><link href="./static/css/main.013f296b.css" rel="stylesheet"></head><body><noscript>You need to enable JavaScript to run this app.</noscript><div id="root"></div></body></html>