PyPI - retab - Versions diffs - 0.0.40__py3-none-any.whl → 0.0.42__py3-none-any.whl - Mend

retab 0.0.40__py3-none-any.whl → 0.0.42__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (53) hide show

retab/client.py +5 -5
retab/resources/consensus/completions.py +1 -1
retab/resources/consensus/completions_stream.py +5 -5
retab/resources/consensus/responses.py +1 -1
retab/resources/consensus/responses_stream.py +2 -2
retab/resources/documents/client.py +12 -11
retab/resources/documents/extractions.py +4 -4
retab/resources/evals.py +1 -1
retab/resources/evaluations/documents.py +1 -1
retab/resources/jsonlUtils.py +4 -4
retab/resources/processors/automations/endpoints.py +9 -5
retab/resources/processors/automations/links.py +2 -2
retab/resources/processors/automations/logs.py +2 -2
retab/resources/processors/automations/mailboxes.py +43 -32
retab/resources/processors/automations/outlook.py +25 -7
retab/resources/processors/automations/tests.py +8 -2
retab/resources/processors/client.py +25 -16
retab/resources/prompt_optimization.py +1 -1
retab/resources/schemas.py +3 -3
retab/types/automations/mailboxes.py +1 -1
retab/types/completions.py +1 -1
retab/types/documents/create_messages.py +4 -4
retab/types/documents/extractions.py +3 -3
retab/types/documents/parse.py +3 -1
retab/types/evals.py +2 -2
retab/types/evaluations/iterations.py +2 -2
retab/types/evaluations/model.py +2 -2
retab/types/extractions.py +34 -9
retab/types/jobs/prompt_optimization.py +1 -1
retab/types/logs.py +3 -3
retab/types/schemas/object.py +4 -4
retab/types/schemas/templates.py +1 -1
retab/utils/__init__.py +0 -0
retab/utils/_model_cards/anthropic.yaml +59 -0
retab/utils/_model_cards/auto.yaml +43 -0
retab/utils/_model_cards/gemini.yaml +117 -0
retab/utils/_model_cards/openai.yaml +301 -0
retab/utils/_model_cards/xai.yaml +28 -0
retab/utils/ai_models.py +138 -0
retab/utils/benchmarking.py +484 -0
retab/utils/chat.py +327 -0
retab/utils/display.py +440 -0
retab/utils/json_schema.py +2156 -0
retab/utils/mime.py +165 -0
retab/utils/responses.py +169 -0
retab/utils/stream_context_managers.py +52 -0
retab/utils/usage/__init__.py +0 -0
retab/utils/usage/usage.py +301 -0
retab-0.0.42.dist-info/METADATA +119 -0
{retab-0.0.40.dist-info → retab-0.0.42.dist-info}/RECORD +52 -36
retab-0.0.40.dist-info/METADATA +0 -418
{retab-0.0.40.dist-info → retab-0.0.42.dist-info}/WHEEL +0 -0
{retab-0.0.40.dist-info → retab-0.0.42.dist-info}/top_level.txt +0 -0

retab/utils/chat.py ADDED Viewed

@@ -0,0 +1,327 @@
+import base64
+import logging
+from typing import List, Literal, Optional, Union, cast
+import requests
+from anthropic.types.image_block_param import ImageBlockParam
+from anthropic.types.message_param import MessageParam
+from anthropic.types.text_block_param import TextBlockParam
+from google.genai.types import BlobDict, ContentDict, ContentUnionDict, PartDict  # type: ignore
+from openai.types.chat.chat_completion_content_part_image_param import ChatCompletionContentPartImageParam
+from openai.types.chat.chat_completion_content_part_input_audio_param import ChatCompletionContentPartInputAudioParam
+from openai.types.chat.chat_completion_content_part_param import ChatCompletionContentPartParam
+from openai.types.chat.chat_completion_content_part_text_param import ChatCompletionContentPartTextParam
+from openai.types.chat.chat_completion_message_param import ChatCompletionMessageParam
+from ..types.chat import ChatCompletionRetabMessage
+# Image MIME types; convert_to_anthropic_format casts the media type of each image block to this alias.
+MediaType = Literal["image/jpeg", "image/png", "image/gif", "image/webp"]
+def convert_to_google_genai_format(messages: List[ChatCompletionRetabMessage]) -> tuple[str, list[ContentUnionDict]]:
+    """
+    Converts a list of ChatCompletionRetabMessage to a format compatible with the google.genai SDK.
+    Example:
+        ```python
+        import google.genai as genai
+        # Configure the Gemini client
+        genai.configure(api_key=os.environ["GEMINI_API_KEY"])
+        # Initialize the model
+        model = genai.GenerativeModel("gemini-2.0-flash")
+        # Get messages in Gemini format
+        gemini_messages = document_message.gemini_messages
+        # Generate a response
+        ```
+    Args:
+        messages (List[ChatCompletionRetabMessage]): List of chat messages.
+    Returns:
+        List[Union[Dict[str, str], str]]: A list of formatted inputs for the google.genai SDK.
+    """
+    system_message: str = ""
+    formatted_content: list[ContentUnionDict] = []
+    for message in messages:
+        # -----------------------
+        # Handle system message
+        # -----------------------
+        if message["role"] in ("system", "developer"):
+            assert isinstance(message["content"], str), "System message content must be a string."
+            if system_message != "":
+                raise ValueError("Only one system message is allowed per chat.")
+            system_message += message["content"]
+            continue
+        parts: list[PartDict] = []
+        message_content = message["content"]
+        if isinstance(message_content, str):
+            # Direct string content is treated as the prompt for the SDK
+            parts.append(PartDict(text=message_content))
+        elif isinstance(message_content, list):
+            # Handle structured content
+            for part in message_content:
+                if part["type"] == "text":
+                    parts.append(PartDict(text=part["text"]))
+                elif part["type"] == "image_url":
+                    url = part["image_url"].get("url", "")  # type: ignore
+                    if url.startswith("data:image"):
+                        # Extract base64 data and add it to the formatted inputs
+                        media_type, data_content = url.split(";base64,")
+                        media_type = media_type.split("data:")[-1]  # => "image/jpeg"
+                        base64_data = data_content
+                        # Try to convert to PIL.Image and append it to the formatted inputs
+                        try:
+                            image_bytes = base64.b64decode(base64_data)
+                            parts.append(PartDict(inline_data=BlobDict(data=image_bytes, mime_type=media_type)))
+                        except Exception:
+                            pass
+                elif part["type"] == "input_audio":
+                    pass
+                elif part["type"] == "file":
+                    pass
+                else:
+                    pass
+        formatted_content.append(ContentDict(parts=parts, role=("user" if message["role"] == "user" else "model")))
+    return system_message, formatted_content
+def convert_to_anthropic_format(messages: List[ChatCompletionRetabMessage]) -> tuple[str, List[MessageParam]]:
+    """
+    Converts a list of ChatCompletionRetabMessage to a format compatible with the Anthropic SDK.
+    Args:
+        messages (List[ChatCompletionRetabMessage]): List of chat messages.
+    Returns:
+        (system_message, formatted_messages):
+            system_message (str | NotGiven):
+                The system message if one was found, otherwise NOT_GIVEN.
+            formatted_messages (List[MessageParam]):
+                A list of formatted messages ready for Anthropic.
+    """
+    formatted_messages: list[MessageParam] = []
+    system_message: str = ""
+    for message in messages:
+        content_blocks: list[Union[TextBlockParam, ImageBlockParam]] = []
+        # -----------------------
+        # Handle system message
+        # -----------------------
+        if message["role"] in ("system", "developer"):
+            assert isinstance(message["content"], str), "System message content must be a string."
+            if system_message != "":
+                raise ValueError("Only one system message is allowed per chat.")
+            system_message += message["content"]
+            continue
+        # -----------------------
+        # Handle non-system roles
+        # -----------------------
+        if isinstance(message["content"], str):
+            # Direct string content is treated as a single text block
+            content_blocks.append(
+                {
+                    "type": "text",
+                    "text": message["content"],
+                }
+            )
+        elif isinstance(message["content"], list):
+            # Handle structured content
+            for part in message["content"]:
+                if part["type"] == "text":
+                    part = cast(ChatCompletionContentPartTextParam, part)
+                    content_blocks.append(
+                        {
+                            "type": "text",
+                            "text": part["text"],  # type: ignore
+                        }
+                    )
+                elif part["type"] == "input_audio":
+                    part = cast(ChatCompletionContentPartInputAudioParam, part)
+                    logging.warning("Audio input is not supported yet.")
+                    # No blocks appended since not supported
+                elif part["type"] == "image_url":
+                    # Handle images that may be either base64 data-URLs or standard remote URLs
+                    part = cast(ChatCompletionContentPartImageParam, part)
+                    image_url = part["image_url"]["url"]
+                    if "base64," in image_url:
+                        # The string is already something like: data:image/jpeg;base64,xxxxxxxx...
+                        media_type, data_content = image_url.split(";base64,")
+                        # media_type might look like: "data:image/jpeg"
+                        media_type = media_type.split("data:")[-1]  # => "image/jpeg"
+                        base64_data = data_content
+                    else:
+                        # It's a remote URL, so fetch, encode, and derive media type from headers
+                        try:
+                            r = requests.get(image_url)
+                            r.raise_for_status()
+                            content_type = r.headers.get("Content-Type", "image/jpeg")
+                            # fallback "image/jpeg" if no Content-Type given
+                            # Only keep recognized image/* for anthropic
+                            if content_type not in ("image/jpeg", "image/png", "image/gif", "image/webp"):
+                                logging.warning(
+                                    "Unrecognized Content-Type '%s' - defaulting to image/jpeg",
+                                    content_type,
+                                )
+                                content_type = "image/jpeg"
+                            media_type = content_type
+                            base64_data = base64.b64encode(r.content).decode("utf-8")
+                        except Exception:
+                            logging.warning(
+                                "Failed to load image from URL: %s",
+                                image_url,
+                                exc_info=True,
+                                stack_info=True,
+                            )
+                            # Skip adding this block if error
+                            continue
+                    # Finally, append to content blocks
+                    content_blocks.append(
+                        {
+                            "type": "image",
+                            "source": {
+                                "type": "base64",
+                                "media_type": cast(MediaType, media_type),
+                                "data": base64_data,
+                            },
+                        }
+                    )
+        formatted_messages.append(
+            MessageParam(
+                role=message["role"],  # type: ignore
+                content=content_blocks,
+            )
+        )
+    return system_message, formatted_messages
+def convert_from_anthropic_format(messages: list[MessageParam], system_prompt: str) -> list[ChatCompletionRetabMessage]:
+    """
+    Converts a list of Anthropic MessageParam to a list of ChatCompletionRetabMessage.
+    """
+    formatted_messages: list[ChatCompletionRetabMessage] = [ChatCompletionRetabMessage(role="developer", content=system_prompt)]
+    for message in messages:
+        role = message["role"]
+        content_blocks = message["content"]
+        # Handle different content structures
+        if isinstance(content_blocks, list) and len(content_blocks) == 1 and isinstance(content_blocks[0], dict) and content_blocks[0].get("type") == "text":
+            # Simple text message
+            formatted_messages.append(cast(ChatCompletionRetabMessage, {"role": role, "content": content_blocks[0].get("text", "")}))
+        elif isinstance(content_blocks, list):
+            # Message with multiple content parts or non-text content
+            formatted_content: list[ChatCompletionContentPartParam] = []
+            for block in content_blocks:
+                if isinstance(block, dict):
+                    if block.get("type") == "text":
+                        formatted_content.append(cast(ChatCompletionContentPartParam, {"type": "text", "text": block.get("text", "")}))
+                    elif block.get("type") == "image":
+                        source = block.get("source", {})
+                        if isinstance(source, dict) and source.get("type") == "base64":
+                            # Convert base64 image to data URL format
+                            media_type = source.get("media_type", "image/jpeg")
+                            data = source.get("data", "")
+                            image_url = f"data:{media_type};base64,{data}"
+                            formatted_content.append(cast(ChatCompletionContentPartParam, {"type": "image_url", "image_url": {"url": image_url}}))
+            formatted_messages.append(cast(ChatCompletionRetabMessage, {"role": role, "content": formatted_content}))
+    return formatted_messages
+def convert_to_openai_format(messages: List[ChatCompletionRetabMessage]) -> List[ChatCompletionMessageParam]:
+    return cast(list[ChatCompletionMessageParam], messages)
+def convert_from_openai_format(messages: list[ChatCompletionMessageParam]) -> list[ChatCompletionRetabMessage]:
+    return cast(list[ChatCompletionRetabMessage], messages)
+def separate_messages(
+    messages: list[ChatCompletionRetabMessage],
+) -> tuple[Optional[ChatCompletionRetabMessage], list[ChatCompletionRetabMessage], list[ChatCompletionRetabMessage]]:
+    """
+    Separates messages into system, user and assistant messages.
+    Args:
+        messages: List of chat messages containing system, user and assistant messages
+    Returns:
+        Tuple containing:
+        - The system message if present, otherwise None
+        - List of user messages
+        - List of assistant messages
+    """
+    system_message = None
+    user_messages = []
+    assistant_messages = []
+    for message in messages:
+        if message["role"] in ("system", "developer"):
+            system_message = message
+        elif message["role"] == "user":
+            user_messages.append(message)
+        elif message["role"] == "assistant":
+            assistant_messages.append(message)
+    return system_message, user_messages, assistant_messages
+def str_messages(messages: list[ChatCompletionRetabMessage], max_length: int = 100) -> str:
+    """
+    Converts a list of chat messages into a string representation with faithfully serialized structure.
+    Args:
+        messages (list[ChatCompletionRetabMessage]): The list of chat messages.
+        max_length (int): Maximum length for content before truncation.
+    Returns:
+        str: A string representation of the messages with applied truncation.
+    """
+    def truncate(text: str, max_len: int) -> str:
+        """Truncate text to max_len with ellipsis."""
+        return text if len(text) <= max_len else f"{text[:max_len]}..."
+    serialized: list[ChatCompletionRetabMessage] = []
+    for message in messages:
+        role = message["role"]
+        content = message["content"]
+        if isinstance(content, str):
+            serialized.append({"role": role, "content": truncate(content, max_length)})
+        elif isinstance(content, list):
+            truncated_content: list[ChatCompletionContentPartParam] = []
+            for part in content:
+                if part["type"] == "text" and part["text"]:
+                    truncated_content.append({"type": "text", "text": truncate(part["text"], max_length)})
+                elif part["type"] == "image_url" and part["image_url"]:
+                    image_url = part["image_url"].get("url", "unknown image")
+                    truncated_content.append({"type": "image_url", "image_url": {"url": truncate(image_url, max_length)}})
+            serialized.append({"role": role, "content": truncated_content})
+    return repr(serialized)

retab 0.0.40__py3-none-any.whl → 0.0.42__py3-none-any.whl

retab 0.0.40__py3-none-any.whl → 0.0.42__py3-none-any.whl