retab-0.0.36-py3-none-any.whl → retab-0.0.38-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- retab/__init__.py +4 -0
- {uiform → retab}/_resource.py +5 -5
- {uiform → retab}/_utils/ai_models.py +2 -2
- {uiform → retab}/_utils/benchmarking.py +15 -16
- {uiform → retab}/_utils/chat.py +29 -34
- {uiform → retab}/_utils/display.py +0 -3
- {uiform → retab}/_utils/json_schema.py +9 -14
- {uiform → retab}/_utils/mime.py +11 -14
- {uiform → retab}/_utils/responses.py +16 -10
- {uiform → retab}/_utils/stream_context_managers.py +1 -1
- {uiform → retab}/_utils/usage/usage.py +31 -31
- {uiform → retab}/client.py +54 -53
- {uiform → retab}/resources/consensus/client.py +19 -38
- {uiform → retab}/resources/consensus/completions.py +36 -59
- {uiform → retab}/resources/consensus/completions_stream.py +35 -47
- {uiform → retab}/resources/consensus/responses.py +37 -86
- {uiform → retab}/resources/consensus/responses_stream.py +41 -89
- retab/resources/documents/client.py +455 -0
- {uiform → retab}/resources/documents/extractions.py +192 -101
- {uiform → retab}/resources/evals.py +56 -43
- retab/resources/evaluations/__init__.py +3 -0
- retab/resources/evaluations/client.py +301 -0
- retab/resources/evaluations/documents.py +233 -0
- retab/resources/evaluations/iterations.py +452 -0
- {uiform → retab}/resources/files.py +2 -2
- {uiform → retab}/resources/jsonlUtils.py +225 -221
- retab/resources/models.py +73 -0
- retab/resources/processors/automations/client.py +244 -0
- {uiform → retab}/resources/processors/automations/endpoints.py +79 -120
- retab/resources/processors/automations/links.py +294 -0
- {uiform → retab}/resources/processors/automations/logs.py +30 -19
- retab/resources/processors/automations/mailboxes.py +397 -0
- retab/resources/processors/automations/outlook.py +337 -0
- {uiform → retab}/resources/processors/automations/tests.py +22 -25
- {uiform → retab}/resources/processors/client.py +181 -166
- {uiform → retab}/resources/schemas.py +78 -66
- {uiform → retab}/resources/secrets/external_api_keys.py +1 -5
- retab/resources/secrets/webhook.py +64 -0
- {uiform → retab}/resources/usage.py +41 -4
- {uiform → retab}/types/ai_models.py +17 -17
- {uiform → retab}/types/automations/cron.py +19 -12
- {uiform → retab}/types/automations/endpoints.py +7 -4
- {uiform → retab}/types/automations/links.py +7 -3
- {uiform → retab}/types/automations/mailboxes.py +10 -10
- {uiform → retab}/types/automations/outlook.py +15 -11
- {uiform → retab}/types/automations/webhooks.py +1 -1
- retab/types/browser_canvas.py +3 -0
- retab/types/chat.py +8 -0
- {uiform → retab}/types/completions.py +12 -15
- retab/types/consensus.py +19 -0
- {uiform → retab}/types/db/annotations.py +3 -3
- {uiform → retab}/types/db/files.py +8 -6
- {uiform → retab}/types/documents/create_messages.py +20 -22
- {uiform → retab}/types/documents/extractions.py +71 -26
- {uiform → retab}/types/evals.py +5 -5
- retab/types/evaluations/__init__.py +31 -0
- retab/types/evaluations/documents.py +30 -0
- retab/types/evaluations/iterations.py +112 -0
- retab/types/evaluations/model.py +73 -0
- retab/types/events.py +79 -0
- {uiform → retab}/types/extractions.py +36 -13
- retab/types/inference_settings.py +15 -0
- retab/types/jobs/base.py +54 -0
- retab/types/jobs/batch_annotation.py +12 -0
- {uiform → retab}/types/jobs/evaluation.py +1 -2
- {uiform → retab}/types/logs.py +37 -34
- retab/types/metrics.py +32 -0
- {uiform → retab}/types/mime.py +22 -20
- {uiform → retab}/types/modalities.py +10 -10
- retab/types/predictions.py +19 -0
- {uiform → retab}/types/schemas/enhance.py +4 -2
- {uiform → retab}/types/schemas/evaluate.py +7 -4
- {uiform → retab}/types/schemas/generate.py +6 -3
- {uiform → retab}/types/schemas/layout.py +1 -1
- {uiform → retab}/types/schemas/object.py +16 -17
- {uiform → retab}/types/schemas/templates.py +1 -3
- {uiform → retab}/types/secrets/external_api_keys.py +0 -1
- {uiform → retab}/types/standards.py +18 -1
- {retab-0.0.36.dist-info → retab-0.0.38.dist-info}/METADATA +78 -77
- retab-0.0.38.dist-info/RECORD +107 -0
- retab-0.0.38.dist-info/top_level.txt +1 -0
- retab-0.0.36.dist-info/RECORD +0 -96
- retab-0.0.36.dist-info/top_level.txt +0 -1
- uiform/__init__.py +0 -4
- uiform/_utils/benchmarking copy.py +0 -588
- uiform/resources/documents/client.py +0 -255
- uiform/resources/models.py +0 -45
- uiform/resources/processors/automations/client.py +0 -78
- uiform/resources/processors/automations/links.py +0 -356
- uiform/resources/processors/automations/mailboxes.py +0 -435
- uiform/resources/processors/automations/outlook.py +0 -444
- uiform/resources/secrets/webhook.py +0 -62
- uiform/types/chat.py +0 -8
- uiform/types/consensus.py +0 -10
- uiform/types/events.py +0 -76
- uiform/types/jobs/base.py +0 -150
- uiform/types/jobs/batch_annotation.py +0 -22
- {uiform → retab}/_utils/__init__.py +0 -0
- {uiform → retab}/_utils/usage/__init__.py +0 -0
- {uiform → retab}/py.typed +0 -0
- {uiform → retab}/resources/__init__.py +0 -0
- {uiform → retab}/resources/consensus/__init__.py +0 -0
- {uiform → retab}/resources/documents/__init__.py +0 -0
- {uiform → retab}/resources/finetuning.py +0 -0
- {uiform → retab}/resources/openai_example.py +0 -0
- {uiform → retab}/resources/processors/__init__.py +0 -0
- {uiform → retab}/resources/processors/automations/__init__.py +0 -0
- {uiform → retab}/resources/prompt_optimization.py +0 -0
- {uiform → retab}/resources/secrets/__init__.py +0 -0
- {uiform → retab}/resources/secrets/client.py +0 -0
- {uiform → retab}/types/__init__.py +0 -0
- {uiform → retab}/types/automations/__init__.py +0 -0
- {uiform → retab}/types/db/__init__.py +0 -0
- {uiform → retab}/types/documents/__init__.py +0 -0
- {uiform → retab}/types/documents/correct_orientation.py +0 -0
- {uiform → retab}/types/jobs/__init__.py +0 -0
- {uiform → retab}/types/jobs/finetune.py +0 -0
- {uiform → retab}/types/jobs/prompt_optimization.py +0 -0
- {uiform → retab}/types/jobs/webcrawl.py +0 -0
- {uiform → retab}/types/pagination.py +0 -0
- {uiform → retab}/types/schemas/__init__.py +0 -0
- {uiform → retab}/types/secrets/__init__.py +0 -0
- {retab-0.0.36.dist-info → retab-0.0.38.dist-info}/WHEEL +0 -0
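The dominant change in this release is the rename of the uiform package to retab: every module moves under the retab namespace, the client classes referenced throughout the diffs below become Retab and AsyncRetab, and the message type becomes ChatCompletionRetabMessage. A minimal sketch of what calling code looks like after the rename; whether the classes are re-exported from the package root is an assumption, since the four added lines of retab/__init__.py are not shown in this diff:

# Hedged sketch of the uiform -> retab rename from a caller's perspective.
# The re-export of Retab / AsyncRetab from the package root is an assumption;
# this diff only shows them being imported from retab/client.py in _resource.py.
from retab import AsyncRetab, Retab  # assumed top-level re-exports


def describe(client: Retab | AsyncRetab) -> str:
    # SDK resources hold a reference to one of these two client classes
    # (see the _resource.py diff below).
    return type(client).__name__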
retab/__init__.py
ADDED
{uiform → retab}/_resource.py
RENAMED
@@ -5,13 +5,13 @@ import time
 from typing import TYPE_CHECKING
 
 if TYPE_CHECKING:
-    from .client import
+    from .client import AsyncRetab, Retab
 
 
 class SyncAPIResource:
-    _client:
+    _client: Retab
 
-    def __init__(self, client:
+    def __init__(self, client: Retab) -> None:
         self._client = client
 
     def _sleep(self, seconds: float) -> None:
@@ -19,9 +19,9 @@ class SyncAPIResource:
 
 
 class AsyncAPIResource:
-    _client:
+    _client: AsyncRetab
 
-    def __init__(self, client:
+    def __init__(self, client: AsyncRetab) -> None:
         self._client = client
 
     async def _sleep(self, seconds: float) -> None:
{uiform → retab}/_utils/ai_models.py
RENAMED
@@ -61,7 +61,7 @@ def assert_valid_model_batch_processing(model: str) -> None:
             raise ValueError(f"Invalid base model in fine-tuned model '{model}'. Base model must be one of: {get_args(OpenAIModel)}")
         if not model_id or not model_id.strip():
             raise ValueError(f"Model ID cannot be empty in fine-tuned model '{model}'")
-    except ValueError
+    except ValueError:
         if ":" not in model:
             raise ValueError(
                 f"Invalid model format: {model}. Must be either:\n"
@@ -90,7 +90,7 @@ def assert_valid_model_schema_generation(model: str) -> None:
             raise ValueError(f"Invalid base model in fine-tuned model '{model}'. Base model must be one of: {get_args(OpenAIModel)}")
         if not model_id or not model_id.strip():
             raise ValueError(f"Model ID cannot be empty in fine-tuned model '{model}'")
-    except ValueError
+    except ValueError:
         if ":" not in model:
             raise ValueError(
                 f"Invalid model format: {model}. Must be either:\n"
{uiform → retab}/_utils/benchmarking.py
RENAMED
@@ -5,7 +5,7 @@ import shutil
 # The goal is to leverage this piece of code to open a jsonl file and get an analysis of the performance of the model using a one-liner.
 ############# BENCHMARKING MODELS #############
 from itertools import zip_longest
-from typing import Any, Callable, Literal, Optional
+from typing import Any, Callable, Literal, Optional, cast
 
 import pandas as pd  # type: ignore
 from Levenshtein import distance as levenshtein_distance
@@ -27,7 +27,7 @@ def normalize_string(text: str) -> str:
     if not text:
         return ""
     # Remove all non-alphanumeric characters and convert to lowercase
-    return re.sub(r
+    return re.sub(r"[^a-zA-Z0-9]", "", text).lower()
 
 
 def hamming_distance_padded(s: str, t: str) -> int:
@@ -45,7 +45,7 @@ def hamming_distance_padded(s: str, t: str) -> int:
     s = normalize_string(s)
     t = normalize_string(t)
 
-    return sum(a != b for a, b in zip_longest(s, t, fillvalue=
+    return sum(a != b for a, b in zip_longest(s, t, fillvalue=" "))
 
 
 def hamming_similarity(str_1: str, str_2: str) -> float:
@@ -385,7 +385,7 @@ class EvalMetrics(BaseModel):
     distances: dict[dictionary_metrics, EvalMetric]
 
 
-def flatten_dict(d: dict[str, Any], parent_key: str =
+def flatten_dict(d: dict[str, Any], parent_key: str = "", sep: str = ".") -> dict[str, Any]:
     """Flatten a nested dictionary with dot-separated keys."""
     items: list[tuple[str, Any]] = []
     for k, v in d.items():
@@ -408,16 +408,14 @@ def plot_metrics_with_uncertainty(analysis: dict[str, Any], uncertainties: Optio
     """
     # Flatten the dictionaries
     flattened_analysis = flatten_dict(analysis)
-    if uncertainties:
-        flattened_uncertainties = flatten_dict(uncertainties)
-    else:
-        uncertainties_list = None
-
     # Prepare data by matching fields
     fields = list(flattened_analysis.keys())
     similarities = [flattened_analysis[field] for field in fields]
 
+    # Prepare uncertainties if provided
+    uncertainties_list = None
     if uncertainties:
+        flattened_uncertainties = flatten_dict(uncertainties)
         uncertainties_list = [flattened_uncertainties.get(field, None) for field in fields]
 
     # Create a DataFrame
@@ -454,10 +452,11 @@ def plot_metrics_with_uncertainty(analysis: dict[str, Any], uncertainties: Optio
 
         if similarity is None:
             continue  # Skip fields with no similarity value
-
+        similarity = cast(float, similarity)
         # Calculate bar length and uncertainty range
         bar_len = round(similarity * scale)
         if uncertainty is not None and uncertainty > 0:
+            uncertainty = cast(float, uncertainty)
            uncertainty_start = max(0, round((similarity - uncertainty) * scale))
            uncertainty_end = min(bar_width, round((similarity + uncertainty) * scale))
         else:
@@ -465,21 +464,21 @@ def plot_metrics_with_uncertainty(analysis: dict[str, Any], uncertainties: Optio
             uncertainty_end = bar_len  # No uncertainty to display
 
         # Build the bar string
-        bar_string =
+        bar_string = ""
         for i in range(bar_width):
             if i < bar_len:
                 if i < uncertainty_start:
-                    char =
+                    char = "█"  # Solid block for certain part
                 else:
-                    char =
+                    char = "█"  # Lighter block for uncertainty overlap
             else:
                 if i < uncertainty_end:
-                    char =
+                    char = "░"  # Dash for upper uncertainty range
                 else:
-                    char =
+                    char = " "  # Space for empty area
             bar_string += char
 
         # Print the label and bar
-        score_field = f
+        score_field = f"[{similarity:.4f}]"
 
         print(f"{field:<{label_width}} {score_field} | {bar_string}")
{uiform → retab}/_utils/chat.py
RENAMED
@@ -1,31 +1,26 @@
 import base64
-import io
 import logging
 from typing import List, Literal, Optional, Union, cast
 
 import requests
-from anthropic.types.
-from anthropic.types.image_block_param import ImageBlockParam, Source
+from anthropic.types.image_block_param import ImageBlockParam
 from anthropic.types.message_param import MessageParam
 from anthropic.types.text_block_param import TextBlockParam
-from anthropic.types.tool_result_block_param import ToolResultBlockParam
-from anthropic.types.tool_use_block_param import ToolUseBlockParam
 from google.genai.types import BlobDict, ContentDict, ContentUnionDict, PartDict  # type: ignore
 from openai.types.chat.chat_completion_content_part_image_param import ChatCompletionContentPartImageParam
 from openai.types.chat.chat_completion_content_part_input_audio_param import ChatCompletionContentPartInputAudioParam
 from openai.types.chat.chat_completion_content_part_param import ChatCompletionContentPartParam
 from openai.types.chat.chat_completion_content_part_text_param import ChatCompletionContentPartTextParam
 from openai.types.chat.chat_completion_message_param import ChatCompletionMessageParam
-from PIL import Image
 
-from ..types.chat import
+from ..types.chat import ChatCompletionRetabMessage
 
 MediaType = Literal["image/jpeg", "image/png", "image/gif", "image/webp"]
 
 
-def convert_to_google_genai_format(messages: List[
+def convert_to_google_genai_format(messages: List[ChatCompletionRetabMessage]) -> tuple[str, list[ContentUnionDict]]:
     """
-    Converts a list of
+    Converts a list of ChatCompletionRetabMessage to a format compatible with the google.genai SDK.
 
 
     Example:
@@ -45,7 +40,7 @@ def convert_to_google_genai_format(messages: List[ChatCompletionUiformMessage])
     ```
 
     Args:
-        messages (List[
+        messages (List[ChatCompletionRetabMessage]): List of chat messages.
 
     Returns:
         List[Union[Dict[str, str], str]]: A list of formatted inputs for the google.genai SDK.
@@ -64,7 +59,7 @@ def convert_to_google_genai_format(messages: List[ChatCompletionUiformMessage])
             continue
         parts: list[PartDict] = []
 
-        message_content = message[
+        message_content = message["content"]
         if isinstance(message_content, str):
             # Direct string content is treated as the prompt for the SDK
             parts.append(PartDict(text=message_content))
@@ -74,8 +69,8 @@ def convert_to_google_genai_format(messages: List[ChatCompletionUiformMessage])
                 if part["type"] == "text":
                     parts.append(PartDict(text=part["text"]))
                 elif part["type"] == "image_url":
-                    url = part[
-                    if url.startswith(
+                    url = part["image_url"].get("url", "")  # type: ignore
+                    if url.startswith("data:image"):
                         # Extract base64 data and add it to the formatted inputs
                         media_type, data_content = url.split(";base64,")
                         media_type = media_type.split("data:")[-1]  # => "image/jpeg"
@@ -99,12 +94,12 @@ def convert_to_google_genai_format(messages: List[ChatCompletionUiformMessage])
     return system_message, formatted_content
 
 
-def convert_to_anthropic_format(messages: List[
+def convert_to_anthropic_format(messages: List[ChatCompletionRetabMessage]) -> tuple[str, List[MessageParam]]:
     """
-    Converts a list of
+    Converts a list of ChatCompletionRetabMessage to a format compatible with the Anthropic SDK.
 
     Args:
-        messages (List[
+        messages (List[ChatCompletionRetabMessage]): List of chat messages.
 
     Returns:
         (system_message, formatted_messages):
@@ -133,24 +128,24 @@ def convert_to_anthropic_format(messages: List[ChatCompletionUiformMessage]) ->
         # -----------------------
         # Handle non-system roles
         # -----------------------
-        if isinstance(message[
+        if isinstance(message["content"], str):
             # Direct string content is treated as a single text block
             content_blocks.append(
                 {
                     "type": "text",
-                    "text": message[
+                    "text": message["content"],
                 }
             )
 
-        elif isinstance(message[
+        elif isinstance(message["content"], list):
             # Handle structured content
-            for part in message[
+            for part in message["content"]:
                 if part["type"] == "text":
                     part = cast(ChatCompletionContentPartTextParam, part)
                     content_blocks.append(
                         {
                             "type": "text",
-                            "text": part[
+                            "text": part["text"],  # type: ignore
                         }
                     )
 
@@ -221,11 +216,11 @@ def convert_to_anthropic_format(messages: List[ChatCompletionUiformMessage]) ->
     return system_message, formatted_messages
 
 
-def convert_from_anthropic_format(messages: list[MessageParam], system_prompt: str) -> list[
+def convert_from_anthropic_format(messages: list[MessageParam], system_prompt: str) -> list[ChatCompletionRetabMessage]:
     """
-    Converts a list of Anthropic MessageParam to a list of
+    Converts a list of Anthropic MessageParam to a list of ChatCompletionRetabMessage.
     """
-    formatted_messages: list[
+    formatted_messages: list[ChatCompletionRetabMessage] = [ChatCompletionRetabMessage(role="developer", content=system_prompt)]
 
     for message in messages:
         role = message["role"]
@@ -234,7 +229,7 @@ def convert_from_anthropic_format(messages: list[MessageParam], system_prompt: s
         # Handle different content structures
         if isinstance(content_blocks, list) and len(content_blocks) == 1 and isinstance(content_blocks[0], dict) and content_blocks[0].get("type") == "text":
             # Simple text message
-            formatted_messages.append(cast(
+            formatted_messages.append(cast(ChatCompletionRetabMessage, {"role": role, "content": content_blocks[0].get("text", "")}))
         elif isinstance(content_blocks, list):
             # Message with multiple content parts or non-text content
             formatted_content: list[ChatCompletionContentPartParam] = []
@@ -253,22 +248,22 @@ def convert_from_anthropic_format(messages: list[MessageParam], system_prompt: s
 
                 formatted_content.append(cast(ChatCompletionContentPartParam, {"type": "image_url", "image_url": {"url": image_url}}))
 
-            formatted_messages.append(cast(
+            formatted_messages.append(cast(ChatCompletionRetabMessage, {"role": role, "content": formatted_content}))
 
     return formatted_messages
 
 
-def convert_to_openai_format(messages: List[
+def convert_to_openai_format(messages: List[ChatCompletionRetabMessage]) -> List[ChatCompletionMessageParam]:
     return cast(list[ChatCompletionMessageParam], messages)
 
 
-def convert_from_openai_format(messages: list[ChatCompletionMessageParam]) -> list[
-    return cast(list[
+def convert_from_openai_format(messages: list[ChatCompletionMessageParam]) -> list[ChatCompletionRetabMessage]:
+    return cast(list[ChatCompletionRetabMessage], messages)
 
 
 def separate_messages(
-    messages: list[
-) -> tuple[Optional[
+    messages: list[ChatCompletionRetabMessage],
+) -> tuple[Optional[ChatCompletionRetabMessage], list[ChatCompletionRetabMessage], list[ChatCompletionRetabMessage]]:
     """
     Separates messages into system, user and assistant messages.
 
@@ -296,12 +291,12 @@ def separate_messages(
     return system_message, user_messages, assistant_messages
 
 
-def str_messages(messages: list[
+def str_messages(messages: list[ChatCompletionRetabMessage], max_length: int = 100) -> str:
     """
     Converts a list of chat messages into a string representation with faithfully serialized structure.
 
     Args:
-        messages (list[
+        messages (list[ChatCompletionRetabMessage]): The list of chat messages.
         max_length (int): Maximum length for content before truncation.
 
     Returns:
@@ -312,7 +307,7 @@ def str_messages(messages: list[ChatCompletionUiformMessage], max_length: int =
         """Truncate text to max_len with ellipsis."""
         return text if len(text) <= max_len else f"{text[:max_len]}..."
 
-    serialized: list[
+    serialized: list[ChatCompletionRetabMessage] = []
    for message in messages:
        role = message["role"]
        content = message["content"]
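For reference, the converters renamed in {uiform → retab}/_utils/chat.py above keep their shape: each takes a list of ChatCompletionRetabMessage (a role/content mapping, and constructed with keyword arguments in the hunks above) and returns a provider-specific message format. A hedged usage sketch, assuming the import paths follow the renamed layout in the file list; nothing here is verified against the published wheel:

# Hedged usage sketch for the renamed converters in retab/_utils/chat.py.
from retab._utils.chat import convert_to_anthropic_format, convert_to_openai_format
from retab.types.chat import ChatCompletionRetabMessage

messages: list[ChatCompletionRetabMessage] = [
    ChatCompletionRetabMessage(role="developer", content="Extract the invoice fields."),
    ChatCompletionRetabMessage(role="user", content="Total due: 42.50 EUR"),
]

# Anthropic needs the system prompt split out from the conversation.
system_prompt, anthropic_messages = convert_to_anthropic_format(messages)

# The OpenAI chat format is structurally identical, so this is only a cast.
openai_messages = convert_to_openai_format(messages)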
{uiform → retab}/_utils/display.py
RENAMED
@@ -105,9 +105,6 @@ def count_image_tokens(image_url: str, detail: Literal["low", "high", "auto"] =
     total_tiles = tiles_wide * tiles_high
 
     return base_token_cost + (token_per_tile * total_tiles)
-
-
-
 
 
 def process_jsonl_file(jsonl_path: str) -> List[TokenCounts]:
{uiform → retab}/_utils/json_schema.py
RENAMED
@@ -14,8 +14,8 @@ from email_validator import validate_email
 from pydantic import BaseModel, BeforeValidator, Field, create_model
 from pydantic.config import ConfigDict
 
-from
-from
+from ..types.schemas.layout import Column, FieldItem, Layout, RefObject, Row, RowList
+from .mime import generate_blake2b_hash_from_string
 
 # **** Validation Functions ****
 
@@ -116,7 +116,7 @@ def validate_vat_number(v: Any) -> Optional[str]:
     try:
         if stdnum.eu.vat.is_valid(v_str):
             return stdnum.eu.vat.validate(v_str)
-    except:
+    except Exception:
         pass
     return None
 
@@ -150,7 +150,7 @@ def validate_email_address(v: Any) -> Optional[str]:
         return None
     try:
         return validate_email(v_str).normalized
-    except:
+    except Exception:
         return None
 
 
@@ -170,7 +170,7 @@ def validate_frenchpostcode(v: Any) -> Optional[str]:
         if not v_str.isdigit():
             return None
         return v_str
-    except:
+    except Exception:
         return None
 
 
@@ -201,7 +201,7 @@ def validate_un_code(v: Any) -> Optional[int]:
         val = int(float(v_str))  # handle numeric strings
         if 0 <= val <= 3481:
             return val
-    except:
+    except Exception:
         pass
     return None
 
@@ -242,7 +242,7 @@ def validate_integer(v: Any) -> Optional[int]:
         return None
     try:
         return int(float(v_str))
-    except:
+    except Exception:
         return None
 
 
@@ -257,7 +257,7 @@ def validate_float(v: Any) -> Optional[float]:
         return None
     try:
         return float(v_str)
-    except:
+    except Exception:
         return None
 
 
@@ -333,7 +333,7 @@ def validate_bool(v: Any) -> bool:
             return True
         elif v_str in false_values:
             return False
-    except:
+    except Exception:
         pass
 
     return False
@@ -2091,11 +2091,6 @@ def sanitize(instance: Any, schema: dict[str, Any]) -> Any:
     return __sanitize_instance(instance, expanded_schema)
 
 
-import copy
-import json
-from .mime import generate_blake2b_hash_from_string
-
-
 def compute_schema_data_id(json_schema: dict[str, Any]) -> str:
     """Returns the schema_data_id for a given JSON schema.
 
{uiform → retab}/_utils/mime.py
RENAMED
@@ -4,16 +4,17 @@ import io
 import json
 import mimetypes
 from pathlib import Path
-from typing import
+from typing import Sequence, TypeVar, get_args
 
 import httpx
 import PIL.Image
+import puremagic
 from pydantic import HttpUrl
 
 from ..types.mime import MIMEData
 from ..types.modalities import SUPPORTED_TYPES
 
-T = TypeVar(
+T = TypeVar("T")
 
 
 def generate_blake2b_hash_from_bytes(bytes_: bytes) -> str:
@@ -25,7 +26,7 @@ def generate_blake2b_hash_from_base64(base64_string: str) -> str:
 
 
 def generate_blake2b_hash_from_string(input_string: str) -> str:
-    return generate_blake2b_hash_from_bytes(input_string.encode(
+    return generate_blake2b_hash_from_bytes(input_string.encode("utf-8"))
 
 
 def generate_blake2b_hash_from_dict(input_dict: dict) -> str:
@@ -43,7 +44,7 @@ def convert_pil_image_to_mime_data(image: PIL.Image.Image) -> MIMEData:
     """
     # Convert PIL image to base64 string
     buffered = io.BytesIO()
-    choosen_format = image.format if (image.format and image.format.lower() in [
+    choosen_format = image.format if (image.format and image.format.lower() in ["png", "jpeg", "gif", "webp"]) else "JPEG"
     image.save(buffered, format=choosen_format)
     base64_content = base64.b64encode(buffered.getvalue()).decode("utf-8")
 
@@ -98,13 +99,11 @@ def prepare_mime_document(document: Path | str | bytes | io.IOBase | MIMEData |
     if isinstance(document, bytes):
         # `document` is already the raw bytes
         try:
-            import puremagic
-
             extension = puremagic.from_string(document)
             if extension.lower() in [".jpg", ".jpeg", ".jfif"]:
                 extension = ".jpeg"
-        except:
-            extension =
+        except Exception:
+            extension = ".txt"
         file_bytes = document
         filename = "uploaded_file" + extension
     elif isinstance(document, io.IOBase):
@@ -112,19 +111,17 @@ def prepare_mime_document(document: Path | str | bytes | io.IOBase | MIMEData |
         file_bytes = document.read()
         filename = getattr(document, "name", "uploaded_file")
         filename = Path(filename).name
-    elif hasattr(document,
+    elif hasattr(document, "unicode_string") and callable(getattr(document, "unicode_string")):
         with httpx.Client() as client:
             url: str = document.unicode_string()  # type: ignore
             response = client.get(url)
             response.raise_for_status()
             try:
-                import puremagic
-
                 extension = puremagic.from_string(response.content)
                 if extension.lower() in [".jpg", ".jpeg", ".jfif"]:
                     extension = ".jpeg"
-            except:
-                extension =
+            except Exception:
+                extension = ".txt"
         file_bytes = response.content  # Fix: Use response.content instead of document
         filename = "uploaded_file" + extension
     else:
@@ -139,7 +136,7 @@ def prepare_mime_document(document: Path | str | bytes | io.IOBase | MIMEData |
     encoded_content = base64.b64encode(file_bytes).decode("utf-8")
     # Compute SHA-256 hash over the *base64-encoded* content
     hash_obj = hashlib.sha256(encoded_content.encode("utf-8"))
-
+    hash_obj.hexdigest()
 
     # Guess MIME type based on file extension
     guessed_type, _ = mimetypes.guess_type(filename)
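prepare_mime_document (partially visible above) normalises bytes, file-like objects, paths, URLs, or an existing MIMEData into a single MIME payload; this release moves the puremagic import to module level, narrows the bare except clauses to except Exception, and makes ".txt" the explicit fallback extension. A hedged sketch of the bytes branch; the import path follows the renamed layout in the file list, and the MIMEData return type is an assumption since the return annotation is outside the hunks shown:

# Hedged sketch: the bytes branch of prepare_mime_document.
from retab._utils.mime import prepare_mime_document

raw = b"plain text payload"  # content type is sniffed with puremagic; ".txt" is the fallback
mime_doc = prepare_mime_document(raw)  # filename is synthesised as "uploaded_file" + extension
print(type(mime_doc).__name__)  # expected to be MIMEData (assumption)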
{uiform → retab}/_utils/responses.py
RENAMED
@@ -16,13 +16,13 @@ from openai.types.responses.response_input_message_content_list_param import Res
 from openai.types.responses.response_input_param import ResponseInputItemParam
 from openai.types.responses.response_input_text_param import ResponseInputTextParam
 
-from ..types.chat import
+from ..types.chat import ChatCompletionRetabMessage
 from ..types.documents.extractions import UiParsedChatCompletion, UiParsedChoice
 
 
-def convert_to_openai_format(messages: list[
+def convert_to_openai_format(messages: list[ChatCompletionRetabMessage]) -> list[ResponseInputItemParam]:
     """
-    Converts a list of
+    Converts a list of ChatCompletionRetabMessage to the OpenAI ResponseInputParam format.
 
     Args:
         messages: List of chat messages in UIForm format
@@ -64,9 +64,9 @@ def convert_to_openai_format(messages: list[ChatCompletionUiformMessage]) -> lis
     return formatted_messages
 
 
-def convert_from_openai_format(messages: list[ResponseInputItemParam]) -> list[
+def convert_from_openai_format(messages: list[ResponseInputItemParam]) -> list[ChatCompletionRetabMessage]:
     """
-    Converts messages from OpenAI ResponseInputParam format to
+    Converts messages from OpenAI ResponseInputParam format to ChatCompletionRetabMessage format.
 
     Args:
         messages: Messages in OpenAI ResponseInputParam format
@@ -74,16 +74,22 @@ def convert_from_openai_format(messages: list[ResponseInputItemParam]) -> list[C
     Returns:
         List of chat messages in UIForm format
     """
-    formatted_messages: list[
+    formatted_messages: list[ChatCompletionRetabMessage] = []
 
     for message in messages:
+        if "role" not in message or "content" not in message:
+            # Mandatory fields for a message
+            if message.get("type") != "message":
+                print(f"Not supported message type: {message.get('type')}... Skipping...")
+            continue
+
+        role = message["role"]
+        content = message["content"]
+
         if "type" not in message:
             # The type is required by all other sub-types of ResponseInputItemParam except for EasyInputMessageParam and Message, which are messages.
             message["type"] = "message"
 
-        if message["type"] != "message":
-            print(f"Not supported message type: {message['type']}... Skipping...")
-            continue
         role = message["role"]
         content = message["content"]
         formatted_content: str | list[ChatCompletionContentPartParam]
@@ -104,7 +110,7 @@ def convert_from_openai_format(messages: list[ResponseInputItemParam]) -> list[C
                 print(f"Not supported content type: {part['type']}... Skipping...")
 
         # Create message in UIForm format
-        formatted_message =
+        formatted_message = ChatCompletionRetabMessage(role=role, content=formatted_content)
         formatted_messages.append(formatted_message)
 
     return formatted_messages
{uiform → retab}/_utils/stream_context_managers.py
RENAMED
@@ -1,7 +1,7 @@
 from contextlib import AbstractAsyncContextManager, AbstractContextManager
 from typing import Any, AsyncGenerator, Callable, Generator, TypeVar, Union
 
-T = TypeVar(
+T = TypeVar("T")
 
 
 class AsyncGeneratorContextManager(AbstractAsyncContextManager[AsyncGenerator[T, None]]):