PyPI - natural-pdf - Versions diffs - 0.1.38__py3-none-any.whl → 0.2.0__py3-none-any.whl - Mend

natural-pdf 0.1.38-py3-none-any.whl → 0.2.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (55)

natural_pdf/__init__.py +11 -6
natural_pdf/analyzers/__init__.py +6 -1
natural_pdf/analyzers/guides.py +354 -258
natural_pdf/analyzers/layout/layout_analyzer.py +2 -3
natural_pdf/analyzers/layout/layout_manager.py +18 -4
natural_pdf/analyzers/layout/paddle.py +11 -0
natural_pdf/analyzers/layout/surya.py +2 -3
natural_pdf/analyzers/shape_detection_mixin.py +25 -34
natural_pdf/analyzers/text_structure.py +2 -2
natural_pdf/classification/manager.py +1 -1
natural_pdf/collections/mixins.py +3 -2
natural_pdf/core/highlighting_service.py +743 -32
natural_pdf/core/page.py +252 -399
natural_pdf/core/page_collection.py +1249 -0
natural_pdf/core/pdf.py +231 -89
natural_pdf/{collections → core}/pdf_collection.py +18 -11
natural_pdf/core/render_spec.py +335 -0
natural_pdf/describe/base.py +1 -1
natural_pdf/elements/__init__.py +1 -0
natural_pdf/elements/base.py +108 -83
natural_pdf/elements/{collections.py → element_collection.py} +575 -1372
natural_pdf/elements/line.py +0 -1
natural_pdf/elements/rect.py +0 -1
natural_pdf/elements/region.py +405 -280
natural_pdf/elements/text.py +9 -7
natural_pdf/exporters/base.py +2 -2
natural_pdf/exporters/original_pdf.py +1 -1
natural_pdf/exporters/paddleocr.py +2 -4
natural_pdf/exporters/searchable_pdf.py +3 -2
natural_pdf/extraction/mixin.py +1 -3
natural_pdf/flows/collections.py +1 -69
natural_pdf/flows/element.py +25 -0
natural_pdf/flows/flow.py +1658 -19
natural_pdf/flows/region.py +757 -263
natural_pdf/ocr/ocr_options.py +0 -2
natural_pdf/ocr/utils.py +2 -1
natural_pdf/qa/document_qa.py +21 -5
natural_pdf/search/search_service_protocol.py +1 -1
natural_pdf/selectors/parser.py +35 -2
natural_pdf/tables/result.py +35 -1
natural_pdf/text_mixin.py +101 -0
natural_pdf/utils/debug.py +2 -1
natural_pdf/utils/highlighting.py +1 -0
natural_pdf/utils/layout.py +2 -2
natural_pdf/utils/packaging.py +4 -3
natural_pdf/utils/text_extraction.py +15 -12
natural_pdf/utils/visualization.py +385 -0
{natural_pdf-0.1.38.dist-info → natural_pdf-0.2.0.dist-info}/METADATA +7 -3
{natural_pdf-0.1.38.dist-info → natural_pdf-0.2.0.dist-info}/RECORD +55 -52
optimization/memory_comparison.py +1 -1
optimization/pdf_analyzer.py +2 -2
{natural_pdf-0.1.38.dist-info → natural_pdf-0.2.0.dist-info}/WHEEL +0 -0
{natural_pdf-0.1.38.dist-info → natural_pdf-0.2.0.dist-info}/entry_points.txt +0 -0
{natural_pdf-0.1.38.dist-info → natural_pdf-0.2.0.dist-info}/licenses/LICENSE +0 -0
{natural_pdf-0.1.38.dist-info → natural_pdf-0.2.0.dist-info}/top_level.txt +0 -0

natural_pdf/{collections → core}/pdf_collection.py RENAMED Viewed

@@ -588,24 +588,25 @@ class PDFCollection(
         # Get classification manager from first PDF
         try:
             first_pdf = self._pdfs[0]
-            if not hasattr(first_pdf, 'get_manager'):
+            if not hasattr(first_pdf, "get_manager"):
                 raise RuntimeError("PDFs do not support classification manager")
-            manager = first_pdf.get_manager('classification')
+            manager = first_pdf.get_manager("classification")
             if not manager or not manager.is_available():
                 raise RuntimeError("ClassificationManager is not available")
         except Exception as e:
             from natural_pdf.classification.manager import ClassificationError
             raise ClassificationError(f"Cannot access ClassificationManager: {e}") from e
         # Determine processing mode early
         inferred_using = manager.infer_using(model if model else manager.DEFAULT_TEXT_MODEL, using)
         # Gather content from all PDFs
         pdf_contents = []
         valid_pdfs = []
         logger.info(f"Gathering content from {len(self._pdfs)} PDFs for batch classification...")
         for pdf in self._pdfs:
             try:
                 # Get the content for classification - use the same logic as individual PDF classify
@@ -618,16 +619,18 @@ class PDFCollection(
                 elif inferred_using == "vision":
                     # For vision, we need single-page PDFs only
                     if len(pdf.pages) != 1:
-                        logger.warning(f"Skipping PDF {pdf.path}: Vision classification requires single-page PDFs")
+                        logger.warning(
+                            f"Skipping PDF {pdf.path}: Vision classification requires single-page PDFs"
+                        )
                         continue
                     # Get first page image
-                    content = pdf.pages[0].to_image()
+                    content = pdf.pages[0].render()
                 else:
                     raise ValueError(f"Unsupported using mode: {inferred_using}")
                 pdf_contents.append(content)
                 valid_pdfs.append(pdf)
             except Exception as e:
                 logger.warning(f"Skipping PDF {pdf.path}: Error getting content - {e}")
                 continue
@@ -636,7 +639,9 @@ class PDFCollection(
             logger.warning("No valid content could be gathered from PDFs for classification.")
             return self
-        logger.info(f"Gathered content from {len(valid_pdfs)} PDFs. Running batch classification...")
+        logger.info(
+            f"Gathered content from {len(valid_pdfs)} PDFs. Running batch classification..."
+        )
         # Run batch classification
         try:
@@ -651,6 +656,7 @@ class PDFCollection(
         except Exception as e:
             logger.error(f"Batch classification failed: {e}")
             from natural_pdf.classification.manager import ClassificationError
             raise ClassificationError(f"Batch classification failed: {e}") from e
         # Assign results back to PDFs
@@ -660,10 +666,11 @@ class PDFCollection(
                 f"with PDFs processed ({len(valid_pdfs)}). Cannot assign results."
             )
             from natural_pdf.classification.manager import ClassificationError
             raise ClassificationError("Batch result count mismatch with input PDFs")
         logger.info(f"Assigning {len(batch_results)} results to PDFs under key '{analysis_key}'.")
         processed_count = 0
         for pdf, result_obj in zip(valid_pdfs, batch_results):
             try:

natural_pdf/core/render_spec.py ADDED Viewed

@@ -0,0 +1,335 @@
+"""Unified rendering infrastructure for natural-pdf.
+This module provides the core components for the unified image generation system:
+- RenderSpec: Data structure describing what to render
+- Visualizable: Mixin providing show/render/export methods
+"""
+import logging
+from dataclasses import dataclass, field
+from pathlib import Path
+from typing import TYPE_CHECKING, Any, Dict, List, Literal, Optional, Tuple, Union
+if TYPE_CHECKING:
+    from PIL import Image as PIL_Image
+    from natural_pdf.core.page import Page
+    from natural_pdf.elements.base import Element
+logger = logging.getLogger(__name__)
+@dataclass
+class RenderSpec:
+    """Specification for rendering a single page or region.
+    This is the core data structure that unifies all rendering operations.
+    Every visual object in natural-pdf converts its display requirements
+    into one or more RenderSpecs, which are then processed by the
+    unified rendering pipeline.
+    Attributes:
+        page: The page to render
+        crop_bbox: Optional bounding box (x0, y0, x1, y1) to crop to
+        highlights: List of highlight specifications, each containing:
+            - bbox or polygon: The geometry to highlight
+            - color: Optional color for the highlight
+            - label: Optional label text
+            - element: Optional reference to the source element
+    """
+    page: "Page"
+    crop_bbox: Optional[Tuple[float, float, float, float]] = None
+    highlights: List[Dict[str, Any]] = field(default_factory=list)
+    def add_highlight(
+        self,
+        bbox: Optional[Tuple[float, float, float, float]] = None,
+        polygon: Optional[List[Tuple[float, float]]] = None,
+        color: Optional[Union[str, Tuple[int, int, int]]] = None,
+        label: Optional[str] = None,
+        element: Optional["Element"] = None,
+    ) -> None:
+        """Add a highlight to this render spec.
+        Args:
+            bbox: Bounding box to highlight
+            polygon: Polygon points to highlight (alternative to bbox)
+            color: Color for the highlight
+            label: Label text for the highlight
+            element: Source element reference
+        """
+        if bbox is None and polygon is None and element is not None:
+            # Extract geometry from element
+            if (
+                hasattr(element, "polygon")
+                and hasattr(element, "has_polygon")
+                and element.has_polygon
+            ):
+                polygon = element.polygon
+            elif hasattr(element, "bbox"):
+                bbox = element.bbox
+        if bbox is None and polygon is None:
+            raise ValueError("Must provide bbox, polygon, or element with geometry")
+        highlight = {
+            "bbox": bbox,
+            "polygon": polygon,
+            "color": color,
+            "label": label,
+            "element": element,
+        }
+        # Remove None values
+        highlight = {k: v for k, v in highlight.items() if v is not None}
+        self.highlights.append(highlight)
+class Visualizable:
+    """Mixin class providing unified show/render/export methods.
+    Classes that inherit from Visualizable need only implement
+    _get_render_specs() to gain full image generation capabilities.
+    """
+    def _get_render_specs(
+        self, mode: Literal["show", "render"] = "show", **kwargs
+    ) -> List[RenderSpec]:
+        """Get render specifications for this object.
+        This is the only method subclasses need to implement.
+        It should return a list of RenderSpec objects describing
+        what needs to be rendered.
+        Args:
+            mode: Rendering mode - 'show' includes highlights, 'render' is clean
+            **kwargs: Additional parameters from show/render methods
+        Returns:
+            List of RenderSpec objects
+        """
+        raise NotImplementedError(f"{self.__class__.__name__} must implement _get_render_specs()")
+    def _get_highlighter(self):
+        """Get the highlighting service for rendering.
+        This method should be overridden by classes that have
+        a different way of accessing the highlighter.
+        """
+        # Try common patterns
+        if hasattr(self, "_highlighter"):
+            return self._highlighter
+        elif hasattr(self, "page") and hasattr(self.page, "_highlighter"):
+            return self.page._highlighter
+        elif hasattr(self, "pages") and self.pages:
+            # For collections, use first page's highlighter
+            first_page = next(iter(self.pages))
+            if hasattr(first_page, "_highlighter"):
+                return first_page._highlighter
+        raise RuntimeError(
+            f"Cannot find HighlightingService for {self.__class__.__name__}. "
+            "Override _get_highlighter() to provide access."
+        )
+    def show(
+        self,
+        *,
+        # Basic rendering options
+        resolution: Optional[float] = None,
+        width: Optional[int] = None,
+        # Highlight options
+        color: Optional[Union[str, Tuple[int, int, int]]] = None,
+        labels: bool = True,
+        label_format: Optional[str] = None,
+        highlights: Optional[List[Dict[str, Any]]] = None,
+        legend_position: str = "right",
+        annotate: Optional[Union[str, List[str]]] = None,
+        # Layout options for multi-page/region
+        layout: Literal["stack", "grid", "single"] = "stack",
+        stack_direction: Literal["vertical", "horizontal"] = "vertical",
+        gap: int = 5,
+        columns: Optional[int] = None,  # For grid layout
+        # Cropping options
+        crop: Union[bool, Literal["content"]] = False,
+        crop_bbox: Optional[Tuple[float, float, float, float]] = None,
+        **kwargs,
+    ) -> Optional["PIL_Image"]:
+        """Generate a preview image with highlights.
+        This method is for interactive debugging and visualization.
+        Elements are highlighted to show what's selected or being worked with.
+        Args:
+            resolution: DPI for rendering (default from global settings)
+            width: Target width in pixels (overrides resolution)
+            color: Default highlight color
+            labels: Whether to show labels for highlights
+            label_format: Format string for labels (e.g., "Element {index}")
+            highlights: Additional highlight groups to show
+            legend_position: Position of legend/colorbar ('right', 'left', 'top', 'bottom')
+            annotate: Attribute name(s) to display on highlights (string or list)
+            layout: How to arrange multiple pages/regions
+            stack_direction: Direction for stack layout
+            gap: Pixels between stacked images
+            columns: Number of columns for grid layout
+            crop: Whether to crop (True, False, or 'content' for bbox of elements)
+            crop_bbox: Explicit crop bounds
+            **kwargs: Additional parameters passed to rendering
+        Returns:
+            PIL Image object or None if nothing to render
+        """
+        # Convert string to list if needed
+        if isinstance(annotate, str):
+            annotate = [annotate]
+        specs = self._get_render_specs(
+            mode="show",
+            color=color,
+            highlights=highlights,
+            crop=crop,
+            crop_bbox=crop_bbox,
+            annotate=annotate,
+            **kwargs,
+        )
+        if not specs:
+            logger.warning(f"{self.__class__.__name__}.show() generated no render specs")
+            return None
+        highlighter = self._get_highlighter()
+        return highlighter.unified_render(
+            specs=specs,
+            resolution=resolution,
+            width=width,
+            labels=labels,
+            label_format=label_format,
+            legend_position=legend_position,
+            layout=layout,
+            stack_direction=stack_direction,
+            gap=gap,
+            columns=columns,
+            **kwargs,
+        )
+    def render(
+        self,
+        *,
+        # Basic rendering options
+        resolution: Optional[float] = None,
+        width: Optional[int] = None,
+        # Layout options for multi-page/region
+        layout: Literal["stack", "grid", "single"] = "stack",
+        stack_direction: Literal["vertical", "horizontal"] = "vertical",
+        gap: int = 5,
+        columns: Optional[int] = None,
+        # Cropping options
+        crop: Union[bool, Literal["content"]] = False,
+        crop_bbox: Optional[Tuple[float, float, float, float]] = None,
+        **kwargs,
+    ) -> Optional["PIL_Image"]:
+        """Generate a clean image without highlights.
+        This method produces publication-ready images without
+        any debugging annotations or highlights.
+        Args:
+            resolution: DPI for rendering (default from global settings)
+            width: Target width in pixels (overrides resolution)
+            layout: How to arrange multiple pages/regions
+            stack_direction: Direction for stack layout
+            gap: Pixels between stacked images
+            columns: Number of columns for grid layout
+            crop: Whether to crop
+            crop_bbox: Explicit crop bounds
+            **kwargs: Additional parameters passed to rendering
+        Returns:
+            PIL Image object or None if nothing to render
+        """
+        specs = self._get_render_specs(mode="render", crop=crop, crop_bbox=crop_bbox, **kwargs)
+        if not specs:
+            logger.warning(f"{self.__class__.__name__}.render() generated no render specs")
+            return None
+        highlighter = self._get_highlighter()
+        return highlighter.unified_render(
+            specs=specs,
+            resolution=resolution,
+            width=width,
+            labels=False,  # Never show labels in render mode
+            layout=layout,
+            stack_direction=stack_direction,
+            gap=gap,
+            columns=columns,
+            **kwargs,
+        )
+    def export(
+        self,
+        path: Union[str, Path],
+        *,
+        # All the same options as render()
+        resolution: Optional[float] = None,
+        width: Optional[int] = None,
+        layout: Literal["stack", "grid", "single"] = "stack",
+        stack_direction: Literal["vertical", "horizontal"] = "vertical",
+        gap: int = 5,
+        columns: Optional[int] = None,
+        crop: Union[bool, Literal["content"]] = False,
+        crop_bbox: Optional[Tuple[float, float, float, float]] = None,
+        format: Optional[str] = None,
+        **kwargs,
+    ) -> None:
+        """Export a clean image to file.
+        This is a convenience method that renders and saves in one step.
+        Args:
+            path: Output file path
+            resolution: DPI for rendering
+            width: Target width in pixels
+            layout: How to arrange multiple pages/regions
+            stack_direction: Direction for stack layout
+            gap: Pixels between stacked images
+            columns: Number of columns for grid layout
+            crop: Whether to crop
+            crop_bbox: Explicit crop bounds
+            format: Image format (inferred from path if not specified)
+            **kwargs: Additional parameters passed to rendering
+        """
+        image = self.render(
+            resolution=resolution,
+            width=width,
+            layout=layout,
+            stack_direction=stack_direction,
+            gap=gap,
+            columns=columns,
+            crop=crop,
+            crop_bbox=crop_bbox,
+            **kwargs,
+        )
+        if image is None:
+            raise ValueError(f"No image generated by {self.__class__.__name__}.render()")
+        # Ensure path is a Path object
+        path = Path(path)
+        # Determine format
+        if format is None:
+            format = path.suffix.lstrip(".").upper()
+            if format == "JPG":
+                format = "JPEG"
+        # Save image
+        save_kwargs = {}
+        if format == "JPEG":
+            save_kwargs["quality"] = kwargs.get("quality", 95)
+        elif format == "PNG":
+            save_kwargs["compress_level"] = kwargs.get("compress_level", 6)
+        image.save(path, format=format, **save_kwargs)
+        logger.info(f"Exported {self.__class__.__name__} to {path}")

natural_pdf/describe/base.py CHANGED Viewed

@@ -17,7 +17,7 @@ from .summary import ElementSummary, InspectionSummary
 if TYPE_CHECKING:
     from natural_pdf.core.page import Page
     from natural_pdf.elements.base import Element
-    from natural_pdf.elements.collections import ElementCollection
+    from natural_pdf.elements.element_collection import ElementCollection
     from natural_pdf.elements.region import Region
 logger = logging.getLogger(__name__)

natural_pdf/elements/__init__.py CHANGED Viewed

@@ -1,3 +1,4 @@
 """
 Element classes for Natural PDF.
 """

natural-pdf 0.1.38__py3-none-any.whl → 0.2.0__py3-none-any.whl

natural-pdf 0.1.38-py3-none-any.whl → 0.2.0-py3-none-any.whl