PyPI - natural-pdf - Versions diffs - 0.1.21__py3-none-any.whl → 0.1.23__py3-none-any.whl - Mend

natural-pdf 0.1.21__py3-none-any.whl → 0.1.23__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (29) hide show

natural_pdf/analyzers/shape_detection_mixin.py +3 -3
natural_pdf/classification/manager.py +1 -1
natural_pdf/classification/mixin.py +35 -14
natural_pdf/classification/results.py +16 -1
natural_pdf/cli.py +9 -27
natural_pdf/core/highlighting_service.py +23 -0
natural_pdf/core/page.py +16 -0
natural_pdf/core/pdf.py +55 -49
natural_pdf/describe/base.py +2 -2
natural_pdf/describe/elements.py +1 -1
natural_pdf/elements/base.py +79 -1
natural_pdf/elements/collections.py +23 -1
natural_pdf/elements/region.py +54 -148
natural_pdf/exporters/paddleocr.py +1 -1
natural_pdf/extraction/manager.py +2 -2
natural_pdf/extraction/mixin.py +295 -11
natural_pdf/extraction/result.py +28 -1
natural_pdf/flows/region.py +1 -1
natural_pdf/ocr/engine_surya.py +25 -5
natural_pdf/qa/__init__.py +2 -1
natural_pdf/qa/document_qa.py +33 -37
natural_pdf/qa/qa_result.py +55 -0
natural_pdf/selectors/parser.py +22 -0
{natural_pdf-0.1.21.dist-info → natural_pdf-0.1.23.dist-info}/METADATA +21 -14
{natural_pdf-0.1.21.dist-info → natural_pdf-0.1.23.dist-info}/RECORD +29 -28
{natural_pdf-0.1.21.dist-info → natural_pdf-0.1.23.dist-info}/WHEEL +0 -0
{natural_pdf-0.1.21.dist-info → natural_pdf-0.1.23.dist-info}/entry_points.txt +0 -0
{natural_pdf-0.1.21.dist-info → natural_pdf-0.1.23.dist-info}/licenses/LICENSE +0 -0
{natural_pdf-0.1.21.dist-info → natural_pdf-0.1.23.dist-info}/top_level.txt +0 -0

natural_pdf/elements/region.py CHANGED Viewed

@@ -82,7 +82,7 @@ class Region(DirectionalMixin, ClassificationMixin, ExtractionMixin, ShapeDetect
         self.end_element = None
         self.metadata: Dict[str, Any] = {}
-        self.analyses: Dict[str, Any] = {}
+        # Analysis results live under self.metadata['analysis'] via property
         # Standard attributes for all elements
         self.object_type = "region"  # For selector compatibility
@@ -115,146 +115,28 @@ class Region(DirectionalMixin, ClassificationMixin, ExtractionMixin, ShapeDetect
         **kwargs,
     ) -> "Region":
         """
-        Protected helper method to create a region in a specified direction relative to this region.
+        Region-specific wrapper around :py:meth:`DirectionalMixin._direction`.
-        Args:
-            direction: 'left', 'right', 'above', or 'below'
-            size: Size in the primary direction (width for horizontal, height for vertical)
-            cross_size: Size in the cross direction ('full' or 'element')
-            include_source: Whether to include this region's area in the result
-            until: Optional selector string to specify a boundary element
-            include_endpoint: Whether to include the boundary element found by 'until'
-            **kwargs: Additional parameters for the 'until' selector search
-        Returns:
-            Region object
-        """
-        import math  # Use math.inf for infinity
-        is_horizontal = direction in ("left", "right")
-        is_positive = direction in ("right", "below")  # right/below are positive directions
-        pixel_offset = 1  # Offset for excluding elements/endpoints
-        # 1. Determine initial boundaries based on direction and include_source
-        if is_horizontal:
-            # Initial cross-boundaries (vertical)
-            y0 = 0 if cross_size == "full" else self.top
-            y1 = self.page.height if cross_size == "full" else self.bottom
-            # Initial primary boundaries (horizontal)
-            if is_positive:  # right
-                x0_initial = self.x0 if include_source else self.x1 + pixel_offset
-                x1_initial = self.x1  # This edge moves
-            else:  # left
-                x0_initial = self.x0  # This edge moves
-                x1_initial = self.x1 if include_source else self.x0 - pixel_offset
-        else:  # Vertical
-            # Initial cross-boundaries (horizontal)
-            x0 = 0 if cross_size == "full" else self.x0
-            x1 = self.page.width if cross_size == "full" else self.x1
-            # Initial primary boundaries (vertical)
-            if is_positive:  # below
-                y0_initial = self.top if include_source else self.bottom + pixel_offset
-                y1_initial = self.bottom  # This edge moves
-            else:  # above
-                y0_initial = self.top  # This edge moves
-                y1_initial = self.bottom if include_source else self.top - pixel_offset
-        # 2. Calculate the final primary boundary, considering 'size' or page limits
-        if is_horizontal:
-            if is_positive:  # right
-                x1_final = min(
-                    self.page.width,
-                    x1_initial + (size if size is not None else (self.page.width - x1_initial)),
-                )
-                x0_final = x0_initial
-            else:  # left
-                x0_final = max(0, x0_initial - (size if size is not None else x0_initial))
-                x1_final = x1_initial
-        else:  # Vertical
-            if is_positive:  # below
-                y1_final = min(
-                    self.page.height,
-                    y1_initial + (size if size is not None else (self.page.height - y1_initial)),
-                )
-                y0_final = y0_initial
-            else:  # above
-                y0_final = max(0, y0_initial - (size if size is not None else y0_initial))
-                y1_final = y1_initial
-        # 3. Handle 'until' selector if provided
-        target = None
-        if until:
-            all_matches = self.page.find_all(until, **kwargs)
-            matches_in_direction = []
-            # Filter and sort matches based on direction
-            if direction == "above":
-                matches_in_direction = [m for m in all_matches if m.bottom <= self.top]
-                matches_in_direction.sort(key=lambda e: e.bottom, reverse=True)
-            elif direction == "below":
-                matches_in_direction = [m for m in all_matches if m.top >= self.bottom]
-                matches_in_direction.sort(key=lambda e: e.top)
-            elif direction == "left":
-                matches_in_direction = [m for m in all_matches if m.x1 <= self.x0]
-                matches_in_direction.sort(key=lambda e: e.x1, reverse=True)
-            elif direction == "right":
-                matches_in_direction = [m for m in all_matches if m.x0 >= self.x1]
-                matches_in_direction.sort(key=lambda e: e.x0)
-            if matches_in_direction:
-                target = matches_in_direction[0]
-                # Adjust the primary boundary based on the target
-                if is_horizontal:
-                    if is_positive:  # right
-                        x1_final = target.x1 if include_endpoint else target.x0 - pixel_offset
-                    else:  # left
-                        x0_final = target.x0 if include_endpoint else target.x1 + pixel_offset
-                else:  # Vertical
-                    if is_positive:  # below
-                        y1_final = target.bottom if include_endpoint else target.top - pixel_offset
-                    else:  # above
-                        y0_final = target.top if include_endpoint else target.bottom + pixel_offset
-                # Adjust cross boundaries if cross_size is 'element'
-                if cross_size == "element":
-                    if is_horizontal:  # Adjust y0, y1
-                        target_y0 = (
-                            target.top if include_endpoint else target.bottom
-                        )  # Use opposite boundary if excluding
-                        target_y1 = target.bottom if include_endpoint else target.top
-                        y0 = min(y0, target_y0)
-                        y1 = max(y1, target_y1)
-                    else:  # Adjust x0, x1
-                        target_x0 = (
-                            target.x0 if include_endpoint else target.x1
-                        )  # Use opposite boundary if excluding
-                        target_x1 = target.x1 if include_endpoint else target.x0
-                        x0 = min(x0, target_x0)
-                        x1 = max(x1, target_x1)
-        # 4. Finalize bbox coordinates
-        if is_horizontal:
-            bbox = (x0_final, y0, x1_final, y1)
-        else:
-            bbox = (x0, y0_final, x1, y1_final)
+        It performs any pre-processing required by *Region* (none currently),
+        delegates the core geometry work to the mix-in implementation via
+        ``super()``, then attaches region-level metadata before returning the
+        new :class:`Region` instance.
+        """
-        # Ensure valid coordinates (x0 <= x1, y0 <= y1)
-        final_x0 = min(bbox[0], bbox[2])
-        final_y0 = min(bbox[1], bbox[3])
-        final_x1 = max(bbox[0], bbox[2])
-        final_y1 = max(bbox[1], bbox[3])
-        final_bbox = (final_x0, final_y0, final_x1, final_y1)
+        # Delegate to the shared implementation on DirectionalMixin
+        region = super()._direction(
+            direction=direction,
+            size=size,
+            cross_size=cross_size,
+            include_source=include_source,
+            until=until,
+            include_endpoint=include_endpoint,
+            **kwargs,
+        )
-        # 5. Create and return Region
-        region = Region(self.page, final_bbox)
+        # Post-process: make sure callers can trace lineage and flags
         region.source_element = self
         region.includes_source = include_source
-        # Optionally store the boundary element if found
-        if target:
-            region.boundary_element = target
         return region
@@ -710,7 +592,7 @@ class Region(DirectionalMixin, ClassificationMixin, ExtractionMixin, ShapeDetect
         self,
         scale: float = 2.0,
         resolution: float = 150,
-        crop_only: bool = False,
+        crop: bool = False,
         include_highlights: bool = True,
         **kwargs,
     ) -> "Image.Image":
@@ -719,7 +601,7 @@ class Region(DirectionalMixin, ClassificationMixin, ExtractionMixin, ShapeDetect
         Args:
             resolution: Resolution in DPI for rendering (default: 150)
-            crop_only: If True, only crop the region without highlighting its boundaries
+            crop: If True, only crop the region without highlighting its boundaries
             include_highlights: Whether to include existing highlights (default: True)
             **kwargs: Additional parameters for page.to_image()
@@ -730,7 +612,7 @@ class Region(DirectionalMixin, ClassificationMixin, ExtractionMixin, ShapeDetect
         page_kwargs = kwargs.copy()
         effective_resolution = resolution  # Start with the provided resolution
-        if crop_only and "width" in kwargs:
+        if crop and "width" in kwargs:
             target_width = kwargs["width"]
             # Calculate what resolution is needed to make the region crop have target_width
             region_width_points = self.width  # Region width in PDF points
@@ -785,8 +667,8 @@ class Region(DirectionalMixin, ClassificationMixin, ExtractionMixin, ShapeDetect
         # Crop the image to just this region
         region_image = page_image.crop((x0, top, x1, bottom))
-        # If not crop_only, add a border to highlight the region boundaries
-        if not crop_only:
+        # If not crop, add a border to highlight the region boundaries
+        if not crop:
             from PIL import ImageDraw
             # Create a 1px border around the region
@@ -808,6 +690,7 @@ class Region(DirectionalMixin, ClassificationMixin, ExtractionMixin, ShapeDetect
         color: Optional[Union[Tuple, str]] = "blue",
         label: Optional[str] = None,
         width: Optional[int] = None,  # Add width parameter
+        crop: bool = False,  # NEW: Crop output to region bounds before legend
     ) -> "Image.Image":
         """
         Show the page with just this region highlighted temporarily.
@@ -819,6 +702,9 @@ class Region(DirectionalMixin, ClassificationMixin, ExtractionMixin, ShapeDetect
             color: Color to highlight this region (default: blue)
             label: Optional label for this region in the legend
             width: Optional width for the output image in pixels
+            crop: If True, crop the rendered image to this region's
+                        bounding box (with a small margin handled inside
+                        HighlightingService) before legends/overlays are added.
         Returns:
             PIL Image of the page with only this region highlighted
@@ -844,6 +730,9 @@ class Region(DirectionalMixin, ClassificationMixin, ExtractionMixin, ShapeDetect
             "use_color_cycling": False,  # Explicitly false for single preview
         }
+        # Determine crop bbox if requested
+        crop_bbox = self.bbox if crop else None
         # Use render_preview to show only this highlight
         return service.render_preview(
             page_index=self._page.index,
@@ -852,6 +741,7 @@ class Region(DirectionalMixin, ClassificationMixin, ExtractionMixin, ShapeDetect
             width=width,  # Pass the width parameter
             labels=labels,
             legend_position=legend_position,
+            crop_bbox=crop_bbox,
         )
     def save(
@@ -880,7 +770,7 @@ class Region(DirectionalMixin, ClassificationMixin, ExtractionMixin, ShapeDetect
         self,
         filename: str,
         resolution: float = 150,
-        crop_only: bool = False,
+        crop: bool = False,
         include_highlights: bool = True,
         **kwargs,
     ) -> "Region":
@@ -890,7 +780,7 @@ class Region(DirectionalMixin, ClassificationMixin, ExtractionMixin, ShapeDetect
         Args:
             filename: Path to save the image to
             resolution: Resolution in DPI for rendering (default: 150)
-            crop_only: If True, only crop the region without highlighting its boundaries
+            crop: If True, only crop the region without highlighting its boundaries
             include_highlights: Whether to include existing highlights (default: True)
             **kwargs: Additional parameters for page.to_image()
@@ -900,7 +790,7 @@ class Region(DirectionalMixin, ClassificationMixin, ExtractionMixin, ShapeDetect
         # Get the region image
         image = self.to_image(
             resolution=resolution,
-            crop_only=crop_only,
+            crop=crop,
             include_highlights=include_highlights,
             **kwargs,
         )
@@ -953,7 +843,7 @@ class Region(DirectionalMixin, ClassificationMixin, ExtractionMixin, ShapeDetect
         # Get the region image
         image = work_region.to_image(
-            resolution=resolution, crop_only=True, include_highlights=False
+            resolution=resolution, crop=True, include_highlights=False
         )
         if image is None:
@@ -2044,7 +1934,7 @@ class Region(DirectionalMixin, ClassificationMixin, ExtractionMixin, ShapeDetect
         # Render the page region to an image using the determined resolution
         try:
             region_image = self.to_image(
-                resolution=final_resolution, include_highlights=False, crop_only=True
+                resolution=final_resolution, include_highlights=False, crop=True
             )
             if not region_image:
                 logger.error("Failed to render region to image for OCR.")
@@ -2466,7 +2356,7 @@ class Region(DirectionalMixin, ClassificationMixin, ExtractionMixin, ShapeDetect
             from natural_pdf.qa.document_qa import get_qa_engine
         except ImportError:
             logger.error(
-                "Question answering requires optional dependencies. Install with `pip install natural-pdf[core-ml]`"
+                "Question answering requires optional dependencies. Install with `pip install natural-pdf[ai]`"
             )
             return {
                 "answer": None,
@@ -2684,7 +2574,7 @@ class Region(DirectionalMixin, ClassificationMixin, ExtractionMixin, ShapeDetect
             img = self.to_image(
                 resolution=resolution,
                 include_highlights=False,  # No highlights for classification input
-                crop_only=True,  # Just the region content
+                crop=True,  # Just the region content
             )
             if img is None:
                 raise ValueError(
@@ -2964,4 +2854,20 @@ class Region(DirectionalMixin, ClassificationMixin, ExtractionMixin, ShapeDetect
         return text_element
+    # ------------------------------------------------------------------
+    # Unified analysis storage (maps to metadata["analysis"])
+    # ------------------------------------------------------------------
+    @property
+    def analyses(self) -> Dict[str, Any]:
+        if not hasattr(self, "metadata") or self.metadata is None:
+            self.metadata = {}
+        return self.metadata.setdefault("analysis", {})
+    @analyses.setter
+    def analyses(self, value: Dict[str, Any]):
+        if not hasattr(self, "metadata") or self.metadata is None:
+            self.metadata = {}
+        self.metadata["analysis"] = value

natural_pdf/exporters/paddleocr.py CHANGED Viewed

@@ -217,7 +217,7 @@ class PaddleOCRRecognitionExporter(FinetuneExporter):
                         # Expand region, render, and save image
                         region = element.expand(self.padding)
                         img = region.to_image(
-                            resolution=self.resolution, crop_only=True, include_highlights=False
+                            resolution=self.resolution, crop=True, include_highlights=False
                         )
                         img.save(absolute_image_path, "PNG")

natural_pdf/extraction/manager.py CHANGED Viewed

@@ -126,10 +126,10 @@ class StructuredDataManager:
             )
             parsed_data = completion.choices[0].message.parsed
             return StructuredDataResult(
-                data=parsed_data, success=True, error_message=None, model=selected_model
+                data=parsed_data, success=True, error_message=None, model_used=selected_model
             )
         except Exception as e:
             logger.error(f"Extraction failed: {str(e)}")
             return StructuredDataResult(
-                data=None, success=False, error_message=str(e), model=selected_model
+                data=None, success=False, error_message=str(e), model_used=selected_model
             )

natural-pdf 0.1.21__py3-none-any.whl → 0.1.23__py3-none-any.whl

natural-pdf 0.1.21__py3-none-any.whl → 0.1.23__py3-none-any.whl