PyPI - docling-ibm-models - Versions diffs - 1.1.5__py3-none-any.whl → 1.1.7__py3-none-any.whl - Mend

docling-ibm-models 1.1.5__py3-none-any.whl → 1.1.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (9) hide show

docling_ibm_models/tableformer/data_management/matching_post_processor.py CHANGED Viewed

@@ -4,6 +4,7 @@
 #
 import json
 import logging
+import math
 import statistics
 import docling_ibm_models.tableformer.settings as s
@@ -403,45 +404,63 @@ class MatchingPostProcessor:
                 # Push horizontally
                 if x1_min < x2_min:
                     # Move box1 to the left and box2 to the right
-                    box1["bbox"][2] -= overlap_x
-                    box2["bbox"][0] += overlap_x
+                    box1["bbox"][2] -= math.ceil(overlap_x / 2) + 2
+                    box2["bbox"][0] += math.floor(overlap_x / 2)
                 else:
                     # Move box2 to the left and box1 to the right
-                    box2["bbox"][2] -= overlap_x
-                    box1["bbox"][0] += overlap_x
+                    box2["bbox"][2] -= math.ceil(overlap_x / 2) + 2
+                    box1["bbox"][0] += math.floor(overlap_x / 2)
             else:
                 # Push vertically
                 if y1_min < y2_min:
                     # Move box1 up and box2 down
-                    box1["bbox"][3] -= overlap_y
-                    box2["bbox"][1] += overlap_y
+                    box1["bbox"][3] -= math.ceil(overlap_y / 2) + 2
+                    box2["bbox"][1] += math.floor(overlap_y / 2)
                 else:
                     # Move box2 up and box1 down
-                    box2["bbox"][3] -= overlap_y
-                    box1["bbox"][1] += overlap_y
+                    box2["bbox"][3] -= math.ceil(overlap_y / 2) + 2
+                    box1["bbox"][1] += math.floor(overlap_y / 2)
+            # Will flip coordinates in proper order, if previous operations reversed it
+            box1["bbox"] = [
+                min(box1["bbox"][0], box1["bbox"][2]),
+                min(box1["bbox"][1], box1["bbox"][3]),
+                max(box1["bbox"][0], box1["bbox"][2]),
+                max(box1["bbox"][1], box1["bbox"][3]),
+            ]
+            box2["bbox"] = [
+                min(box2["bbox"][0], box2["bbox"][2]),
+                min(box2["bbox"][1], box2["bbox"][3]),
+                max(box2["bbox"][0], box2["bbox"][2]),
+                max(box2["bbox"][1], box2["bbox"][3]),
+            ]
             return box1, box2
         def do_boxes_overlap(box1, box2):
-            # print("{} - {}".format(box1["bbox"], box2["bbox"]))
-            # Extract coordinates from the bounding boxes
-            x1_min, y1_min, x1_max, y1_max = box1["bbox"]
-            x2_min, y2_min, x2_max, y2_max = box2["bbox"]
-            # Check if one box is to the left of the other
-            if x1_max < x2_min or x2_max < x1_min:
+            B1 = box1["bbox"]
+            B2 = box2["bbox"]
+            if (
+                (B1[0] >= B2[2])
+                or (B1[2] <= B2[0])
+                or (B1[3] <= B2[1])
+                or (B1[1] >= B2[3])
+            ):
                 return False
-            # Check if one box is above the other
-            if y1_max < y2_min or y2_max < y1_min:
-                return False
-            return True
+            else:
+                return True
         def find_overlapping_pairs_indexes(bboxes):
             overlapping_indexes = []
             # Compare each box with every other box (combinations)
             for i in range(len(bboxes)):
                 for j in range(i + 1, len(bboxes)):
-                    if do_boxes_overlap(bboxes[i], bboxes[j]):
-                        bboxes[i], bboxes[j] = correct_overlap(bboxes[i], bboxes[j])
+                    if i != j:
+                        if bboxes[i] != bboxes[j]:
+                            if do_boxes_overlap(bboxes[i], bboxes[j]):
+                                bboxes[i], bboxes[j] = correct_overlap(
+                                    bboxes[i], bboxes[j]
+                                )
             return overlapping_indexes, bboxes
@@ -1144,7 +1163,7 @@ class MatchingPostProcessor:
                 new_pdf_cells.append(pdf_cells[i])
         return new_pdf_cells
-    def process(self, matching_details):
+    def process(self, matching_details, correct_overlapping_cells=False):
         r"""
         Do post processing, see details in the comments below
@@ -1348,9 +1367,10 @@ class MatchingPostProcessor:
         table_cells_wo = po2
         max_cell_id = po3
-        # As the last step - correct cell bboxes in a way that they don't overlap:
-        if len(table_cells_wo) <= 300:  # For performance reasons
-            table_cells_wo = self._find_overlapping(table_cells_wo)
+        if correct_overlapping_cells:
+            # As the last step - correct cell bboxes in a way that they don't overlap:
+            if len(table_cells_wo) <= 300:  # For performance reasons
+                table_cells_wo = self._find_overlapping(table_cells_wo)
         self._log().debug("*** final_matches_wo")
         self._log().debug(final_matches_wo)

docling_ibm_models/tableformer/data_management/tf_cell_matcher.py CHANGED Viewed

@@ -127,13 +127,14 @@ class CellMatcher:
             Dictionary with all details about the mathings between the table and pdf cells
         """
         pdf_cells = copy.deepcopy(iocr_page["tokens"])
-        for word in pdf_cells:
-            word["bbox"] = [
-                word["bbox"]["l"],
-                word["bbox"]["t"],
-                word["bbox"]["r"],
-                word["bbox"]["b"],
-            ]
+        if len(pdf_cells) > 0:
+            for word in pdf_cells:
+                word["bbox"] = [
+                    word["bbox"]["l"],
+                    word["bbox"]["t"],
+                    word["bbox"]["r"],
+                    word["bbox"]["b"],
+                ]
         table_bboxes = prediction["bboxes"]
         table_classes = prediction["classes"]
         # BBOXES transformed...
@@ -145,9 +146,13 @@ class CellMatcher:
         table_cells = self._build_table_cells(
             html_seq, otsl_seq, table_bboxes_page, table_classes
         )
-        matches, matches_counter = self._intersection_over_pdf_match(
-            table_cells, pdf_cells
-        )
+        matches = {}
+        matches_counter = 0
+        if len(pdf_cells) > 0:
+            matches, matches_counter = self._intersection_over_pdf_match(
+                table_cells, pdf_cells
+            )
         self._log().debug("matches_counter: {}".format(matches_counter))
@@ -188,13 +193,14 @@ class CellMatcher:
             Dictionary with all details about the mathings between the table and pdf cells
         """
         pdf_cells = copy.deepcopy(iocr_page["tokens"])
-        for word in pdf_cells:
-            word["bbox"] = [
-                word["bbox"]["l"],
-                word["bbox"]["t"],
-                word["bbox"]["r"],
-                word["bbox"]["b"],
-            ]
+        if len(pdf_cells) > 0:
+            for word in pdf_cells:
+                word["bbox"] = [
+                    word["bbox"]["l"],
+                    word["bbox"]["t"],
+                    word["bbox"]["r"],
+                    word["bbox"]["b"],
+                ]
         table_bboxes = prediction["bboxes"]
         table_classes = prediction["classes"]

docling_ibm_models/tableformer/data_management/tf_predictor.py CHANGED Viewed

@@ -523,8 +523,9 @@ class TFPredictor:
         # return the resized image
         return resized, sf
-    def multi_table_predict(self, iocr_page, table_bboxes, do_matching=True):
-        # def multi_table_predict(self, iocr_page, page_image, table_bboxes):
+    def multi_table_predict(
+        self, iocr_page, table_bboxes, do_matching=True, correct_overlapping_cells=False
+    ):
         multi_tf_output = []
         page_image = iocr_page["image"]
@@ -546,7 +547,12 @@ class TFPredictor:
             # Predict
             if do_matching:
                 tf_responses, predict_details = self.predict(
-                    iocr_page, table_bbox, table_image, scale_factor, None
+                    iocr_page,
+                    table_bbox,
+                    table_image,
+                    scale_factor,
+                    None,
+                    correct_overlapping_cells,
                 )
             else:
                 tf_responses, predict_details = self.predict_dummy(
@@ -696,7 +702,12 @@ class TFPredictor:
             prediction["bboxes"] = corrected_bboxes
         # Match the cells
-        matching_details = {"table_cells": [], "matches": {}}
+        matching_details = {
+            "table_cells": [],
+            "matches": {},
+            "pdf_cells": [],
+            "prediction_bboxes_page": [],
+        }
         # Table bbox upscaling will scale predicted bboxes too within cell matcher
         scaled_table_bbox = [
@@ -728,7 +739,13 @@ class TFPredictor:
         return tf_output, matching_details
     def predict(
-        self, iocr_page, table_bbox, table_image, scale_factor, eval_res_preds=None
+        self,
+        iocr_page,
+        table_bbox,
+        table_image,
+        scale_factor,
+        eval_res_preds=None,
+        correct_overlapping_cells=False,
     ):
         r"""
         Predict the table out of an image in memory
@@ -739,6 +756,8 @@ class TFPredictor:
             Docling provided table data
         eval_res_preds : dict
             Ready predictions provided by the evaluation results
+        correct_overlapping_cells : boolean
+            Enables or disables last post-processing step, that fixes cell bboxes to remove overlap
         Returns
         -------
@@ -803,7 +822,12 @@ class TFPredictor:
             prediction["bboxes"] = corrected_bboxes
         # Match the cells
-        matching_details = {"table_cells": [], "matches": {}}
+        matching_details = {
+            "table_cells": [],
+            "matches": {},
+            "pdf_cells": [],
+            "prediction_bboxes_page": [],
+        }
         # Table bbox upscaling will scale predicted bboxes too within cell matcher
         scaled_table_bbox = [
@@ -819,10 +843,15 @@ class TFPredictor:
             )
         # Post-processing
         if len(prediction["bboxes"]) > 0:
-            if self.enable_post_process:
-                AggProfiler().begin("post_process", self._prof)
-                matching_details = self._post_processor.process(matching_details)
-                AggProfiler().end("post_process", self._prof)
+            if (
+                len(iocr_page["tokens"]) > 0
+            ):  # There are at least some pdf cells to match with
+                if self.enable_post_process:
+                    AggProfiler().begin("post_process", self._prof)
+                    matching_details = self._post_processor.process(
+                        matching_details, correct_overlapping_cells
+                    )
+                    AggProfiler().end("post_process", self._prof)
         # Generate the expected Docling responses
         AggProfiler().begin("generate_docling_response", self._prof)

docling_ibm_models/tableformer/models/table04_rs/bbox_decoder_rs.py CHANGED Viewed

@@ -157,7 +157,12 @@ class BBoxDecoder(nn.Module):
             predictions_classes.append(self._class_embed(h))
         if len(predictions_bboxes) > 0:
             predictions_bboxes = torch.stack([x[0] for x in predictions_bboxes])
+        else:
+            predictions_bboxes = torch.empty(0)
         if len(predictions_classes) > 0:
             predictions_classes = torch.stack([x[0] for x in predictions_classes])
+        else:
+            predictions_classes = torch.empty(0)
         return predictions_classes, predictions_bboxes

docling_ibm_models/tableformer/otsl.py CHANGED Viewed

@@ -123,6 +123,9 @@ def otsl_check_right(rs_split, x, y):
 def otsl_to_html(rs_list, logdebug):
+    if len(rs_list) == 0:
+        return []
     if rs_list[0] not in ["fcel", "ched", "rhed", "srow", "ecel"]:
         # Most likely already HTML...
         return rs_list

{docling_ibm_models-1.1.5.dist-info → docling_ibm_models-1.1.7.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: docling-ibm-models
-Version: 1.1.5
+Version: 1.1.7
 Summary: This package contains the AI models used by the Docling PDF conversion package
 License: MIT
 Keywords: docling,convert,document,pdf,layout model,segmentation,table structure,table former

{docling_ibm_models-1.1.5.dist-info → docling_ibm_models-1.1.7.dist-info}/RECORD RENAMED Viewed

@@ -4,20 +4,20 @@ docling_ibm_models/tableformer/common.py,sha256=RV2ptqgkfz1OIoN-WqiSeln0pkZ_7zTO
 docling_ibm_models/tableformer/data_management/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 docling_ibm_models/tableformer/data_management/data_transformer.py,sha256=lNKkAk0VALbixapCuDDSIQKtA0QPCGQF8AGO3D64new,18263
 docling_ibm_models/tableformer/data_management/functional.py,sha256=UrXsEm4DSc1QXdUPb0tZ7nvbg7mGVjpQhX3pGL6C5bA,20633
-docling_ibm_models/tableformer/data_management/matching_post_processor.py,sha256=-82B4xUJ9uxMDcsX2DJINTy3J0OB9rKXzHKtf-J3GHI,57205
-docling_ibm_models/tableformer/data_management/tf_cell_matcher.py,sha256=DFu428Cr84maT9WehdoZkpkJKeahwe5JlclvTC6fuVY,20870
+docling_ibm_models/tableformer/data_management/matching_post_processor.py,sha256=41GLMlkMAY1pkc-elP3ktFgZLCHjscghaHfgIVn2168,57998
+docling_ibm_models/tableformer/data_management/tf_cell_matcher.py,sha256=kzOjSmXkYrxc0de8wHbDJMvwKXelxYf4OccHTRqnpco,21081
 docling_ibm_models/tableformer/data_management/tf_dataset.py,sha256=6_qSsYt6qoE2JBzUNrJfCDX3Kgg7tyrv3kimGLdEQ5o,49890
-docling_ibm_models/tableformer/data_management/tf_predictor.py,sha256=LxRme9AWLZhQw7xP5Tpxwa5XFTY66m5IFS5v9VC30GA,38978
+docling_ibm_models/tableformer/data_management/tf_predictor.py,sha256=Ha--59Rfs3V78p3q__q5cuEoewrTld18qhX8VqAQrYc,39730
 docling_ibm_models/tableformer/data_management/transforms.py,sha256=_i1HXkX8LAuHbeGRrg8kF9yFNJRQZOKmWzxKt559ABQ,13268
 docling_ibm_models/tableformer/models/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 docling_ibm_models/tableformer/models/common/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 docling_ibm_models/tableformer/models/common/base_model.py,sha256=SbCjeEvDmGnyoKYhB5pYeg2LFVQdArglfrhqkuW1nUw,10030
 docling_ibm_models/tableformer/models/table04_rs/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-docling_ibm_models/tableformer/models/table04_rs/bbox_decoder_rs.py,sha256=mMZSGk0PjQ4_fhuP44_WJVzfxyLky6S3zlVxCrNKRgc,5991
+docling_ibm_models/tableformer/models/table04_rs/bbox_decoder_rs.py,sha256=JV9rFh9caT3qnwWlZ0CZpw5aiiNzyTbfVp6H6JMxS0Q,6117
 docling_ibm_models/tableformer/models/table04_rs/encoder04_rs.py,sha256=iExmqJ0Pn0lJU3nWb_x8abTn42GctMqE55_YA2ppgvc,1975
 docling_ibm_models/tableformer/models/table04_rs/tablemodel04_rs.py,sha256=7iGkrTNLzjC1yn1zuA3N6DvBvbrcO_BR5tmHG3RKmXs,12159
 docling_ibm_models/tableformer/models/table04_rs/transformer_rs.py,sha256=4106qxxH0w92CVOFzFuCb87tRMvqAUP3X3F1WT5Z47A,6371
-docling_ibm_models/tableformer/otsl.py,sha256=k8l1hYWvcCkcnWbLxuBUYEcigYBFTRqiM2GBAHcUDok,21024
+docling_ibm_models/tableformer/otsl.py,sha256=oE_s2QHTE74jXD0vsXCuya_woReabUOBg6npprEqt58,21069
 docling_ibm_models/tableformer/settings.py,sha256=UlpsP0cpJZR2Uk48lgysYy0om3fr8Xt3z1xzvlTw5j4,3067
 docling_ibm_models/tableformer/test_dataset_cache.py,sha256=zvVJvUnYz4GxAQfPUmLTHUbqj0Yhi2vwgOBnsRgt1rI,818
 docling_ibm_models/tableformer/test_prepare_image.py,sha256=oPmU93-yWIkCeUYulGQ1p676Vq-zcjw2EX24WA5lspA,3155
@@ -26,7 +26,7 @@ docling_ibm_models/tableformer/utils/app_profiler.py,sha256=13dvwo5byzfP2ejqGBFw
 docling_ibm_models/tableformer/utils/torch_utils.py,sha256=uN0rK9mSXy1ewBnBnILrWebJhhVU4N-XJZBqNiLJwlQ,8893
 docling_ibm_models/tableformer/utils/utils.py,sha256=8Bxf1rEn977lFbY9NX0r5xh9PvxIRipQZX_EZW92XfA,10980
 docling_ibm_models/tableformer/utils/variance.py,sha256=USjRwaMsCmzvc6PeWskaAJnUjbliRVd_MqNKLjMDQw8,4675
-docling_ibm_models-1.1.5.dist-info/LICENSE,sha256=ACwmltkrXIz5VsEQcrqljq-fat6ZXAMepjXGoe40KtE,1069
-docling_ibm_models-1.1.5.dist-info/METADATA,sha256=rMLyByq-Q0Z7F4izoMo3X9YEr4pVrCgOZPEnHtmTcvw,7172
-docling_ibm_models-1.1.5.dist-info/WHEEL,sha256=sP946D7jFCHeNz5Iq4fL4Lu-PrWrFsgfLXbbkciIZwg,88
-docling_ibm_models-1.1.5.dist-info/RECORD,,
+docling_ibm_models-1.1.7.dist-info/LICENSE,sha256=ACwmltkrXIz5VsEQcrqljq-fat6ZXAMepjXGoe40KtE,1069
+docling_ibm_models-1.1.7.dist-info/METADATA,sha256=o2f2zLxzqrkoDZ0gdBXDoCJNNJ3FyACeKIMemFE0LBs,7172
+docling_ibm_models-1.1.7.dist-info/WHEEL,sha256=sP946D7jFCHeNz5Iq4fL4Lu-PrWrFsgfLXbbkciIZwg,88
+docling_ibm_models-1.1.7.dist-info/RECORD,,

{docling_ibm_models-1.1.5.dist-info → docling_ibm_models-1.1.7.dist-info}/LICENSE RENAMED Viewed

File without changes

{docling_ibm_models-1.1.5.dist-info → docling_ibm_models-1.1.7.dist-info}/WHEEL RENAMED Viewed

File without changes

docling-ibm-models 1.1.5__py3-none-any.whl → 1.1.7__py3-none-any.whl

docling-ibm-models 1.1.5__py3-none-any.whl → 1.1.7__py3-none-any.whl