PyPI - docling-ibm-models - Versions diffs - 1.2.0__py3-none-any.whl → 1.2.1__py3-none-any.whl - Mend

docling-ibm-models 1.2.0__py3-none-any.whl → 1.2.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (7) hide show

docling_ibm_models/tableformer/data_management/tf_cell_matcher.py CHANGED Viewed

@@ -129,12 +129,15 @@ class CellMatcher:
         pdf_cells = copy.deepcopy(iocr_page["tokens"])
         if len(pdf_cells) > 0:
             for word in pdf_cells:
-                word["bbox"] = [
-                    word["bbox"]["l"],
-                    word["bbox"]["t"],
-                    word["bbox"]["r"],
-                    word["bbox"]["b"],
-                ]
+                if isinstance(word["bbox"], list):
+                    continue
+                elif isinstance(word["bbox"], dict):
+                    word["bbox"] = [
+                        word["bbox"]["l"],
+                        word["bbox"]["t"],
+                        word["bbox"]["r"],
+                        word["bbox"]["b"],
+                    ]
         table_bboxes = prediction["bboxes"]
         table_classes = prediction["classes"]
         # BBOXES transformed...

docling_ibm_models/tableformer/data_management/tf_predictor.py CHANGED Viewed

@@ -524,7 +524,12 @@ class TFPredictor:
         return resized, sf
     def multi_table_predict(
-        self, iocr_page, table_bboxes, do_matching=True, correct_overlapping_cells=False
+        self,
+        iocr_page,
+        table_bboxes,
+        do_matching=True,
+        correct_overlapping_cells=False,
+        sort_row_col_indexes=True,
     ):
         multi_tf_output = []
         page_image = iocr_page["image"]
@@ -563,56 +568,70 @@ class TFPredictor:
             # PROCESS PREDICTED RESULTS, TO TURN PREDICTED COL/ROW IDs into Indexes
             # Indexes should be in increasing order, without gaps
-            # Fix col/row indexes
-            # Arranges all col/row indexes sequentially without gaps using input IDs
-            indexing_start_cols = []  # Index of original start col IDs (not indexes)
-            indexing_end_cols = []  # Index of original end col IDs (not indexes)
-            indexing_start_rows = []  # Index of original start row IDs (not indexes)
-            indexing_end_rows = []  # Index of original end row IDs (not indexes)
-            # First, collect all possible predicted IDs, to be used as indexes
-            # ID's returned by Tableformer are sequential, but might contain gaps
-            for tf_response_cell in tf_responses:
-                start_col_offset_idx = tf_response_cell["start_col_offset_idx"]
-                end_col_offset_idx = tf_response_cell["end_col_offset_idx"]
-                start_row_offset_idx = tf_response_cell["start_row_offset_idx"]
-                end_row_offset_idx = tf_response_cell["end_row_offset_idx"]
-                # Collect all possible col/row IDs:
-                if start_col_offset_idx not in indexing_start_cols:
-                    indexing_start_cols.append(start_col_offset_idx)
-                if end_col_offset_idx not in indexing_end_cols:
-                    indexing_end_cols.append(end_col_offset_idx)
-                if start_row_offset_idx not in indexing_start_rows:
-                    indexing_start_rows.append(start_row_offset_idx)
-                if end_row_offset_idx not in indexing_end_rows:
-                    indexing_end_rows.append(end_row_offset_idx)
-            indexing_start_cols.sort()
-            indexing_end_cols.sort()
-            indexing_start_rows.sort()
-            indexing_end_rows.sort()
-            # After this - put actual indexes of IDs back into predicted structure...
-            for tf_response_cell in tf_responses:
-                tf_response_cell["start_col_offset_idx"] = indexing_start_cols.index(
-                    tf_response_cell["start_col_offset_idx"]
-                )
-                tf_response_cell["end_col_offset_idx"] = (
-                    tf_response_cell["start_col_offset_idx"]
-                    + tf_response_cell["col_span"]
-                )
-                tf_response_cell["start_row_offset_idx"] = indexing_start_rows.index(
-                    tf_response_cell["start_row_offset_idx"]
-                )
-                tf_response_cell["end_row_offset_idx"] = (
-                    tf_response_cell["start_row_offset_idx"]
-                    + tf_response_cell["row_span"]
-                )
-            # Counting matched cols/rows from actual indexes (and not ids)
-            predict_details["num_cols"] = len(indexing_end_cols)
-            predict_details["num_rows"] = len(indexing_end_rows)
+            if sort_row_col_indexes:
+                # Fix col/row indexes
+                # Arranges all col/row indexes sequentially without gaps using input IDs
+                indexing_start_cols = (
+                    []
+                )  # Index of original start col IDs (not indexes)
+                indexing_end_cols = []  # Index of original end col IDs (not indexes)
+                indexing_start_rows = (
+                    []
+                )  # Index of original start row IDs (not indexes)
+                indexing_end_rows = []  # Index of original end row IDs (not indexes)
+                # First, collect all possible predicted IDs, to be used as indexes
+                # ID's returned by Tableformer are sequential, but might contain gaps
+                for tf_response_cell in tf_responses:
+                    start_col_offset_idx = tf_response_cell["start_col_offset_idx"]
+                    end_col_offset_idx = tf_response_cell["end_col_offset_idx"]
+                    start_row_offset_idx = tf_response_cell["start_row_offset_idx"]
+                    end_row_offset_idx = tf_response_cell["end_row_offset_idx"]
+                    # Collect all possible col/row IDs:
+                    if start_col_offset_idx not in indexing_start_cols:
+                        indexing_start_cols.append(start_col_offset_idx)
+                    if end_col_offset_idx not in indexing_end_cols:
+                        indexing_end_cols.append(end_col_offset_idx)
+                    if start_row_offset_idx not in indexing_start_rows:
+                        indexing_start_rows.append(start_row_offset_idx)
+                    if end_row_offset_idx not in indexing_end_rows:
+                        indexing_end_rows.append(end_row_offset_idx)
+                indexing_start_cols.sort()
+                indexing_end_cols.sort()
+                indexing_start_rows.sort()
+                indexing_end_rows.sort()
+                # After this - put actual indexes of IDs back into predicted structure...
+                for tf_response_cell in tf_responses:
+                    tf_response_cell["start_col_offset_idx"] = (
+                        indexing_start_cols.index(
+                            tf_response_cell["start_col_offset_idx"]
+                        )
+                    )
+                    tf_response_cell["end_col_offset_idx"] = (
+                        tf_response_cell["start_col_offset_idx"]
+                        + tf_response_cell["col_span"]
+                    )
+                    tf_response_cell["start_row_offset_idx"] = (
+                        indexing_start_rows.index(
+                            tf_response_cell["start_row_offset_idx"]
+                        )
+                    )
+                    tf_response_cell["end_row_offset_idx"] = (
+                        tf_response_cell["start_row_offset_idx"]
+                        + tf_response_cell["row_span"]
+                    )
+                # Counting matched cols/rows from actual indexes (and not ids)
+                predict_details["num_cols"] = len(indexing_end_cols)
+                predict_details["num_rows"] = len(indexing_end_rows)
+            else:
+                otsl_seq = predict_details["prediction"]["rs_seq"]
+                predict_details["num_cols"] = otsl_seq.index("nl")
+                predict_details["num_rows"] = otsl_seq.count("nl")
             # Put results into multi_tf_output
             multi_tf_output.append(
                 {"tf_responses": tf_responses, "predict_details": predict_details}
@@ -667,13 +686,20 @@ class TFPredictor:
                 )
                 if outputs_coord is not None:
-                    bbox_pred = u.box_cxcywh_to_xyxy(outputs_coord)
-                    prediction["bboxes"] = bbox_pred.tolist()
+                    if len(outputs_coord) == 0:
+                        prediction["bboxes"] = []
+                    else:
+                        bbox_pred = u.box_cxcywh_to_xyxy(outputs_coord)
+                        prediction["bboxes"] = bbox_pred.tolist()
                 else:
                     prediction["bboxes"] = []
                 if outputs_class is not None:
-                    result_class = torch.argmax(outputs_class, dim=1)
-                    prediction["classes"] = result_class.tolist()
+                    if len(outputs_class) == 0:
+                        prediction["classes"] = []
+                    else:
+                        result_class = torch.argmax(outputs_class, dim=1)
+                        prediction["classes"] = result_class.tolist()
                 else:
                     prediction["classes"] = []
                 if self._remove_padding:
@@ -788,13 +814,20 @@ class TFPredictor:
                 )
                 if outputs_coord is not None:
-                    bbox_pred = u.box_cxcywh_to_xyxy(outputs_coord)
-                    prediction["bboxes"] = bbox_pred.tolist()
+                    if len(outputs_coord) == 0:
+                        prediction["bboxes"] = []
+                    else:
+                        bbox_pred = u.box_cxcywh_to_xyxy(outputs_coord)
+                        prediction["bboxes"] = bbox_pred.tolist()
                 else:
                     prediction["bboxes"] = []
                 if outputs_class is not None:
-                    result_class = torch.argmax(outputs_class, dim=1)
-                    prediction["classes"] = result_class.tolist()
+                    if len(outputs_class) == 0:
+                        prediction["classes"] = []
+                    else:
+                        result_class = torch.argmax(outputs_class, dim=1)
+                        prediction["classes"] = result_class.tolist()
                 else:
                     prediction["classes"] = []
                 if self._remove_padding:

docling_ibm_models/tableformer/models/table04_rs/tablemodel04_rs.py CHANGED Viewed

@@ -308,8 +308,12 @@ class TableModel04_rs(BaseModel, nn.Module):
         if len(outputs_coord1) > 0:
             outputs_coord1 = torch.stack(outputs_coord1)
+        else:
+            outputs_coord1 = torch.empty(0)
         if len(outputs_class1) > 0:
             outputs_class1 = torch.stack(outputs_class1)
+        else:
+            outputs_class1 = torch.empty(0)
         outputs_class = outputs_class1
         outputs_coord = outputs_coord1

{docling_ibm_models-1.2.0.dist-info → docling_ibm_models-1.2.1.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: docling-ibm-models
-Version: 1.2.0
+Version: 1.2.1
 Summary: This package contains the AI models used by the Docling PDF conversion package
 License: MIT
 Keywords: docling,convert,document,pdf,layout model,segmentation,table structure,table former

{docling_ibm_models-1.2.0.dist-info → docling_ibm_models-1.2.1.dist-info}/RECORD RENAMED Viewed

@@ -5,9 +5,9 @@ docling_ibm_models/tableformer/data_management/__init__.py,sha256=47DEQpj8HBSa-_
 docling_ibm_models/tableformer/data_management/data_transformer.py,sha256=lNKkAk0VALbixapCuDDSIQKtA0QPCGQF8AGO3D64new,18263
 docling_ibm_models/tableformer/data_management/functional.py,sha256=UrXsEm4DSc1QXdUPb0tZ7nvbg7mGVjpQhX3pGL6C5bA,20633
 docling_ibm_models/tableformer/data_management/matching_post_processor.py,sha256=41GLMlkMAY1pkc-elP3ktFgZLCHjscghaHfgIVn2168,57998
-docling_ibm_models/tableformer/data_management/tf_cell_matcher.py,sha256=kzOjSmXkYrxc0de8wHbDJMvwKXelxYf4OccHTRqnpco,21081
+docling_ibm_models/tableformer/data_management/tf_cell_matcher.py,sha256=GaBW5px3xX9JaHVASZArKiQ-qfrzX0oj-E_6P3-OvuU,21238
 docling_ibm_models/tableformer/data_management/tf_dataset.py,sha256=6_qSsYt6qoE2JBzUNrJfCDX3Kgg7tyrv3kimGLdEQ5o,49890
-docling_ibm_models/tableformer/data_management/tf_predictor.py,sha256=Ha--59Rfs3V78p3q__q5cuEoewrTld18qhX8VqAQrYc,39730
+docling_ibm_models/tableformer/data_management/tf_predictor.py,sha256=32rox4--vqFddCG6oJ1_RQpIoc8nmq4ADvPpgphVR60,40959
 docling_ibm_models/tableformer/data_management/transforms.py,sha256=_i1HXkX8LAuHbeGRrg8kF9yFNJRQZOKmWzxKt559ABQ,13268
 docling_ibm_models/tableformer/models/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 docling_ibm_models/tableformer/models/common/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -15,7 +15,7 @@ docling_ibm_models/tableformer/models/common/base_model.py,sha256=SbCjeEvDmGnyoK
 docling_ibm_models/tableformer/models/table04_rs/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 docling_ibm_models/tableformer/models/table04_rs/bbox_decoder_rs.py,sha256=JV9rFh9caT3qnwWlZ0CZpw5aiiNzyTbfVp6H6JMxS0Q,6117
 docling_ibm_models/tableformer/models/table04_rs/encoder04_rs.py,sha256=iExmqJ0Pn0lJU3nWb_x8abTn42GctMqE55_YA2ppgvc,1975
-docling_ibm_models/tableformer/models/table04_rs/tablemodel04_rs.py,sha256=7iGkrTNLzjC1yn1zuA3N6DvBvbrcO_BR5tmHG3RKmXs,12159
+docling_ibm_models/tableformer/models/table04_rs/tablemodel04_rs.py,sha256=FtmWZNOKjQFLG5GtBCvvU23rWrIsDu3gqfcfl68soPg,12275
 docling_ibm_models/tableformer/models/table04_rs/transformer_rs.py,sha256=nhnYFlXT5KyJMdB4qMo5r8GimWXVy0lcqcmoHPEl-KE,6416
 docling_ibm_models/tableformer/otsl.py,sha256=oE_s2QHTE74jXD0vsXCuya_woReabUOBg6npprEqt58,21069
 docling_ibm_models/tableformer/settings.py,sha256=UlpsP0cpJZR2Uk48lgysYy0om3fr8Xt3z1xzvlTw5j4,3067
@@ -26,7 +26,7 @@ docling_ibm_models/tableformer/utils/app_profiler.py,sha256=Pb7o1zcikKXh7ninaNt4
 docling_ibm_models/tableformer/utils/mem_monitor.py,sha256=ycZ07fUBVVKKLTVGF54jGPDM2aTkKuZWk1kMbOS0wwQ,6353
 docling_ibm_models/tableformer/utils/torch_utils.py,sha256=uN0rK9mSXy1ewBnBnILrWebJhhVU4N-XJZBqNiLJwlQ,8893
 docling_ibm_models/tableformer/utils/utils.py,sha256=8Bxf1rEn977lFbY9NX0r5xh9PvxIRipQZX_EZW92XfA,10980
-docling_ibm_models-1.2.0.dist-info/LICENSE,sha256=mBb7ErEcM8VS9OhiGHnQ2kk75HwPhr54W1Oiz3965MY,1088
-docling_ibm_models-1.2.0.dist-info/METADATA,sha256=j_ccZliZ-e99bOg1MVoshV2f_ZxmfqKsIE-JRW2N2tI,7172
-docling_ibm_models-1.2.0.dist-info/WHEEL,sha256=sP946D7jFCHeNz5Iq4fL4Lu-PrWrFsgfLXbbkciIZwg,88
-docling_ibm_models-1.2.0.dist-info/RECORD,,
+docling_ibm_models-1.2.1.dist-info/LICENSE,sha256=mBb7ErEcM8VS9OhiGHnQ2kk75HwPhr54W1Oiz3965MY,1088
+docling_ibm_models-1.2.1.dist-info/METADATA,sha256=xYeasIJ2_l_UYBLsElHklPP9-VTn2ppFRVFIaKRDpj4,7172
+docling_ibm_models-1.2.1.dist-info/WHEEL,sha256=sP946D7jFCHeNz5Iq4fL4Lu-PrWrFsgfLXbbkciIZwg,88
+docling_ibm_models-1.2.1.dist-info/RECORD,,

{docling_ibm_models-1.2.0.dist-info → docling_ibm_models-1.2.1.dist-info}/LICENSE RENAMED Viewed

File without changes

{docling_ibm_models-1.2.0.dist-info → docling_ibm_models-1.2.1.dist-info}/WHEEL RENAMED Viewed

File without changes

docling-ibm-models 1.2.0__py3-none-any.whl → 1.2.1__py3-none-any.whl

docling-ibm-models 1.2.0__py3-none-any.whl → 1.2.1__py3-none-any.whl