PyPI - paddlex - Versions diffs - 3.0.1__py3-none-any.whl → 3.0.3__py3-none-any.whl - Mend

paddlex 3.0.1__py3-none-any.whl → 3.0.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (37)

paddlex/.version +1 -1
paddlex/inference/models/base/predictor/base_predictor.py +2 -0
paddlex/inference/models/common/static_infer.py +20 -14
paddlex/inference/models/common/ts/funcs.py +19 -8
paddlex/inference/models/formula_recognition/predictor.py +1 -1
paddlex/inference/models/formula_recognition/processors.py +2 -2
paddlex/inference/models/text_recognition/result.py +1 -1
paddlex/inference/pipelines/layout_parsing/layout_objects.py +859 -0
paddlex/inference/pipelines/layout_parsing/pipeline_v2.py +144 -205
paddlex/inference/pipelines/layout_parsing/result_v2.py +13 -272
paddlex/inference/pipelines/layout_parsing/setting.py +1 -0
paddlex/inference/pipelines/layout_parsing/utils.py +108 -312
paddlex/inference/pipelines/layout_parsing/xycut_enhanced/utils.py +302 -247
paddlex/inference/pipelines/layout_parsing/xycut_enhanced/xycuts.py +156 -104
paddlex/inference/pipelines/ocr/result.py +2 -2
paddlex/inference/pipelines/pp_chatocr/pipeline_v4.py +1 -1
paddlex/inference/serving/basic_serving/_app.py +47 -13
paddlex/inference/serving/infra/utils.py +22 -17
paddlex/inference/utils/hpi.py +60 -25
paddlex/inference/utils/hpi_model_info_collection.json +627 -204
paddlex/inference/utils/misc.py +20 -0
paddlex/inference/utils/mkldnn_blocklist.py +36 -2
paddlex/inference/utils/official_models.py +126 -5
paddlex/inference/utils/pp_option.py +81 -21
paddlex/modules/semantic_segmentation/dataset_checker/__init__.py +12 -2
paddlex/ops/__init__.py +6 -3
paddlex/utils/deps.py +2 -2
paddlex/utils/device.py +4 -19
paddlex/utils/download.py +10 -7
paddlex/utils/flags.py +9 -0
paddlex/utils/subclass_register.py +2 -2
{paddlex-3.0.1.dist-info → paddlex-3.0.3.dist-info}/METADATA +307 -162
{paddlex-3.0.1.dist-info → paddlex-3.0.3.dist-info}/RECORD +37 -35
{paddlex-3.0.1.dist-info → paddlex-3.0.3.dist-info}/WHEEL +1 -1
{paddlex-3.0.1.dist-info → paddlex-3.0.3.dist-info}/entry_points.txt +1 -0
{paddlex-3.0.1.dist-info/licenses → paddlex-3.0.3.dist-info}/LICENSE +0 -0
{paddlex-3.0.1.dist-info → paddlex-3.0.3.dist-info}/top_level.txt +0 -0

paddlex/inference/pipelines/layout_parsing/xycut_enhanced/xycuts.py CHANGED Viewed

@@ -17,11 +17,14 @@ from typing import Dict, List, Tuple
 import numpy as np
-from ..result_v2 import LayoutParsingBlock, LayoutParsingRegion
-from ..setting import BLOCK_LABEL_MAP
+from ..layout_objects import LayoutBlock, LayoutRegion
+from ..setting import BLOCK_LABEL_MAP, XYCUT_SETTINGS
 from ..utils import calculate_overlap_ratio, calculate_projection_overlap_ratio
 from .utils import (
     calculate_discontinuous_projection,
+    euclidean_insert,
+    find_local_minima_flat_regions,
+    get_blocks_by_direction_interval,
     get_cut_blocks,
     insert_child_blocks,
     manhattan_insert,
@@ -31,16 +34,16 @@ from .utils import (
     reference_insert,
     shrink_overlapping_boxes,
     sort_normal_blocks,
-    split_projection_profile,
     update_doc_title_child_blocks,
     update_paragraph_title_child_blocks,
+    update_region_child_blocks,
     update_vision_child_blocks,
     weighted_distance_insert,
 )
 def pre_process(
-    region: LayoutParsingRegion,
+    region: LayoutRegion,
 ) -> List:
     """
     Preprocess the layout for sorting purposes.
@@ -63,10 +66,11 @@ def pre_process(
         "sub_paragraph_title",
         "doc_title_text",
         "vision_title",
+        "sub_region",
     ]
     pre_cut_block_idxes = []
     block_map = region.block_map
-    blocks: List[LayoutParsingBlock] = list(block_map.values())
+    blocks: List[LayoutBlock] = list(block_map.values())
     for block in blocks:
         if block.order_label not in mask_labels:
             update_region_label(block, region)
@@ -83,7 +87,6 @@ def pre_process(
         ) / 2
         center_offset = abs(block_center - region.direction_center_coordinate)
         is_centered = center_offset <= tolerance_len
         if is_centered:
             pre_cut_block_idxes.append(block.index)
@@ -121,60 +124,83 @@ def pre_process(
                             block.secondary_direction_start_coordinate
                         )
                         cut_coordinates.append(block.secondary_direction_end_coordinate)
-    secondary_discontinuous = calculate_discontinuous_projection(
-        all_boxes, direction=region.direction
+    secondary_check_bboxes = np.array(
+        [
+            block.bbox
+            for block in blocks
+            if block.order_label not in mask_labels + ["vision"]
+        ]
     )
-    if len(secondary_discontinuous) == 1:
-        if not discontinuous:
-            discontinuous = calculate_discontinuous_projection(
-                all_boxes, direction=cut_direction
-            )
-        current_interval = discontinuous[0]
-        for interval in discontinuous[1:]:
-            gap_len = interval[0] - current_interval[1]
-            if gap_len >= region.text_line_height * 3:
-                cut_coordinates.append(current_interval[1])
-            elif gap_len > region.text_line_height * 1.2:
-                (pre_blocks, post_blocks) = get_cut_blocks(
-                    list(block_map.values()), cut_direction, [current_interval[1]], []
-                )
-                pre_bboxes = np.array([block.bbox for block in pre_blocks])
-                post_bboxes = np.array([block.bbox for block in post_blocks])
-                projection_index = 1 if cut_direction == "horizontal" else 0
-                pre_projection = projection_by_bboxes(pre_bboxes, projection_index)
-                post_projection = projection_by_bboxes(post_bboxes, projection_index)
-                pre_projection_min = np.min(pre_projection)
-                post_projection_min = np.min(post_projection)
-                pre_projection_min += 5 if pre_projection_min != 0 else 0
-                post_projection_min += 5 if post_projection_min != 0 else 0
-                pre_intervals = split_projection_profile(
-                    pre_projection, pre_projection_min, 1
-                )
-                post_intervals = split_projection_profile(
-                    post_projection, post_projection_min, 1
+    if len(secondary_check_bboxes) > 0 or blocks[0].label == "region":
+        secondary_discontinuous = calculate_discontinuous_projection(
+            secondary_check_bboxes, direction=region.direction
+        )
+        if len(secondary_discontinuous) == 1 or blocks[0].label == "region":
+            if not discontinuous:
+                discontinuous = calculate_discontinuous_projection(
+                    all_boxes, direction=cut_direction
                 )
-                pre_gap_boxes = []
-                if pre_intervals is not None:
-                    for start, end in zip(*pre_intervals):
-                        bbox = [0] * 4
-                        bbox[projection_index] = start
-                        bbox[projection_index + 2] = end
-                        pre_gap_boxes.append(bbox)
-                post_gap_boxes = []
-                if post_intervals is not None:
-                    for start, end in zip(*post_intervals):
-                        bbox = [0] * 4
-                        bbox[projection_index] = start
-                        bbox[projection_index + 2] = end
-                        post_gap_boxes.append(bbox)
-                max_gap_boxes_num = max(len(pre_gap_boxes), len(post_gap_boxes))
-                if max_gap_boxes_num > 0:
-                    discontinuous_intervals = calculate_discontinuous_projection(
-                        pre_gap_boxes + post_gap_boxes, direction=region.direction
+            current_interval = discontinuous[0]
+            pre_cut_coordinates = [
+                cood for cood in cut_coordinates if cood < current_interval[1]
+            ]
+            if not pre_cut_coordinates:
+                pre_cut_coordinate = 0
+            else:
+                pre_cut_coordinate = max(pre_cut_coordinates)
+            pre_cut_coordinate = max(current_interval[0], pre_cut_coordinate)
+            for interval in discontinuous[1:]:
+                gap_len = interval[0] - current_interval[1]
+                if (
+                    gap_len >= region.text_line_height * 3
+                    or blocks[0].label == "region"
+                ):
+                    cut_coordinates.append(current_interval[1])
+                elif gap_len > region.text_line_height * 1.2:
+                    pre_blocks = get_blocks_by_direction_interval(
+                        list(block_map.values()),
+                        pre_cut_coordinate,
+                        current_interval[1],
+                        cut_direction,
+                    )
+                    post_blocks = get_blocks_by_direction_interval(
+                        list(block_map.values()),
+                        current_interval[1],
+                        interval[1],
+                        cut_direction,
                     )
-                    if len(discontinuous_intervals) != max_gap_boxes_num:
-                        cut_coordinates.append(current_interval[1])
-            current_interval = interval
+                    pre_bboxes = np.array([block.bbox for block in pre_blocks])
+                    post_bboxes = np.array([block.bbox for block in post_blocks])
+                    projection_index = 1 if cut_direction == "horizontal" else 0
+                    pre_projection = projection_by_bboxes(pre_bboxes, projection_index)
+                    post_projection = projection_by_bboxes(
+                        post_bboxes, projection_index
+                    )
+                    pre_intervals = find_local_minima_flat_regions(pre_projection)
+                    post_intervals = find_local_minima_flat_regions(post_projection)
+                    pre_gap_boxes = []
+                    if pre_intervals is not None:
+                        for start, end in pre_intervals:
+                            bbox = [0] * 4
+                            bbox[projection_index] = start
+                            bbox[projection_index + 2] = end
+                            pre_gap_boxes.append(bbox)
+                    post_gap_boxes = []
+                    if post_intervals is not None:
+                        for start, end in post_intervals:
+                            bbox = [0] * 4
+                            bbox[projection_index] = start
+                            bbox[projection_index + 2] = end
+                            post_gap_boxes.append(bbox)
+                    max_gap_boxes_num = max(len(pre_gap_boxes), len(post_gap_boxes))
+                    if max_gap_boxes_num > 0:
+                        discontinuous_intervals = calculate_discontinuous_projection(
+                            pre_gap_boxes + post_gap_boxes, direction=region.direction
+                        )
+                        if len(discontinuous_intervals) != max_gap_boxes_num:
+                            pre_cut_coordinate = current_interval[1]
+                            cut_coordinates.append(current_interval[1])
+                current_interval = interval
     cut_list = get_cut_blocks(blocks, cut_direction, cut_coordinates, mask_labels)
     pre_cut_list.extend(cut_list)
     if region.direction == "vertical":
@@ -184,14 +210,14 @@ def pre_process(
 def update_region_label(
-    block: LayoutParsingBlock,
-    region: LayoutParsingRegion,
+    block: LayoutBlock,
+    region: LayoutRegion,
 ) -> None:
     """
     Update the region label of a block based on its label and match the block with its children.
     Args:
-        blocks (List[LayoutParsingBlock]): The list of blocks to process.
+        blocks (List[LayoutBlock]): The list of blocks to process.
         config (Dict[str, Any]): The configuration dictionary containing the necessary information.
         block_idx (int): The index of the current block being processed.
@@ -210,17 +236,18 @@ def update_region_label(
     elif block.label in BLOCK_LABEL_MAP["vision_labels"]:
         block.order_label = "vision"
         block.num_of_lines = 1
-        block.direction = region.direction
-        block.update_direction_info()
+        block.update_direction(region.direction)
     elif block.label in BLOCK_LABEL_MAP["footer_labels"]:
         block.order_label = "footer"
     elif block.label in BLOCK_LABEL_MAP["unordered_labels"]:
         block.order_label = "unordered"
+    elif block.label == "region":
+        block.order_label = "region"
     else:
         block.order_label = "normal_text"
     # only vision and doc title block can have child block
-    if block.order_label not in ["vision", "doc_title", "paragraph_title"]:
+    if block.order_label not in ["vision", "doc_title", "paragraph_title", "region"]:
         return
     # match doc title text block
@@ -232,10 +259,12 @@ def update_region_label(
     # match vision title block and vision footnote block
     elif block.order_label == "vision":
         update_vision_child_blocks(block, region)
+    elif block.order_label == "region":
+        update_region_child_blocks(block, region)
 def get_layout_structure(
-    blocks: List[LayoutParsingBlock],
+    blocks: List[LayoutBlock],
     region_direction: str,
     region_secondary_direction: str,
 ) -> Tuple[List[Dict[str, any]], bool]:
@@ -263,11 +292,11 @@ def get_layout_structure(
                 continue
             bbox_iou = calculate_overlap_ratio(block.bbox, ref_block.bbox)
-            if bbox_iou > 0:
+            if bbox_iou:
                 if ref_block.order_label == "vision":
                     ref_block.order_label = "cross_layout"
                     break
-                if block.order_label == "vision" or block.area < ref_block.area:
+                if bbox_iou > 0.1 and block.area < ref_block.area:
                     block.order_label = "cross_layout"
                     break
@@ -320,13 +349,19 @@ def get_layout_structure(
                         and ref_match_projection_iou == 0
                         and secondary_direction_ref_match_projection_overlap_ratio > 0
                     ):
-                        if block.order_label == "vision" or (
+                        if block.order_label in ["vision", "region"] or (
                             ref_block.order_label == "normal_text"
                             and second_ref_block.order_label == "normal_text"
-                            and ref_block.text_line_width
-                            > ref_block.text_line_height * 5
-                            and second_ref_block.text_line_width
-                            > second_ref_block.text_line_height * 5
+                            and ref_block.long_side_length
+                            > ref_block.text_line_height
+                            * XYCUT_SETTINGS.get(
+                                "cross_layout_ref_text_block_words_num_threshold", 8
+                            )
+                            and second_ref_block.long_side_length
+                            > second_ref_block.text_line_height
+                            * XYCUT_SETTINGS.get(
+                                "cross_layout_ref_text_block_words_num_threshold", 8
+                            )
                         ):
                             block.order_label = (
                                 "cross_reference"
@@ -374,20 +409,20 @@ def sort_by_xycut(
 def match_unsorted_blocks(
-    sorted_blocks: List[LayoutParsingBlock],
-    unsorted_blocks: List[LayoutParsingBlock],
-    region: LayoutParsingRegion,
-) -> List[LayoutParsingBlock]:
+    sorted_blocks: List[LayoutBlock],
+    unsorted_blocks: List[LayoutBlock],
+    region: LayoutRegion,
+) -> List[LayoutBlock]:
     """
     Match special blocks with the sorted blocks based on their region labels.
     Args:
-        sorted_blocks (List[LayoutParsingBlock]): Sorted blocks to be matched.
-        unsorted_blocks (List[LayoutParsingBlock]): Unsorted blocks to be matched.
+        sorted_blocks (List[LayoutBlock]): Sorted blocks to be matched.
+        unsorted_blocks (List[LayoutBlock]): Unsorted blocks to be matched.
         config (Dict): Configuration dictionary containing various parameters.
         median_width (int): Median width value used for calculations.
     Returns:
-        List[LayoutParsingBlock]: The updated sorted blocks after matching special blocks.
+        List[LayoutBlock]: The updated sorted blocks after matching special blocks.
     """
     distance_type_map = {
         "cross_layout": weighted_distance_insert,
@@ -398,6 +433,7 @@ def match_unsorted_blocks(
         "cross_reference": reference_insert,
         "unordered": manhattan_insert,
         "other": manhattan_insert,
+        "region": euclidean_insert,
     }
     unsorted_blocks = sort_normal_blocks(
@@ -407,17 +443,19 @@ def match_unsorted_blocks(
         region.direction,
     )
     for idx, block in enumerate(unsorted_blocks):
-        order_label = block.order_label
+        order_label = block.order_label if block.label != "region" else "region"
         if idx == 0 and order_label == "doc_title":
             sorted_blocks.insert(0, block)
             continue
-        sorted_blocks = distance_type_map[order_label](block, sorted_blocks, region)
+        sorted_blocks = distance_type_map[order_label](
+            block=block, sorted_blocks=sorted_blocks, region=region
+        )
     return sorted_blocks
 def xycut_enhanced(
-    region: LayoutParsingRegion,
-) -> LayoutParsingRegion:
+    region: LayoutRegion,
+) -> LayoutRegion:
     """
     xycut_enhance function performs the following steps:
         1. Preprocess the input blocks by extracting headers, footers, and pre-cut blocks.
@@ -428,34 +466,34 @@ def xycut_enhanced(
         6. Return the ordered result list.
     Args:
-        blocks (List[LayoutParsingBlock]): Input blocks to be processed.
+        blocks (List[LayoutBlock]): Input blocks to be processed.
     Returns:
-        List[LayoutParsingBlock]: Ordered result list after processing.
+        List[LayoutBlock]: Ordered result list after processing.
     """
     if len(region.block_map) == 0:
         return []
-    pre_cut_list: List[List[LayoutParsingBlock]] = pre_process(region)
-    final_order_res_list: List[LayoutParsingBlock] = []
+    pre_cut_list: List[List[LayoutBlock]] = pre_process(region)
+    final_order_res_list: List[LayoutBlock] = []
-    header_blocks: List[LayoutParsingBlock] = [
+    header_blocks: List[LayoutBlock] = [
         region.block_map[idx] for idx in region.header_block_idxes
     ]
-    unordered_blocks: List[LayoutParsingBlock] = [
+    unordered_blocks: List[LayoutBlock] = [
         region.block_map[idx] for idx in region.unordered_block_idxes
     ]
-    footer_blocks: List[LayoutParsingBlock] = [
+    footer_blocks: List[LayoutBlock] = [
         region.block_map[idx] for idx in region.footer_block_idxes
     ]
-    header_blocks: List[LayoutParsingBlock] = sort_normal_blocks(
+    header_blocks: List[LayoutBlock] = sort_normal_blocks(
         header_blocks, region.text_line_height, region.text_line_width, region.direction
     )
-    footer_blocks: List[LayoutParsingBlock] = sort_normal_blocks(
+    footer_blocks: List[LayoutBlock] = sort_normal_blocks(
         footer_blocks, region.text_line_height, region.text_line_width, region.direction
     )
-    unordered_blocks: List[LayoutParsingBlock] = sort_normal_blocks(
+    unordered_blocks: List[LayoutBlock] = sort_normal_blocks(
         unordered_blocks,
         region.text_line_height,
         region.text_line_width,
@@ -463,16 +501,26 @@ def xycut_enhanced(
     )
     final_order_res_list.extend(header_blocks)
-    unsorted_blocks: List[LayoutParsingBlock] = []
-    sorted_blocks_by_pre_cuts: List[LayoutParsingBlock] = []
+    unsorted_blocks: List[LayoutBlock] = []
+    sorted_blocks_by_pre_cuts: List[LayoutBlock] = []
     for pre_cut_blocks in pre_cut_list:
-        sorted_blocks: List[LayoutParsingBlock] = []
-        doc_title_blocks: List[LayoutParsingBlock] = []
-        xy_cut_blocks: List[LayoutParsingBlock] = []
+        sorted_blocks: List[LayoutBlock] = []
+        doc_title_blocks: List[LayoutBlock] = []
+        xy_cut_blocks: List[LayoutBlock] = []
-        get_layout_structure(
-            pre_cut_blocks, region.direction, region.secondary_direction
-        )
+        if pre_cut_blocks and pre_cut_blocks[0].label == "region":
+            block_bboxes = np.array([block.bbox for block in pre_cut_blocks])
+            discontinuous = calculate_discontinuous_projection(
+                block_bboxes, direction=region.direction
+            )
+            if len(discontinuous) == 1:
+                get_layout_structure(
+                    pre_cut_blocks, region.direction, region.secondary_direction
+                )
+        else:
+            get_layout_structure(
+                pre_cut_blocks, region.direction, region.secondary_direction
+            )
         # Get xy cut blocks and add other blocks in special_block_map
         for block in pre_cut_blocks:
@@ -494,8 +542,6 @@ def xycut_enhanced(
             discontinuous = calculate_discontinuous_projection(
                 block_bboxes, direction=region.direction
             )
-            if len(discontinuous) > 1:
-                xy_cut_blocks = [block for block in xy_cut_blocks]
             blocks_to_sort = deepcopy(xy_cut_blocks)
             if region.direction == "vertical":
                 for block in blocks_to_sort:
@@ -526,7 +572,7 @@ def xycut_enhanced(
                     )
                 )
                 blocks_to_sort = shrink_overlapping_boxes(
-                    blocks_to_sort, region.direction
+                    blocks_to_sort, region.secondary_direction
                 )
                 block_bboxes = np.array([block.bbox for block in blocks_to_sort])
                 sorted_indexes = sort_by_xycut(
@@ -536,13 +582,19 @@ def xycut_enhanced(
             sorted_blocks = [
                 region.block_map[blocks_to_sort[i].index] for i in sorted_indexes
             ]
         sorted_blocks = match_unsorted_blocks(
             sorted_blocks,
             doc_title_blocks,
             region=region,
         )
+        if unsorted_blocks and unsorted_blocks[0].label == "region":
+            sorted_blocks = match_unsorted_blocks(
+                sorted_blocks,
+                unsorted_blocks,
+                region=region,
+            )
+            unsorted_blocks = []
         sorted_blocks_by_pre_cuts.extend(sorted_blocks)
     final_sorted_blocks = match_unsorted_blocks(

paddlex/inference/pipelines/ocr/result.py CHANGED Viewed

@@ -206,10 +206,10 @@ def draw_box_txt_fine(
         np.ndarray: An image with the text drawn in the specified box.
     """
     box_height = int(
-        math.sqrt((box[0][0] - box[3][0]) ** 2 + (box[0][1] - box[3][1]) ** 2)
+        math.sqrt(float(box[0][0] - box[3][0]) ** 2 + float(box[0][1] - box[3][1]) ** 2)
     )
     box_width = int(
-        math.sqrt((box[0][0] - box[1][0]) ** 2 + (box[0][1] - box[1][1]) ** 2)
+        math.sqrt(float(box[0][0] - box[1][0]) ** 2 + float(box[0][1] - box[1][1]) ** 2)
     )
     if box_height > 2 * box_width and box_height > 30:

paddlex/inference/pipelines/pp_chatocr/pipeline_v4.py CHANGED Viewed

@@ -638,7 +638,7 @@ class PP_ChatOCRv4_Pipeline(PP_ChatOCR_Pipeline):
         for image_array in self.img_reader([input]):
-            image_string = cv2.imencode(".jpg", image_array)[1].tostring()
+            image_string = cv2.imencode(".jpg", image_array)[1].tobytes()
             image_base64 = base64.b64encode(image_string).decode("utf-8")
             result = {}
             for key in key_list:

paddlex/inference/serving/basic_serving/_app.py CHANGED Viewed

@@ -15,6 +15,8 @@
 import asyncio
 import contextlib
 import json
+from queue import Queue
+from threading import Thread
 from typing import (
     Any,
     AsyncGenerator,
@@ -74,16 +76,22 @@ class PipelineWrapper(Generic[PipelineT]):
     def __init__(self, pipeline: PipelineT) -> None:
         super().__init__()
         self._pipeline = pipeline
-        self._lock = asyncio.Lock()
+        # HACK: We work around a bug in Paddle Inference by performing all
+        # inference in the same thread.
+        self._queue = Queue()
+        self._closed = False
+        self._loop = asyncio.get_running_loop()
+        self._thread = Thread(target=self._worker, daemon=False)
+        self._thread.start()
     @property
     def pipeline(self) -> PipelineT:
         return self._pipeline
     async def infer(self, *args: Any, **kwargs: Any) -> List[Any]:
-        def _infer() -> List[Any]:
+        def _infer(*args, **kwargs) -> List[Any]:
             output: list = []
-            with contextlib.closing(self._pipeline(*args, **kwargs)) as it:
+            with contextlib.closing(self._pipeline.predict(*args, **kwargs)) as it:
                 for item in it:
                     if _is_error(item):
                         raise fastapi.HTTPException(
@@ -93,11 +101,34 @@ class PipelineWrapper(Generic[PipelineT]):
             return output
-        return await self.call(_infer)
+        return await self.call(_infer, *args, **kwargs)
     async def call(self, func: Callable[P, R], *args: P.args, **kwargs: P.kwargs) -> R:
-        async with self._lock:
-            return await call_async(func, *args, **kwargs)
+        if self._closed:
+            raise RuntimeError("`PipelineWrapper` has already been closed")
+        fut = self._loop.create_future()
+        self._queue.put((func, args, kwargs, fut))
+        return await fut
+    async def close(self):
+        if not self._closed:
+            self._queue.put(None)
+            await call_async(self._thread.join)
+            self._closed = True
+    def _worker(self):
+        while not self._closed:
+            item = self._queue.get()
+            if item is None:
+                break
+            func, args, kwargs, fut = item
+            try:
+                result = func(*args, **kwargs)
+                self._loop.call_soon_threadsafe(fut.set_result, result)
+            except Exception as e:
+                self._loop.call_soon_threadsafe(fut.set_exception, e)
+            finally:
+                self._queue.task_done()
 @class_requires_deps("aiohttp")
@@ -141,14 +172,17 @@ def create_app(
     @contextlib.asynccontextmanager
     async def _app_lifespan(app: "fastapi.FastAPI") -> AsyncGenerator[None, None]:
         ctx.pipeline = PipelineWrapper[PipelineT](pipeline)
-        if app_aiohttp_session:
-            async with aiohttp.ClientSession(
-                cookie_jar=aiohttp.DummyCookieJar()
-            ) as aiohttp_session:
-                ctx.aiohttp_session = aiohttp_session
+        try:
+            if app_aiohttp_session:
+                async with aiohttp.ClientSession(
+                    cookie_jar=aiohttp.DummyCookieJar()
+                ) as aiohttp_session:
+                    ctx.aiohttp_session = aiohttp_session
+                    yield
+            else:
                 yield
-        else:
-            yield
+        finally:
+            await ctx.pipeline.close()
     # Should we control API versions?
     app = fastapi.FastAPI(lifespan=_app_lifespan)

paddlex/inference/serving/infra/utils.py CHANGED Viewed

@@ -18,6 +18,7 @@ import io
 import mimetypes
 import re
 import tempfile
+import threading
 import uuid
 from functools import partial
 from typing import Awaitable, Callable, List, Optional, Tuple, TypeVar, Union, overload
@@ -176,29 +177,33 @@ def base64_encode(data: bytes) -> str:
     return base64.b64encode(data).decode("ascii")
+_lock = threading.Lock()
 @function_requires_deps("pypdfium2", "opencv-contrib-python")
 def read_pdf(
     bytes_: bytes, max_num_imgs: Optional[int] = None
 ) -> Tuple[List[np.ndarray], PDFInfo]:
     images: List[np.ndarray] = []
     page_info_list: List[PDFPageInfo] = []
-    doc = pdfium.PdfDocument(bytes_)
-    for page in doc:
-        if max_num_imgs is not None and len(images) >= max_num_imgs:
-            break
-        # TODO: Do not always use zoom=2.0
-        zoom = 2.0
-        deg = 0
-        image = page.render(scale=zoom, rotation=deg).to_pil()
-        image = image.convert("RGB")
-        image = np.array(image)
-        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
-        images.append(image)
-        page_info = PDFPageInfo(
-            width=image.shape[1],
-            height=image.shape[0],
-        )
-        page_info_list.append(page_info)
+    with _lock:
+        doc = pdfium.PdfDocument(bytes_)
+        for page in doc:
+            if max_num_imgs is not None and len(images) >= max_num_imgs:
+                break
+            # TODO: Do not always use zoom=2.0
+            zoom = 2.0
+            deg = 0
+            image = page.render(scale=zoom, rotation=deg).to_pil()
+            image = image.convert("RGB")
+            image = np.array(image)
+            image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
+            images.append(image)
+            page_info = PDFPageInfo(
+                width=image.shape[1],
+                height=image.shape[0],
+            )
+            page_info_list.append(page_info)
     pdf_info = PDFInfo(
         numPages=len(page_info_list),
         pages=page_info_list,

paddlex 3.0.1__py3-none-any.whl → 3.0.3__py3-none-any.whl

paddlex 3.0.1__py3-none-any.whl → 3.0.3__py3-none-any.whl