PyPI - paddlex - Versions diffs - 2.0.0rc4__py3-none-any.whl → 3.0.0__py3-none-any.whl - Mend

paddlex 2.0.0rc4__py3-none-any.whl → 3.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (1533) hide show

paddlex/.version +1 -0
paddlex/__init__.py +35 -18
paddlex/__main__.py +39 -0
paddlex/configs/modules/3d_bev_detection/BEVFusion.yaml +38 -0
paddlex/configs/modules/chart_parsing/PP-Chart2Table.yaml +13 -0
paddlex/configs/modules/doc_text_orientation/PP-LCNet_x1_0_doc_ori.yaml +41 -0
paddlex/configs/modules/doc_vlm/PP-DocBee-2B.yaml +14 -0
paddlex/configs/modules/doc_vlm/PP-DocBee-7B.yaml +14 -0
paddlex/configs/modules/doc_vlm/PP-DocBee2-3B.yaml +14 -0
paddlex/configs/modules/face_detection/BlazeFace-FPN-SSH.yaml +40 -0
paddlex/configs/modules/face_detection/BlazeFace.yaml +40 -0
paddlex/configs/modules/face_detection/PP-YOLOE_plus-S_face.yaml +40 -0
paddlex/configs/modules/face_detection/PicoDet_LCNet_x2_5_face.yaml +40 -0
paddlex/configs/modules/face_feature/MobileFaceNet.yaml +41 -0
paddlex/configs/modules/face_feature/ResNet50_face.yaml +41 -0
paddlex/configs/modules/formula_recognition/LaTeX_OCR_rec.yaml +40 -0
paddlex/configs/modules/formula_recognition/PP-FormulaNet-L.yaml +40 -0
paddlex/configs/modules/formula_recognition/PP-FormulaNet-S.yaml +40 -0
paddlex/configs/modules/formula_recognition/PP-FormulaNet_plus-L.yaml +40 -0
paddlex/configs/modules/formula_recognition/PP-FormulaNet_plus-M.yaml +40 -0
paddlex/configs/modules/formula_recognition/PP-FormulaNet_plus-S.yaml +40 -0
paddlex/configs/modules/formula_recognition/UniMERNet.yaml +40 -0
paddlex/configs/modules/human_detection/PP-YOLOE-L_human.yaml +42 -0
paddlex/configs/modules/human_detection/PP-YOLOE-S_human.yaml +42 -0
paddlex/configs/modules/image_anomaly_detection/STFPM.yaml +41 -0
paddlex/configs/modules/image_classification/CLIP_vit_base_patch16_224.yaml +41 -0
paddlex/configs/modules/image_classification/CLIP_vit_large_patch14_224.yaml +41 -0
paddlex/configs/modules/image_classification/ConvNeXt_base_224.yaml +41 -0
paddlex/configs/modules/image_classification/ConvNeXt_base_384.yaml +41 -0
paddlex/configs/modules/image_classification/ConvNeXt_large_224.yaml +41 -0
paddlex/configs/modules/image_classification/ConvNeXt_large_384.yaml +41 -0
paddlex/configs/modules/image_classification/ConvNeXt_small.yaml +41 -0
paddlex/configs/modules/image_classification/ConvNeXt_tiny.yaml +41 -0
paddlex/configs/modules/image_classification/FasterNet-L.yaml +40 -0
paddlex/configs/modules/image_classification/FasterNet-M.yaml +40 -0
paddlex/configs/modules/image_classification/FasterNet-S.yaml +40 -0
paddlex/configs/modules/image_classification/FasterNet-T0.yaml +40 -0
paddlex/configs/modules/image_classification/FasterNet-T1.yaml +40 -0
paddlex/configs/modules/image_classification/FasterNet-T2.yaml +40 -0
paddlex/configs/modules/image_classification/MobileNetV1_x0_25.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV1_x0_5.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV1_x0_75.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV1_x1_0.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV2_x0_25.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV2_x0_5.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV2_x1_0.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV2_x1_5.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV2_x2_0.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_large_x0_35.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_large_x0_5.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_large_x0_75.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_large_x1_0.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_large_x1_25.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_small_x0_35.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_small_x0_5.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_small_x0_75.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_small_x1_0.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_small_x1_25.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV4_conv_large.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV4_conv_medium.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV4_conv_small.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV4_hybrid_large.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV4_hybrid_medium.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNetV2-B0.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNetV2-B1.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNetV2-B2.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNetV2-B3.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNetV2-B4.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNetV2-B5.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNetV2-B6.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNet_base.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNet_small.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNet_tiny.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNetV2_base.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNetV2_large.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNetV2_small.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x0_25.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x0_35.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x0_5.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x0_75.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x1_0.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x1_5.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x2_0.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x2_5.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet101.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet101_vd.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet152.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet152_vd.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet18.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet18_vd.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet200_vd.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet34.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet34_vd.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet50.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet50_vd.yaml +41 -0
paddlex/configs/modules/image_classification/StarNet-S1.yaml +41 -0
paddlex/configs/modules/image_classification/StarNet-S2.yaml +41 -0
paddlex/configs/modules/image_classification/StarNet-S3.yaml +41 -0
paddlex/configs/modules/image_classification/StarNet-S4.yaml +41 -0
paddlex/configs/modules/image_classification/SwinTransformer_base_patch4_window12_384.yaml +41 -0
paddlex/configs/modules/image_classification/SwinTransformer_base_patch4_window7_224.yaml +41 -0
paddlex/configs/modules/image_classification/SwinTransformer_large_patch4_window12_384.yaml +41 -0
paddlex/configs/modules/image_classification/SwinTransformer_large_patch4_window7_224.yaml +41 -0
paddlex/configs/modules/image_classification/SwinTransformer_small_patch4_window7_224.yaml +41 -0
paddlex/configs/modules/image_classification/SwinTransformer_tiny_patch4_window7_224.yaml +41 -0
paddlex/configs/modules/image_feature/PP-ShiTuV2_rec.yaml +42 -0
paddlex/configs/modules/image_feature/PP-ShiTuV2_rec_CLIP_vit_base.yaml +42 -0
paddlex/configs/modules/image_feature/PP-ShiTuV2_rec_CLIP_vit_large.yaml +41 -0
paddlex/configs/modules/image_multilabel_classification/CLIP_vit_base_patch16_448_ML.yaml +41 -0
paddlex/configs/modules/image_multilabel_classification/PP-HGNetV2-B0_ML.yaml +41 -0
paddlex/configs/modules/image_multilabel_classification/PP-HGNetV2-B4_ML.yaml +41 -0
paddlex/configs/modules/image_multilabel_classification/PP-HGNetV2-B6_ML.yaml +41 -0
paddlex/configs/modules/image_multilabel_classification/PP-LCNet_x1_0_ML.yaml +41 -0
paddlex/configs/modules/image_multilabel_classification/ResNet50_ML.yaml +41 -0
paddlex/configs/modules/image_unwarping/UVDoc.yaml +12 -0
paddlex/configs/modules/instance_segmentation/Cascade-MaskRCNN-ResNet50-FPN.yaml +40 -0
paddlex/configs/modules/instance_segmentation/Cascade-MaskRCNN-ResNet50-vd-SSLDv2-FPN.yaml +40 -0
paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-H.yaml +40 -0
paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-L.yaml +40 -0
paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-M.yaml +40 -0
paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-S.yaml +40 -0
paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-X.yaml +40 -0
paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNeXt101-vd-FPN.yaml +39 -0
paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet101-FPN.yaml +40 -0
paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet101-vd-FPN.yaml +40 -0
paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet50-FPN.yaml +40 -0
paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet50-vd-FPN.yaml +40 -0
paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet50.yaml +40 -0
paddlex/configs/modules/instance_segmentation/PP-YOLOE_seg-S.yaml +40 -0
paddlex/configs/modules/instance_segmentation/SOLOv2.yaml +40 -0
paddlex/configs/modules/keypoint_detection/PP-TinyPose_128x96.yaml +40 -0
paddlex/configs/modules/keypoint_detection/PP-TinyPose_256x192.yaml +40 -0
paddlex/configs/modules/layout_detection/PP-DocBlockLayout.yaml +40 -0
paddlex/configs/modules/layout_detection/PP-DocLayout-L.yaml +40 -0
paddlex/configs/modules/layout_detection/PP-DocLayout-M.yaml +40 -0
paddlex/configs/modules/layout_detection/PP-DocLayout-S.yaml +40 -0
paddlex/configs/modules/layout_detection/PP-DocLayout_plus-L.yaml +40 -0
paddlex/configs/modules/layout_detection/PicoDet-L_layout_17cls.yaml +40 -0
paddlex/configs/modules/layout_detection/PicoDet-L_layout_3cls.yaml +40 -0
paddlex/configs/modules/layout_detection/PicoDet-S_layout_17cls.yaml +40 -0
paddlex/configs/modules/layout_detection/PicoDet-S_layout_3cls.yaml +40 -0
paddlex/configs/modules/layout_detection/PicoDet_layout_1x.yaml +40 -0
paddlex/configs/modules/layout_detection/PicoDet_layout_1x_table.yaml +40 -0
paddlex/configs/modules/layout_detection/RT-DETR-H_layout_17cls.yaml +40 -0
paddlex/configs/modules/layout_detection/RT-DETR-H_layout_3cls.yaml +40 -0
paddlex/configs/modules/mainbody_detection/PP-ShiTuV2_det.yaml +41 -0
paddlex/configs/modules/multilingual_speech_recognition/whisper_base.yaml +12 -0
paddlex/configs/modules/multilingual_speech_recognition/whisper_large.yaml +12 -0
paddlex/configs/modules/multilingual_speech_recognition/whisper_medium.yaml +12 -0
paddlex/configs/modules/multilingual_speech_recognition/whisper_small.yaml +12 -0
paddlex/configs/modules/multilingual_speech_recognition/whisper_tiny.yaml +12 -0
paddlex/configs/modules/object_detection/Cascade-FasterRCNN-ResNet50-FPN.yaml +41 -0
paddlex/configs/modules/object_detection/Cascade-FasterRCNN-ResNet50-vd-SSLDv2-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/CenterNet-DLA-34.yaml +41 -0
paddlex/configs/modules/object_detection/CenterNet-ResNet50.yaml +41 -0
paddlex/configs/modules/object_detection/Co-DINO-R50.yaml +40 -0
paddlex/configs/modules/object_detection/Co-DINO-Swin-L.yaml +40 -0
paddlex/configs/modules/object_detection/Co-Deformable-DETR-R50.yaml +40 -0
paddlex/configs/modules/object_detection/Co-Deformable-DETR-Swin-T.yaml +40 -0
paddlex/configs/modules/object_detection/DETR-R50.yaml +42 -0
paddlex/configs/modules/object_detection/FCOS-ResNet50.yaml +41 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNeXt101-vd-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNet101-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNet101.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNet34-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNet50-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNet50-vd-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNet50-vd-SSLDv2-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNet50.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-Swin-Tiny-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/PP-YOLOE_plus-L.yaml +40 -0
paddlex/configs/modules/object_detection/PP-YOLOE_plus-M.yaml +40 -0
paddlex/configs/modules/object_detection/PP-YOLOE_plus-S.yaml +40 -0
paddlex/configs/modules/object_detection/PP-YOLOE_plus-X.yaml +40 -0
paddlex/configs/modules/object_detection/PicoDet-L.yaml +40 -0
paddlex/configs/modules/object_detection/PicoDet-M.yaml +42 -0
paddlex/configs/modules/object_detection/PicoDet-S.yaml +40 -0
paddlex/configs/modules/object_detection/PicoDet-XS.yaml +42 -0
paddlex/configs/modules/object_detection/RT-DETR-H.yaml +40 -0
paddlex/configs/modules/object_detection/RT-DETR-L.yaml +40 -0
paddlex/configs/modules/object_detection/RT-DETR-R18.yaml +40 -0
paddlex/configs/modules/object_detection/RT-DETR-R50.yaml +40 -0
paddlex/configs/modules/object_detection/RT-DETR-X.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOX-L.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOX-M.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOX-N.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOX-S.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOX-T.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOX-X.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOv3-DarkNet53.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOv3-MobileNetV3.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOv3-ResNet50_vd_DCN.yaml +40 -0
paddlex/configs/modules/open_vocabulary_detection/GroundingDINO-T.yaml +13 -0
paddlex/configs/modules/open_vocabulary_detection/YOLO-Worldv2-L.yaml +13 -0
paddlex/configs/modules/open_vocabulary_segmentation/SAM-H_box.yaml +17 -0
paddlex/configs/modules/open_vocabulary_segmentation/SAM-H_point.yaml +15 -0
paddlex/configs/modules/pedestrian_attribute_recognition/PP-LCNet_x1_0_pedestrian_attribute.yaml +41 -0
paddlex/configs/modules/rotated_object_detection/PP-YOLOE-R-L.yaml +40 -0
paddlex/configs/modules/seal_text_detection/PP-OCRv4_mobile_seal_det.yaml +40 -0
paddlex/configs/modules/seal_text_detection/PP-OCRv4_server_seal_det.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/Deeplabv3-R101.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/Deeplabv3-R50.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/Deeplabv3_Plus-R101.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/Deeplabv3_Plus-R50.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/MaskFormer_small.yaml +42 -0
paddlex/configs/modules/semantic_segmentation/MaskFormer_tiny.yaml +42 -0
paddlex/configs/modules/semantic_segmentation/OCRNet_HRNet-W18.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/OCRNet_HRNet-W48.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/PP-LiteSeg-B.yaml +41 -0
paddlex/configs/modules/semantic_segmentation/PP-LiteSeg-T.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SeaFormer_base.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SeaFormer_large.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SeaFormer_small.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SeaFormer_tiny.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SegFormer-B0.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SegFormer-B1.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SegFormer-B2.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SegFormer-B3.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SegFormer-B4.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SegFormer-B5.yaml +40 -0
paddlex/configs/modules/small_object_detection/PP-YOLOE_plus_SOD-L.yaml +42 -0
paddlex/configs/modules/small_object_detection/PP-YOLOE_plus_SOD-S.yaml +42 -0
paddlex/configs/modules/small_object_detection/PP-YOLOE_plus_SOD-largesize-L.yaml +42 -0
paddlex/configs/modules/table_cells_detection/RT-DETR-L_wired_table_cell_det.yaml +40 -0
paddlex/configs/modules/table_cells_detection/RT-DETR-L_wireless_table_cell_det.yaml +40 -0
paddlex/configs/modules/table_classification/PP-LCNet_x1_0_table_cls.yaml +41 -0
paddlex/configs/modules/table_structure_recognition/SLANeXt_wired.yaml +39 -0
paddlex/configs/modules/table_structure_recognition/SLANeXt_wireless.yaml +39 -0
paddlex/configs/modules/table_structure_recognition/SLANet.yaml +39 -0
paddlex/configs/modules/table_structure_recognition/SLANet_plus.yaml +39 -0
paddlex/configs/modules/text_detection/PP-OCRv3_mobile_det.yaml +40 -0
paddlex/configs/modules/text_detection/PP-OCRv3_server_det.yaml +40 -0
paddlex/configs/modules/text_detection/PP-OCRv4_mobile_det.yaml +40 -0
paddlex/configs/modules/text_detection/PP-OCRv4_server_det.yaml +40 -0
paddlex/configs/modules/text_detection/PP-OCRv5_mobile_det.yaml +40 -0
paddlex/configs/modules/text_detection/PP-OCRv5_server_det.yaml +40 -0
paddlex/configs/modules/text_recognition/PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/PP-OCRv4_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/PP-OCRv4_server_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/PP-OCRv4_server_rec_doc.yaml +39 -0
paddlex/configs/modules/text_recognition/PP-OCRv5_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/PP-OCRv5_server_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/arabic_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/ch_RepSVTR_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/ch_SVTRv2_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/chinese_cht_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/cyrillic_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/devanagari_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/en_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/en_PP-OCRv4_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/japan_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/ka_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/korean_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/latin_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/ta_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/te_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/textline_orientation/PP-LCNet_x0_25_textline_ori.yaml +41 -0
paddlex/configs/modules/ts_anomaly_detection/AutoEncoder_ad.yaml +37 -0
paddlex/configs/modules/ts_anomaly_detection/DLinear_ad.yaml +37 -0
paddlex/configs/modules/ts_anomaly_detection/Nonstationary_ad.yaml +37 -0
paddlex/configs/modules/ts_anomaly_detection/PatchTST_ad.yaml +37 -0
paddlex/configs/modules/ts_anomaly_detection/TimesNet_ad.yaml +37 -0
paddlex/configs/modules/ts_classification/TimesNet_cls.yaml +37 -0
paddlex/configs/modules/ts_forecast/DLinear.yaml +38 -0
paddlex/configs/modules/ts_forecast/NLinear.yaml +38 -0
paddlex/configs/modules/ts_forecast/Nonstationary.yaml +38 -0
paddlex/configs/modules/ts_forecast/PatchTST.yaml +38 -0
paddlex/configs/modules/ts_forecast/RLinear.yaml +38 -0
paddlex/configs/modules/ts_forecast/TiDE.yaml +38 -0
paddlex/configs/modules/ts_forecast/TimesNet.yaml +38 -0
paddlex/configs/modules/vehicle_attribute_recognition/PP-LCNet_x1_0_vehicle_attribute.yaml +41 -0
paddlex/configs/modules/vehicle_detection/PP-YOLOE-L_vehicle.yaml +41 -0
paddlex/configs/modules/vehicle_detection/PP-YOLOE-S_vehicle.yaml +42 -0
paddlex/configs/modules/video_classification/PP-TSM-R50_8frames_uniform.yaml +42 -0
paddlex/configs/modules/video_classification/PP-TSMv2-LCNetV2_16frames_uniform.yaml +42 -0
paddlex/configs/modules/video_classification/PP-TSMv2-LCNetV2_8frames_uniform.yaml +42 -0
paddlex/configs/modules/video_detection/YOWO.yaml +40 -0
paddlex/configs/pipelines/3d_bev_detection.yaml +9 -0
paddlex/configs/pipelines/OCR.yaml +45 -0
paddlex/configs/pipelines/PP-ChatOCRv3-doc.yaml +151 -0
paddlex/configs/pipelines/PP-ChatOCRv4-doc.yaml +237 -0
paddlex/configs/pipelines/PP-ShiTuV2.yaml +18 -0
paddlex/configs/pipelines/PP-StructureV3.yaml +226 -0
paddlex/configs/pipelines/anomaly_detection.yaml +8 -0
paddlex/configs/pipelines/doc_preprocessor.yaml +15 -0
paddlex/configs/pipelines/doc_understanding.yaml +9 -0
paddlex/configs/pipelines/face_recognition.yaml +18 -0
paddlex/configs/pipelines/formula_recognition.yaml +39 -0
paddlex/configs/pipelines/human_keypoint_detection.yaml +17 -0
paddlex/configs/pipelines/image_classification.yaml +10 -0
paddlex/configs/pipelines/image_multilabel_classification.yaml +9 -0
paddlex/configs/pipelines/instance_segmentation.yaml +10 -0
paddlex/configs/pipelines/layout_parsing.yaml +102 -0
paddlex/configs/pipelines/multilingual_speech_recognition.yaml +9 -0
paddlex/configs/pipelines/object_detection.yaml +10 -0
paddlex/configs/pipelines/open_vocabulary_detection.yaml +12 -0
paddlex/configs/pipelines/open_vocabulary_segmentation.yaml +13 -0
paddlex/configs/pipelines/pedestrian_attribute_recognition.yaml +15 -0
paddlex/configs/pipelines/rotated_object_detection.yaml +10 -0
paddlex/configs/pipelines/seal_recognition.yaml +52 -0
paddlex/configs/pipelines/semantic_segmentation.yaml +10 -0
paddlex/configs/pipelines/small_object_detection.yaml +10 -0
paddlex/configs/pipelines/table_recognition.yaml +57 -0
paddlex/configs/pipelines/table_recognition_v2.yaml +82 -0
paddlex/configs/pipelines/ts_anomaly_detection.yaml +8 -0
paddlex/configs/pipelines/ts_classification.yaml +8 -0
paddlex/configs/pipelines/ts_forecast.yaml +8 -0
paddlex/configs/pipelines/vehicle_attribute_recognition.yaml +15 -0
paddlex/configs/pipelines/video_classification.yaml +9 -0
paddlex/configs/pipelines/video_detection.yaml +10 -0
paddlex/constants.py +17 -0
paddlex/engine.py +56 -0
paddlex/hpip_links.html +31 -0
paddlex/inference/__init__.py +19 -0
paddlex/inference/common/__init__.py +13 -0
paddlex/inference/common/batch_sampler/__init__.py +21 -0
paddlex/inference/common/batch_sampler/audio_batch_sampler.py +83 -0
paddlex/inference/common/batch_sampler/base_batch_sampler.py +94 -0
paddlex/inference/common/batch_sampler/det_3d_batch_sampler.py +144 -0
paddlex/inference/common/batch_sampler/doc_vlm_batch_sampler.py +87 -0
paddlex/inference/common/batch_sampler/image_batch_sampler.py +121 -0
paddlex/inference/common/batch_sampler/ts_batch_sampler.py +109 -0
paddlex/inference/common/batch_sampler/video_batch_sampler.py +74 -0
paddlex/inference/common/reader/__init__.py +19 -0
paddlex/inference/common/reader/audio_reader.py +46 -0
paddlex/inference/common/reader/det_3d_reader.py +241 -0
paddlex/inference/common/reader/image_reader.py +73 -0
paddlex/inference/common/reader/ts_reader.py +46 -0
paddlex/inference/common/reader/video_reader.py +42 -0
paddlex/inference/common/result/__init__.py +29 -0
paddlex/inference/common/result/base_cv_result.py +41 -0
paddlex/inference/common/result/base_result.py +72 -0
paddlex/inference/common/result/base_ts_result.py +41 -0
paddlex/inference/common/result/base_video_result.py +36 -0
paddlex/inference/common/result/mixin.py +709 -0
paddlex/inference/models/__init__.py +86 -0
paddlex/inference/models/anomaly_detection/__init__.py +15 -0
paddlex/inference/models/anomaly_detection/predictor.py +135 -0
paddlex/inference/models/anomaly_detection/processors.py +53 -0
paddlex/inference/models/anomaly_detection/result.py +71 -0
paddlex/inference/models/base/__init__.py +15 -0
paddlex/inference/models/base/predictor/__init__.py +15 -0
paddlex/inference/models/base/predictor/base_predictor.py +414 -0
paddlex/inference/models/common/__init__.py +26 -0
paddlex/inference/models/common/static_infer.py +801 -0
paddlex/inference/models/common/tokenizer/__init__.py +21 -0
paddlex/inference/models/common/tokenizer/bert_tokenizer.py +655 -0
paddlex/inference/models/common/tokenizer/clip_tokenizer.py +609 -0
paddlex/inference/models/common/tokenizer/gpt_tokenizer.py +453 -0
paddlex/inference/models/common/tokenizer/qwen2_5_tokenizer.py +112 -0
paddlex/inference/models/common/tokenizer/qwen2_tokenizer.py +438 -0
paddlex/inference/models/common/tokenizer/qwen_tokenizer.py +288 -0
paddlex/inference/models/common/tokenizer/tokenizer_utils.py +2149 -0
paddlex/inference/models/common/tokenizer/tokenizer_utils_base.py +3720 -0
paddlex/inference/models/common/tokenizer/utils.py +66 -0
paddlex/inference/models/common/tokenizer/vocab.py +647 -0
paddlex/inference/models/common/ts/__init__.py +15 -0
paddlex/inference/models/common/ts/funcs.py +540 -0
paddlex/inference/models/common/ts/processors.py +322 -0
paddlex/inference/models/common/vision/__init__.py +23 -0
paddlex/inference/models/common/vision/funcs.py +98 -0
paddlex/inference/models/common/vision/processors.py +285 -0
paddlex/inference/models/common/vlm/__init__.py +13 -0
paddlex/inference/models/common/vlm/activations.py +189 -0
paddlex/inference/models/common/vlm/bert_padding.py +127 -0
paddlex/inference/models/common/vlm/conversion_utils.py +99 -0
paddlex/inference/models/common/vlm/distributed.py +229 -0
paddlex/inference/models/common/vlm/flash_attn_utils.py +119 -0
paddlex/inference/models/common/vlm/fusion_ops.py +205 -0
paddlex/inference/models/common/vlm/generation/__init__.py +34 -0
paddlex/inference/models/common/vlm/generation/configuration_utils.py +533 -0
paddlex/inference/models/common/vlm/generation/logits_process.py +730 -0
paddlex/inference/models/common/vlm/generation/stopping_criteria.py +106 -0
paddlex/inference/models/common/vlm/generation/utils.py +2162 -0
paddlex/inference/models/common/vlm/transformers/__init__.py +16 -0
paddlex/inference/models/common/vlm/transformers/configuration_utils.py +1037 -0
paddlex/inference/models/common/vlm/transformers/conversion_utils.py +408 -0
paddlex/inference/models/common/vlm/transformers/model_outputs.py +1612 -0
paddlex/inference/models/common/vlm/transformers/model_utils.py +2014 -0
paddlex/inference/models/common/vlm/transformers/utils.py +178 -0
paddlex/inference/models/common/vlm/utils.py +109 -0
paddlex/inference/models/doc_vlm/__init__.py +15 -0
paddlex/inference/models/doc_vlm/modeling/GOT_ocr_2_0.py +830 -0
paddlex/inference/models/doc_vlm/modeling/__init__.py +17 -0
paddlex/inference/models/doc_vlm/modeling/qwen2.py +1606 -0
paddlex/inference/models/doc_vlm/modeling/qwen2_5_vl.py +3006 -0
paddlex/inference/models/doc_vlm/modeling/qwen2_vl.py +2495 -0
paddlex/inference/models/doc_vlm/predictor.py +253 -0
paddlex/inference/models/doc_vlm/processors/GOT_ocr_2_0.py +97 -0
paddlex/inference/models/doc_vlm/processors/__init__.py +17 -0
paddlex/inference/models/doc_vlm/processors/common.py +561 -0
paddlex/inference/models/doc_vlm/processors/qwen2_5_vl.py +548 -0
paddlex/inference/models/doc_vlm/processors/qwen2_vl.py +543 -0
paddlex/inference/models/doc_vlm/result.py +21 -0
paddlex/inference/models/face_feature/__init__.py +15 -0
paddlex/inference/models/face_feature/predictor.py +66 -0
paddlex/inference/models/formula_recognition/__init__.py +15 -0
paddlex/inference/models/formula_recognition/predictor.py +193 -0
paddlex/inference/models/formula_recognition/processors.py +1015 -0
paddlex/inference/models/formula_recognition/result.py +411 -0
paddlex/inference/models/image_classification/__init__.py +15 -0
paddlex/inference/models/image_classification/predictor.py +172 -0
paddlex/inference/models/image_classification/processors.py +89 -0
paddlex/inference/models/image_classification/result.py +93 -0
paddlex/inference/models/image_feature/__init__.py +15 -0
paddlex/inference/models/image_feature/predictor.py +146 -0
paddlex/inference/models/image_feature/processors.py +31 -0
paddlex/inference/models/image_feature/result.py +32 -0
paddlex/inference/models/image_multilabel_classification/__init__.py +15 -0
paddlex/inference/models/image_multilabel_classification/predictor.py +95 -0
paddlex/inference/models/image_multilabel_classification/processors.py +89 -0
paddlex/inference/models/image_multilabel_classification/result.py +96 -0
paddlex/inference/models/image_unwarping/__init__.py +15 -0
paddlex/inference/models/image_unwarping/predictor.py +97 -0
paddlex/inference/models/image_unwarping/processors.py +92 -0
paddlex/inference/models/image_unwarping/result.py +47 -0
paddlex/inference/models/instance_segmentation/__init__.py +15 -0
paddlex/inference/models/instance_segmentation/predictor.py +202 -0
paddlex/inference/models/instance_segmentation/processors.py +102 -0
paddlex/inference/models/instance_segmentation/result.py +162 -0
paddlex/inference/models/keypoint_detection/__init__.py +15 -0
paddlex/inference/models/keypoint_detection/predictor.py +190 -0
paddlex/inference/models/keypoint_detection/processors.py +367 -0
paddlex/inference/models/keypoint_detection/result.py +197 -0
paddlex/inference/models/m_3d_bev_detection/__init__.py +15 -0
paddlex/inference/models/m_3d_bev_detection/predictor.py +303 -0
paddlex/inference/models/m_3d_bev_detection/processors.py +990 -0
paddlex/inference/models/m_3d_bev_detection/result.py +68 -0
paddlex/inference/models/m_3d_bev_detection/visualizer_3d.py +169 -0
paddlex/inference/models/multilingual_speech_recognition/__init__.py +15 -0
paddlex/inference/models/multilingual_speech_recognition/predictor.py +137 -0
paddlex/inference/models/multilingual_speech_recognition/processors.py +1933 -0
paddlex/inference/models/multilingual_speech_recognition/result.py +21 -0
paddlex/inference/models/object_detection/__init__.py +15 -0
paddlex/inference/models/object_detection/predictor.py +344 -0
paddlex/inference/models/object_detection/processors.py +885 -0
paddlex/inference/models/object_detection/result.py +114 -0
paddlex/inference/models/object_detection/utils.py +70 -0
paddlex/inference/models/open_vocabulary_detection/__init__.py +15 -0
paddlex/inference/models/open_vocabulary_detection/predictor.py +172 -0
paddlex/inference/models/open_vocabulary_detection/processors/__init__.py +16 -0
paddlex/inference/models/open_vocabulary_detection/processors/common.py +114 -0
paddlex/inference/models/open_vocabulary_detection/processors/groundingdino_processors.py +496 -0
paddlex/inference/models/open_vocabulary_detection/processors/yoloworld_processors.py +209 -0
paddlex/inference/models/open_vocabulary_segmentation/__init__.py +15 -0
paddlex/inference/models/open_vocabulary_segmentation/predictor.py +113 -0
paddlex/inference/models/open_vocabulary_segmentation/processors/__init__.py +15 -0
paddlex/inference/models/open_vocabulary_segmentation/processors/sam_processer.py +249 -0
paddlex/inference/models/open_vocabulary_segmentation/results/__init__.py +15 -0
paddlex/inference/models/open_vocabulary_segmentation/results/sam_result.py +149 -0
paddlex/inference/models/semantic_segmentation/__init__.py +15 -0
paddlex/inference/models/semantic_segmentation/predictor.py +158 -0
paddlex/inference/models/semantic_segmentation/processors.py +117 -0
paddlex/inference/models/semantic_segmentation/result.py +73 -0
paddlex/inference/models/table_structure_recognition/__init__.py +15 -0
paddlex/inference/models/table_structure_recognition/predictor.py +161 -0
paddlex/inference/models/table_structure_recognition/processors.py +229 -0
paddlex/inference/models/table_structure_recognition/result.py +63 -0
paddlex/inference/models/text_detection/__init__.py +15 -0
paddlex/inference/models/text_detection/predictor.py +191 -0
paddlex/inference/models/text_detection/processors.py +538 -0
paddlex/inference/models/text_detection/result.py +46 -0
paddlex/inference/models/text_recognition/__init__.py +15 -0
paddlex/inference/models/text_recognition/predictor.py +98 -0
paddlex/inference/models/text_recognition/processors.py +245 -0
paddlex/inference/models/text_recognition/result.py +76 -0
paddlex/inference/models/ts_anomaly_detection/__init__.py +15 -0
paddlex/inference/models/ts_anomaly_detection/predictor.py +141 -0
paddlex/inference/models/ts_anomaly_detection/processors.py +98 -0
paddlex/inference/models/ts_anomaly_detection/result.py +83 -0
paddlex/inference/models/ts_classification/__init__.py +15 -0
paddlex/inference/models/ts_classification/predictor.py +122 -0
paddlex/inference/models/ts_classification/processors.py +122 -0
paddlex/inference/models/ts_classification/result.py +87 -0
paddlex/inference/models/ts_forecasting/__init__.py +15 -0
paddlex/inference/models/ts_forecasting/predictor.py +154 -0
paddlex/inference/models/ts_forecasting/processors.py +158 -0
paddlex/inference/models/ts_forecasting/result.py +96 -0
paddlex/inference/models/video_classification/__init__.py +15 -0
paddlex/inference/models/video_classification/predictor.py +141 -0
paddlex/inference/models/video_classification/processors.py +409 -0
paddlex/inference/models/video_classification/result.py +96 -0
paddlex/inference/models/video_detection/__init__.py +15 -0
paddlex/inference/models/video_detection/predictor.py +129 -0
paddlex/inference/models/video_detection/processors.py +463 -0
paddlex/inference/models/video_detection/result.py +109 -0
paddlex/inference/pipelines/__init__.py +239 -0
paddlex/inference/pipelines/_parallel.py +172 -0
paddlex/inference/pipelines/anomaly_detection/__init__.py +15 -0
paddlex/inference/pipelines/anomaly_detection/pipeline.py +82 -0
paddlex/inference/pipelines/attribute_recognition/__init__.py +15 -0
paddlex/inference/pipelines/attribute_recognition/pipeline.py +120 -0
paddlex/inference/pipelines/attribute_recognition/result.py +102 -0
paddlex/inference/pipelines/base.py +156 -0
paddlex/inference/pipelines/components/__init__.py +29 -0
paddlex/inference/pipelines/components/chat_server/__init__.py +16 -0
paddlex/inference/pipelines/components/chat_server/base.py +39 -0
paddlex/inference/pipelines/components/chat_server/openai_bot_chat.py +236 -0
paddlex/inference/pipelines/components/common/__init__.py +19 -0
paddlex/inference/pipelines/components/common/base_operator.py +37 -0
paddlex/inference/pipelines/components/common/base_result.py +66 -0
paddlex/inference/pipelines/components/common/convert_points_and_boxes.py +45 -0
paddlex/inference/pipelines/components/common/crop_image_regions.py +556 -0
paddlex/inference/pipelines/components/common/seal_det_warp.py +972 -0
paddlex/inference/pipelines/components/common/sort_boxes.py +85 -0
paddlex/inference/pipelines/components/common/warp_image.py +50 -0
paddlex/inference/pipelines/components/faisser.py +357 -0
paddlex/inference/pipelines/components/prompt_engineering/__init__.py +16 -0
paddlex/inference/pipelines/components/prompt_engineering/base.py +35 -0
paddlex/inference/pipelines/components/prompt_engineering/generate_ensemble_prompt.py +128 -0
paddlex/inference/pipelines/components/prompt_engineering/generate_kie_prompt.py +148 -0
paddlex/inference/pipelines/components/retriever/__init__.py +16 -0
paddlex/inference/pipelines/components/retriever/base.py +228 -0
paddlex/inference/pipelines/components/retriever/openai_bot_retriever.py +70 -0
paddlex/inference/pipelines/components/retriever/qianfan_bot_retriever.py +166 -0
paddlex/inference/pipelines/components/utils/__init__.py +13 -0
paddlex/inference/pipelines/components/utils/mixin.py +206 -0
paddlex/inference/pipelines/doc_preprocessor/__init__.py +15 -0
paddlex/inference/pipelines/doc_preprocessor/pipeline.py +209 -0
paddlex/inference/pipelines/doc_preprocessor/result.py +98 -0
paddlex/inference/pipelines/doc_understanding/__init__.py +15 -0
paddlex/inference/pipelines/doc_understanding/pipeline.py +71 -0
paddlex/inference/pipelines/face_recognition/__init__.py +15 -0
paddlex/inference/pipelines/face_recognition/pipeline.py +63 -0
paddlex/inference/pipelines/face_recognition/result.py +44 -0
paddlex/inference/pipelines/formula_recognition/__init__.py +15 -0
paddlex/inference/pipelines/formula_recognition/pipeline.py +347 -0
paddlex/inference/pipelines/formula_recognition/result.py +282 -0
paddlex/inference/pipelines/image_classification/__init__.py +15 -0
paddlex/inference/pipelines/image_classification/pipeline.py +90 -0
paddlex/inference/pipelines/image_multilabel_classification/__init__.py +15 -0
paddlex/inference/pipelines/image_multilabel_classification/pipeline.py +97 -0
paddlex/inference/pipelines/instance_segmentation/__init__.py +15 -0
paddlex/inference/pipelines/instance_segmentation/pipeline.py +91 -0
paddlex/inference/pipelines/keypoint_detection/__init__.py +15 -0
paddlex/inference/pipelines/keypoint_detection/pipeline.py +158 -0
paddlex/inference/pipelines/layout_parsing/__init__.py +16 -0
paddlex/inference/pipelines/layout_parsing/pipeline.py +568 -0
paddlex/inference/pipelines/layout_parsing/pipeline_v2.py +1382 -0
paddlex/inference/pipelines/layout_parsing/result.py +191 -0
paddlex/inference/pipelines/layout_parsing/result_v2.py +745 -0
paddlex/inference/pipelines/layout_parsing/setting.py +87 -0
paddlex/inference/pipelines/layout_parsing/utils.py +951 -0
paddlex/inference/pipelines/layout_parsing/xycut_enhanced/__init__.py +16 -0
paddlex/inference/pipelines/layout_parsing/xycut_enhanced/utils.py +1143 -0
paddlex/inference/pipelines/layout_parsing/xycut_enhanced/xycuts.py +562 -0
paddlex/inference/pipelines/m_3d_bev_detection/__init__.py +15 -0
paddlex/inference/pipelines/m_3d_bev_detection/pipeline.py +74 -0
paddlex/inference/pipelines/multilingual_speech_recognition/__init__.py +15 -0
paddlex/inference/pipelines/multilingual_speech_recognition/pipeline.py +78 -0
paddlex/inference/pipelines/object_detection/__init__.py +15 -0
paddlex/inference/pipelines/object_detection/pipeline.py +115 -0
paddlex/inference/pipelines/ocr/__init__.py +15 -0
paddlex/inference/pipelines/ocr/pipeline.py +463 -0
paddlex/inference/pipelines/ocr/result.py +255 -0
paddlex/inference/pipelines/open_vocabulary_detection/__init__.py +15 -0
paddlex/inference/pipelines/open_vocabulary_detection/pipeline.py +86 -0
paddlex/inference/pipelines/open_vocabulary_segmentation/__init__.py +15 -0
paddlex/inference/pipelines/open_vocabulary_segmentation/pipeline.py +100 -0
paddlex/inference/pipelines/pp_chatocr/__init__.py +16 -0
paddlex/inference/pipelines/pp_chatocr/pipeline_base.py +111 -0
paddlex/inference/pipelines/pp_chatocr/pipeline_v3.py +781 -0
paddlex/inference/pipelines/pp_chatocr/pipeline_v4.py +992 -0
paddlex/inference/pipelines/pp_shitu_v2/__init__.py +15 -0
paddlex/inference/pipelines/pp_shitu_v2/pipeline.py +156 -0
paddlex/inference/pipelines/pp_shitu_v2/result.py +126 -0
paddlex/inference/pipelines/rotated_object_detection/__init__.py +15 -0
paddlex/inference/pipelines/rotated_object_detection/pipeline.py +95 -0
paddlex/inference/pipelines/seal_recognition/__init__.py +15 -0
paddlex/inference/pipelines/seal_recognition/pipeline.py +335 -0
paddlex/inference/pipelines/seal_recognition/result.py +89 -0
paddlex/inference/pipelines/semantic_segmentation/__init__.py +15 -0
paddlex/inference/pipelines/semantic_segmentation/pipeline.py +95 -0
paddlex/inference/pipelines/small_object_detection/__init__.py +15 -0
paddlex/inference/pipelines/small_object_detection/pipeline.py +95 -0
paddlex/inference/pipelines/table_recognition/__init__.py +16 -0
paddlex/inference/pipelines/table_recognition/pipeline.py +486 -0
paddlex/inference/pipelines/table_recognition/pipeline_v2.py +1395 -0
paddlex/inference/pipelines/table_recognition/result.py +218 -0
paddlex/inference/pipelines/table_recognition/table_recognition_post_processing.py +366 -0
paddlex/inference/pipelines/table_recognition/table_recognition_post_processing_v2.py +488 -0
paddlex/inference/pipelines/table_recognition/utils.py +44 -0
paddlex/inference/pipelines/ts_anomaly_detection/__init__.py +15 -0
paddlex/inference/pipelines/ts_anomaly_detection/pipeline.py +72 -0
paddlex/inference/pipelines/ts_classification/__init__.py +15 -0
paddlex/inference/pipelines/ts_classification/pipeline.py +72 -0
paddlex/inference/pipelines/ts_forecasting/__init__.py +15 -0
paddlex/inference/pipelines/ts_forecasting/pipeline.py +72 -0
paddlex/inference/pipelines/video_classification/__init__.py +15 -0
paddlex/inference/pipelines/video_classification/pipeline.py +79 -0
paddlex/inference/pipelines/video_detection/__init__.py +15 -0
paddlex/inference/pipelines/video_detection/pipeline.py +86 -0
paddlex/inference/serving/__init__.py +17 -0
paddlex/inference/serving/basic_serving/__init__.py +18 -0
paddlex/inference/serving/basic_serving/_app.py +221 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/__init__.py +44 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/_common/__init__.py +13 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/_common/common.py +104 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/_common/image_recognition.py +36 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/_common/ocr.py +95 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/anomaly_detection.py +67 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/doc_preprocessor.py +100 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/doc_understanding.py +153 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/face_recognition.py +226 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/formula_recognition.py +100 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/human_keypoint_detection.py +81 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/image_classification.py +69 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/image_multilabel_classification.py +73 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/instance_segmentation.py +87 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/layout_parsing.py +117 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/m_3d_bev_detection.py +79 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/multilingual_speech_recognition.py +92 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/object_detection.py +77 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/ocr.py +102 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/open_vocabulary_detection.py +81 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/open_vocabulary_segmentation.py +91 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/pedestrian_attribute_recognition.py +84 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/pp_chatocrv3_doc.py +193 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/pp_chatocrv4_doc.py +223 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/pp_shituv2.py +221 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/pp_structurev3.py +143 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/rotated_object_detection.py +81 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/seal_recognition.py +106 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/semantic_segmentation.py +67 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/small_object_detection.py +72 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/table_recognition.py +108 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/table_recognition_v2.py +113 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/ts_anomaly_detection.py +65 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/ts_classification.py +64 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/ts_forecast.py +65 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/vehicle_attribute_recognition.py +84 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/video_classification.py +76 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/video_detection.py +92 -0
paddlex/inference/serving/basic_serving/_server.py +40 -0
paddlex/inference/serving/infra/__init__.py +13 -0
paddlex/inference/serving/infra/config.py +36 -0
paddlex/inference/serving/infra/models.py +79 -0
paddlex/inference/serving/infra/storage.py +180 -0
paddlex/inference/serving/infra/utils.py +285 -0
paddlex/inference/serving/schemas/__init__.py +13 -0
paddlex/inference/serving/schemas/anomaly_detection.py +39 -0
paddlex/inference/serving/schemas/doc_preprocessor.py +54 -0
paddlex/inference/serving/schemas/doc_understanding.py +78 -0
paddlex/inference/serving/schemas/face_recognition.py +124 -0
paddlex/inference/serving/schemas/formula_recognition.py +56 -0
paddlex/inference/serving/schemas/human_keypoint_detection.py +55 -0
paddlex/inference/serving/schemas/image_classification.py +45 -0
paddlex/inference/serving/schemas/image_multilabel_classification.py +47 -0
paddlex/inference/serving/schemas/instance_segmentation.py +53 -0
paddlex/inference/serving/schemas/layout_parsing.py +71 -0
paddlex/inference/serving/schemas/m_3d_bev_detection.py +48 -0
paddlex/inference/serving/schemas/multilingual_speech_recognition.py +57 -0
paddlex/inference/serving/schemas/object_detection.py +52 -0
paddlex/inference/serving/schemas/ocr.py +60 -0
paddlex/inference/serving/schemas/open_vocabulary_detection.py +52 -0
paddlex/inference/serving/schemas/open_vocabulary_segmentation.py +52 -0
paddlex/inference/serving/schemas/pedestrian_attribute_recognition.py +61 -0
paddlex/inference/serving/schemas/pp_chatocrv3_doc.py +133 -0
paddlex/inference/serving/schemas/pp_chatocrv4_doc.py +150 -0
paddlex/inference/serving/schemas/pp_shituv2.py +124 -0
paddlex/inference/serving/schemas/pp_structurev3.py +88 -0
paddlex/inference/serving/schemas/rotated_object_detection.py +52 -0
paddlex/inference/serving/schemas/seal_recognition.py +62 -0
paddlex/inference/serving/schemas/semantic_segmentation.py +45 -0
paddlex/inference/serving/schemas/shared/__init__.py +13 -0
paddlex/inference/serving/schemas/shared/classification.py +23 -0
paddlex/inference/serving/schemas/shared/image_segmentation.py +28 -0
paddlex/inference/serving/schemas/shared/object_detection.py +24 -0
paddlex/inference/serving/schemas/shared/ocr.py +25 -0
paddlex/inference/serving/schemas/small_object_detection.py +52 -0
paddlex/inference/serving/schemas/table_recognition.py +64 -0
paddlex/inference/serving/schemas/table_recognition_v2.py +69 -0
paddlex/inference/serving/schemas/ts_anomaly_detection.py +37 -0
paddlex/inference/serving/schemas/ts_classification.py +38 -0
paddlex/inference/serving/schemas/ts_forecast.py +37 -0
paddlex/inference/serving/schemas/vehicle_attribute_recognition.py +61 -0
paddlex/inference/serving/schemas/video_classification.py +44 -0
paddlex/inference/serving/schemas/video_detection.py +56 -0
paddlex/inference/utils/__init__.py +13 -0
paddlex/inference/utils/benchmark.py +379 -0
paddlex/inference/utils/color_map.py +123 -0
paddlex/inference/utils/get_pipeline_path.py +27 -0
paddlex/inference/utils/hpi.py +254 -0
paddlex/inference/utils/hpi_model_info_collection.json +2331 -0
paddlex/inference/utils/io/__init__.py +36 -0
paddlex/inference/utils/io/readers.py +504 -0
paddlex/inference/utils/io/style.py +381 -0
paddlex/inference/utils/io/tablepyxl.py +157 -0
paddlex/inference/utils/io/writers.py +458 -0
paddlex/inference/utils/model_paths.py +48 -0
paddlex/inference/utils/new_ir_blocklist.py +27 -0
paddlex/inference/utils/official_models.py +367 -0
paddlex/inference/utils/pp_option.py +339 -0
paddlex/inference/utils/trt_blocklist.py +43 -0
paddlex/inference/utils/trt_config.py +420 -0
paddlex/model.py +131 -0
paddlex/modules/__init__.py +115 -0
paddlex/modules/anomaly_detection/__init__.py +18 -0
paddlex/modules/anomaly_detection/dataset_checker/__init__.py +94 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/analyse_dataset.py +82 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/check_dataset.py +91 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/convert_dataset.py +233 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/split_dataset.py +87 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/utils/visualizer.py +76 -0
paddlex/modules/anomaly_detection/evaluator.py +58 -0
paddlex/modules/anomaly_detection/exportor.py +22 -0
paddlex/modules/anomaly_detection/model_list.py +16 -0
paddlex/modules/anomaly_detection/trainer.py +70 -0
paddlex/modules/base/__init__.py +18 -0
paddlex/modules/base/build_model.py +33 -0
paddlex/modules/base/dataset_checker/__init__.py +16 -0
paddlex/modules/base/dataset_checker/dataset_checker.py +169 -0
paddlex/modules/base/dataset_checker/utils.py +108 -0
paddlex/modules/base/evaluator.py +170 -0
paddlex/modules/base/exportor.py +145 -0
paddlex/modules/base/trainer.py +144 -0
paddlex/modules/base/utils/__init__.py +13 -0
paddlex/modules/base/utils/cinn_setting.py +89 -0
paddlex/modules/base/utils/coco_eval.py +94 -0
paddlex/modules/base/utils/topk_eval.py +118 -0
paddlex/modules/doc_vlm/__init__.py +18 -0
paddlex/modules/doc_vlm/dataset_checker.py +29 -0
paddlex/modules/doc_vlm/evaluator.py +29 -0
paddlex/modules/doc_vlm/exportor.py +29 -0
paddlex/modules/doc_vlm/model_list.py +16 -0
paddlex/modules/doc_vlm/trainer.py +41 -0
paddlex/modules/face_recognition/__init__.py +18 -0
paddlex/modules/face_recognition/dataset_checker/__init__.py +71 -0
paddlex/modules/face_recognition/dataset_checker/dataset_src/__init__.py +16 -0
paddlex/modules/face_recognition/dataset_checker/dataset_src/check_dataset.py +172 -0
paddlex/modules/face_recognition/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/face_recognition/dataset_checker/dataset_src/utils/visualizer.py +153 -0
paddlex/modules/face_recognition/evaluator.py +52 -0
paddlex/modules/face_recognition/exportor.py +22 -0
paddlex/modules/face_recognition/model_list.py +15 -0
paddlex/modules/face_recognition/trainer.py +75 -0
paddlex/modules/formula_recognition/__init__.py +18 -0
paddlex/modules/formula_recognition/dataset_checker/__init__.py +113 -0
paddlex/modules/formula_recognition/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/formula_recognition/dataset_checker/dataset_src/analyse_dataset.py +158 -0
paddlex/modules/formula_recognition/dataset_checker/dataset_src/check_dataset.py +76 -0
paddlex/modules/formula_recognition/dataset_checker/dataset_src/convert_dataset.py +95 -0
paddlex/modules/formula_recognition/dataset_checker/dataset_src/split_dataset.py +80 -0
paddlex/modules/formula_recognition/evaluator.py +80 -0
paddlex/modules/formula_recognition/exportor.py +22 -0
paddlex/modules/formula_recognition/model_list.py +23 -0
paddlex/modules/formula_recognition/trainer.py +123 -0
paddlex/modules/general_recognition/__init__.py +18 -0
paddlex/modules/general_recognition/dataset_checker/__init__.py +107 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/analyse_dataset.py +96 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/check_dataset.py +99 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/convert_dataset.py +100 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/split_dataset.py +82 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/utils/visualizer.py +147 -0
paddlex/modules/general_recognition/evaluator.py +31 -0
paddlex/modules/general_recognition/exportor.py +22 -0
paddlex/modules/general_recognition/model_list.py +19 -0
paddlex/modules/general_recognition/trainer.py +52 -0
paddlex/modules/image_classification/__init__.py +18 -0
paddlex/modules/image_classification/dataset_checker/__init__.py +104 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/analyse_dataset.py +92 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/check_dataset.py +132 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/convert_dataset.py +51 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/split_dataset.py +81 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/utils/visualizer.py +153 -0
paddlex/modules/image_classification/evaluator.py +43 -0
paddlex/modules/image_classification/exportor.py +22 -0
paddlex/modules/image_classification/model_list.py +99 -0
paddlex/modules/image_classification/trainer.py +82 -0
paddlex/modules/image_unwarping/__init__.py +13 -0
paddlex/modules/image_unwarping/model_list.py +17 -0
paddlex/modules/instance_segmentation/__init__.py +18 -0
paddlex/modules/instance_segmentation/dataset_checker/__init__.py +107 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/analyse_dataset.py +82 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/check_dataset.py +95 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/convert_dataset.py +241 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/split_dataset.py +122 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/utils/visualizer.py +223 -0
paddlex/modules/instance_segmentation/evaluator.py +32 -0
paddlex/modules/instance_segmentation/exportor.py +22 -0
paddlex/modules/instance_segmentation/model_list.py +33 -0
paddlex/modules/instance_segmentation/trainer.py +31 -0
paddlex/modules/keypoint_detection/__init__.py +18 -0
paddlex/modules/keypoint_detection/dataset_checker/__init__.py +56 -0
paddlex/modules/keypoint_detection/dataset_checker/dataset_src/__init__.py +15 -0
paddlex/modules/keypoint_detection/dataset_checker/dataset_src/check_dataset.py +91 -0
paddlex/modules/keypoint_detection/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/keypoint_detection/dataset_checker/dataset_src/utils/visualizer.py +124 -0
paddlex/modules/keypoint_detection/evaluator.py +41 -0
paddlex/modules/keypoint_detection/exportor.py +22 -0
paddlex/modules/keypoint_detection/model_list.py +16 -0
paddlex/modules/keypoint_detection/trainer.py +39 -0
paddlex/modules/m_3d_bev_detection/__init__.py +18 -0
paddlex/modules/m_3d_bev_detection/dataset_checker/__init__.py +95 -0
paddlex/modules/m_3d_bev_detection/dataset_checker/dataset_src/__init__.py +17 -0
paddlex/modules/m_3d_bev_detection/dataset_checker/dataset_src/analyse_dataset.py +106 -0
paddlex/modules/m_3d_bev_detection/dataset_checker/dataset_src/check_dataset.py +101 -0
paddlex/modules/m_3d_bev_detection/evaluator.py +46 -0
paddlex/modules/m_3d_bev_detection/exportor.py +22 -0
paddlex/modules/m_3d_bev_detection/model_list.py +18 -0
paddlex/modules/m_3d_bev_detection/trainer.py +68 -0
paddlex/modules/multilabel_classification/__init__.py +18 -0
paddlex/modules/multilabel_classification/dataset_checker/__init__.py +106 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/analyse_dataset.py +94 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/check_dataset.py +132 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/convert_dataset.py +120 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/split_dataset.py +81 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/utils/visualizer.py +149 -0
paddlex/modules/multilabel_classification/evaluator.py +43 -0
paddlex/modules/multilabel_classification/exportor.py +22 -0
paddlex/modules/multilabel_classification/model_list.py +24 -0
paddlex/modules/multilabel_classification/trainer.py +85 -0
paddlex/modules/multilingual_speech_recognition/__init__.py +18 -0
paddlex/modules/multilingual_speech_recognition/dataset_checker.py +27 -0
paddlex/modules/multilingual_speech_recognition/evaluator.py +27 -0
paddlex/modules/multilingual_speech_recognition/exportor.py +27 -0
paddlex/modules/multilingual_speech_recognition/model_list.py +22 -0
paddlex/modules/multilingual_speech_recognition/trainer.py +42 -0
paddlex/modules/object_detection/__init__.py +18 -0
paddlex/modules/object_detection/dataset_checker/__init__.py +106 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/analyse_dataset.py +82 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/check_dataset.py +91 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/convert_dataset.py +438 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/split_dataset.py +123 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/utils/visualizer.py +193 -0
paddlex/modules/object_detection/evaluator.py +57 -0
paddlex/modules/object_detection/exportor.py +22 -0
paddlex/modules/object_detection/model_list.py +86 -0
paddlex/modules/object_detection/trainer.py +98 -0
paddlex/modules/open_vocabulary_detection/__init__.py +18 -0
paddlex/modules/open_vocabulary_detection/dataset_checker.py +29 -0
paddlex/modules/open_vocabulary_detection/evaluator.py +29 -0
paddlex/modules/open_vocabulary_detection/exportor.py +29 -0
paddlex/modules/open_vocabulary_detection/model_list.py +16 -0
paddlex/modules/open_vocabulary_detection/trainer.py +44 -0
paddlex/modules/open_vocabulary_segmentation/__init__.py +18 -0
paddlex/modules/open_vocabulary_segmentation/dataset_checker.py +29 -0
paddlex/modules/open_vocabulary_segmentation/evaluator.py +29 -0
paddlex/modules/open_vocabulary_segmentation/exportor.py +29 -0
paddlex/modules/open_vocabulary_segmentation/model_list.py +19 -0
paddlex/modules/open_vocabulary_segmentation/trainer.py +44 -0
paddlex/modules/semantic_segmentation/__init__.py +18 -0
paddlex/modules/semantic_segmentation/dataset_checker/__init__.py +109 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/analyse_dataset.py +76 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/check_dataset.py +80 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/convert_dataset.py +165 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/split_dataset.py +87 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/utils/visualizer.py +75 -0
paddlex/modules/semantic_segmentation/evaluator.py +58 -0
paddlex/modules/semantic_segmentation/exportor.py +31 -0
paddlex/modules/semantic_segmentation/model_list.py +37 -0
paddlex/modules/semantic_segmentation/trainer.py +72 -0
paddlex/modules/table_recognition/__init__.py +18 -0
paddlex/modules/table_recognition/dataset_checker/__init__.py +98 -0
paddlex/modules/table_recognition/dataset_checker/dataset_src/__init__.py +18 -0
paddlex/modules/table_recognition/dataset_checker/dataset_src/analyse_dataset.py +59 -0
paddlex/modules/table_recognition/dataset_checker/dataset_src/check_dataset.py +87 -0
paddlex/modules/table_recognition/dataset_checker/dataset_src/split_dataset.py +80 -0
paddlex/modules/table_recognition/evaluator.py +43 -0
paddlex/modules/table_recognition/exportor.py +22 -0
paddlex/modules/table_recognition/model_list.py +21 -0
paddlex/modules/table_recognition/trainer.py +67 -0
paddlex/modules/text_detection/__init__.py +18 -0
paddlex/modules/text_detection/dataset_checker/__init__.py +107 -0
paddlex/modules/text_detection/dataset_checker/dataset_src/__init__.py +18 -0
paddlex/modules/text_detection/dataset_checker/dataset_src/analyse_dataset.py +220 -0
paddlex/modules/text_detection/dataset_checker/dataset_src/check_dataset.py +106 -0
paddlex/modules/text_detection/dataset_checker/dataset_src/split_dataset.py +140 -0
paddlex/modules/text_detection/evaluator.py +41 -0
paddlex/modules/text_detection/exportor.py +22 -0
paddlex/modules/text_detection/model_list.py +26 -0
paddlex/modules/text_detection/trainer.py +65 -0
paddlex/modules/text_recognition/__init__.py +18 -0
paddlex/modules/text_recognition/dataset_checker/__init__.py +125 -0
paddlex/modules/text_recognition/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/text_recognition/dataset_checker/dataset_src/analyse_dataset.py +162 -0
paddlex/modules/text_recognition/dataset_checker/dataset_src/check_dataset.py +104 -0
paddlex/modules/text_recognition/dataset_checker/dataset_src/convert_dataset.py +95 -0
paddlex/modules/text_recognition/dataset_checker/dataset_src/split_dataset.py +80 -0
paddlex/modules/text_recognition/evaluator.py +64 -0
paddlex/modules/text_recognition/exportor.py +22 -0
paddlex/modules/text_recognition/model_list.py +36 -0
paddlex/modules/text_recognition/trainer.py +105 -0
paddlex/modules/ts_anomaly_detection/__init__.py +19 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/__init__.py +111 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/analyse_dataset.py +19 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/check_dataset.py +64 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/convert_dataset.py +74 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/split_dataset.py +63 -0
paddlex/modules/ts_anomaly_detection/evaluator.py +67 -0
paddlex/modules/ts_anomaly_detection/exportor.py +44 -0
paddlex/modules/ts_anomaly_detection/model_list.py +22 -0
paddlex/modules/ts_anomaly_detection/trainer.py +113 -0
paddlex/modules/ts_classification/__init__.py +19 -0
paddlex/modules/ts_classification/dataset_checker/__init__.py +111 -0
paddlex/modules/ts_classification/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/ts_classification/dataset_checker/dataset_src/analyse_dataset.py +77 -0
paddlex/modules/ts_classification/dataset_checker/dataset_src/check_dataset.py +64 -0
paddlex/modules/ts_classification/dataset_checker/dataset_src/convert_dataset.py +74 -0
paddlex/modules/ts_classification/dataset_checker/dataset_src/split_dataset.py +88 -0
paddlex/modules/ts_classification/evaluator.py +66 -0
paddlex/modules/ts_classification/exportor.py +44 -0
paddlex/modules/ts_classification/model_list.py +18 -0
paddlex/modules/ts_classification/trainer.py +108 -0
paddlex/modules/ts_forecast/__init__.py +19 -0
paddlex/modules/ts_forecast/dataset_checker/__init__.py +111 -0
paddlex/modules/ts_forecast/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/ts_forecast/dataset_checker/dataset_src/analyse_dataset.py +19 -0
paddlex/modules/ts_forecast/dataset_checker/dataset_src/check_dataset.py +64 -0
paddlex/modules/ts_forecast/dataset_checker/dataset_src/convert_dataset.py +73 -0
paddlex/modules/ts_forecast/dataset_checker/dataset_src/split_dataset.py +63 -0
paddlex/modules/ts_forecast/evaluator.py +66 -0
paddlex/modules/ts_forecast/exportor.py +44 -0
paddlex/modules/ts_forecast/model_list.py +24 -0
paddlex/modules/ts_forecast/trainer.py +108 -0
paddlex/modules/video_classification/__init__.py +18 -0
paddlex/modules/video_classification/dataset_checker/__init__.py +93 -0
paddlex/modules/video_classification/dataset_checker/dataset_src/__init__.py +18 -0
paddlex/modules/video_classification/dataset_checker/dataset_src/analyse_dataset.py +93 -0
paddlex/modules/video_classification/dataset_checker/dataset_src/check_dataset.py +120 -0
paddlex/modules/video_classification/dataset_checker/dataset_src/split_dataset.py +82 -0
paddlex/modules/video_classification/evaluator.py +44 -0
paddlex/modules/video_classification/exportor.py +22 -0
paddlex/modules/video_classification/model_list.py +19 -0
paddlex/modules/video_classification/trainer.py +88 -0
paddlex/modules/video_detection/__init__.py +18 -0
paddlex/modules/video_detection/dataset_checker/__init__.py +86 -0
paddlex/modules/video_detection/dataset_checker/dataset_src/__init__.py +17 -0
paddlex/modules/video_detection/dataset_checker/dataset_src/analyse_dataset.py +100 -0
paddlex/modules/video_detection/dataset_checker/dataset_src/check_dataset.py +132 -0
paddlex/modules/video_detection/evaluator.py +42 -0
paddlex/modules/video_detection/exportor.py +22 -0
paddlex/modules/video_detection/model_list.py +15 -0
paddlex/modules/video_detection/trainer.py +82 -0
paddlex/ops/__init__.py +152 -0
paddlex/ops/iou3d_nms/iou3d_cpu.cpp +266 -0
paddlex/ops/iou3d_nms/iou3d_cpu.h +28 -0
paddlex/ops/iou3d_nms/iou3d_nms.cpp +206 -0
paddlex/ops/iou3d_nms/iou3d_nms.h +35 -0
paddlex/ops/iou3d_nms/iou3d_nms_api.cpp +114 -0
paddlex/ops/iou3d_nms/iou3d_nms_kernel.cu +484 -0
paddlex/ops/setup.py +37 -0
paddlex/ops/voxel/voxelize_op.cc +194 -0
paddlex/ops/voxel/voxelize_op.cu +346 -0
paddlex/paddlex_cli.py +476 -0
paddlex/repo_apis/Paddle3D_api/__init__.py +17 -0
paddlex/repo_apis/Paddle3D_api/bev_fusion/__init__.py +18 -0
paddlex/repo_apis/Paddle3D_api/bev_fusion/config.py +118 -0
paddlex/repo_apis/Paddle3D_api/bev_fusion/model.py +238 -0
paddlex/repo_apis/Paddle3D_api/bev_fusion/register.py +55 -0
paddlex/repo_apis/Paddle3D_api/bev_fusion/runner.py +104 -0
paddlex/repo_apis/Paddle3D_api/pp3d_config.py +145 -0
paddlex/repo_apis/PaddleClas_api/__init__.py +17 -0
paddlex/repo_apis/PaddleClas_api/cls/__init__.py +19 -0
paddlex/repo_apis/PaddleClas_api/cls/config.py +595 -0
paddlex/repo_apis/PaddleClas_api/cls/model.py +355 -0
paddlex/repo_apis/PaddleClas_api/cls/register.py +907 -0
paddlex/repo_apis/PaddleClas_api/cls/runner.py +218 -0
paddlex/repo_apis/PaddleClas_api/shitu_rec/__init__.py +18 -0
paddlex/repo_apis/PaddleClas_api/shitu_rec/config.py +141 -0
paddlex/repo_apis/PaddleClas_api/shitu_rec/model.py +20 -0
paddlex/repo_apis/PaddleClas_api/shitu_rec/register.py +68 -0
paddlex/repo_apis/PaddleClas_api/shitu_rec/runner.py +50 -0
paddlex/repo_apis/PaddleDetection_api/__init__.py +17 -0
paddlex/repo_apis/PaddleDetection_api/config_helper.py +280 -0
paddlex/repo_apis/PaddleDetection_api/instance_seg/__init__.py +18 -0
paddlex/repo_apis/PaddleDetection_api/instance_seg/config.py +457 -0
paddlex/repo_apis/PaddleDetection_api/instance_seg/model.py +403 -0
paddlex/repo_apis/PaddleDetection_api/instance_seg/register.py +262 -0
paddlex/repo_apis/PaddleDetection_api/instance_seg/runner.py +225 -0
paddlex/repo_apis/PaddleDetection_api/object_det/__init__.py +19 -0
paddlex/repo_apis/PaddleDetection_api/object_det/config.py +540 -0
paddlex/repo_apis/PaddleDetection_api/object_det/model.py +429 -0
paddlex/repo_apis/PaddleDetection_api/object_det/official_categories.py +245 -0
paddlex/repo_apis/PaddleDetection_api/object_det/register.py +1135 -0
paddlex/repo_apis/PaddleDetection_api/object_det/runner.py +225 -0
paddlex/repo_apis/PaddleNLP_api/__init__.py +13 -0
paddlex/repo_apis/PaddleOCR_api/__init__.py +22 -0
paddlex/repo_apis/PaddleOCR_api/config_utils.py +53 -0
paddlex/repo_apis/PaddleOCR_api/formula_rec/__init__.py +16 -0
paddlex/repo_apis/PaddleOCR_api/formula_rec/config.py +571 -0
paddlex/repo_apis/PaddleOCR_api/formula_rec/model.py +398 -0
paddlex/repo_apis/PaddleOCR_api/formula_rec/register.py +99 -0
paddlex/repo_apis/PaddleOCR_api/formula_rec/runner.py +239 -0
paddlex/repo_apis/PaddleOCR_api/table_rec/__init__.py +16 -0
paddlex/repo_apis/PaddleOCR_api/table_rec/config.py +64 -0
paddlex/repo_apis/PaddleOCR_api/table_rec/model.py +126 -0
paddlex/repo_apis/PaddleOCR_api/table_rec/register.py +70 -0
paddlex/repo_apis/PaddleOCR_api/table_rec/runner.py +51 -0
paddlex/repo_apis/PaddleOCR_api/text_det/__init__.py +16 -0
paddlex/repo_apis/PaddleOCR_api/text_det/config.py +62 -0
paddlex/repo_apis/PaddleOCR_api/text_det/model.py +72 -0
paddlex/repo_apis/PaddleOCR_api/text_det/register.py +107 -0
paddlex/repo_apis/PaddleOCR_api/text_det/runner.py +53 -0
paddlex/repo_apis/PaddleOCR_api/text_rec/__init__.py +16 -0
paddlex/repo_apis/PaddleOCR_api/text_rec/config.py +564 -0
paddlex/repo_apis/PaddleOCR_api/text_rec/model.py +398 -0
paddlex/repo_apis/PaddleOCR_api/text_rec/register.py +216 -0
paddlex/repo_apis/PaddleOCR_api/text_rec/runner.py +239 -0
paddlex/repo_apis/PaddleSeg_api/__init__.py +16 -0
paddlex/repo_apis/PaddleSeg_api/base_seg_config.py +134 -0
paddlex/repo_apis/PaddleSeg_api/seg/__init__.py +16 -0
paddlex/repo_apis/PaddleSeg_api/seg/config.py +183 -0
paddlex/repo_apis/PaddleSeg_api/seg/model.py +491 -0
paddlex/repo_apis/PaddleSeg_api/seg/register.py +272 -0
paddlex/repo_apis/PaddleSeg_api/seg/runner.py +261 -0
paddlex/repo_apis/PaddleTS_api/__init__.py +20 -0
paddlex/repo_apis/PaddleTS_api/ts_ad/__init__.py +16 -0
paddlex/repo_apis/PaddleTS_api/ts_ad/config.py +88 -0
paddlex/repo_apis/PaddleTS_api/ts_ad/register.py +146 -0
paddlex/repo_apis/PaddleTS_api/ts_ad/runner.py +158 -0
paddlex/repo_apis/PaddleTS_api/ts_base/__init__.py +13 -0
paddlex/repo_apis/PaddleTS_api/ts_base/config.py +244 -0
paddlex/repo_apis/PaddleTS_api/ts_base/model.py +276 -0
paddlex/repo_apis/PaddleTS_api/ts_base/runner.py +158 -0
paddlex/repo_apis/PaddleTS_api/ts_cls/__init__.py +16 -0
paddlex/repo_apis/PaddleTS_api/ts_cls/config.py +72 -0
paddlex/repo_apis/PaddleTS_api/ts_cls/register.py +59 -0
paddlex/repo_apis/PaddleTS_api/ts_cls/runner.py +158 -0
paddlex/repo_apis/PaddleTS_api/ts_fc/__init__.py +16 -0
paddlex/repo_apis/PaddleTS_api/ts_fc/config.py +136 -0
paddlex/repo_apis/PaddleTS_api/ts_fc/register.py +186 -0
paddlex/repo_apis/PaddleVideo_api/__init__.py +17 -0
paddlex/repo_apis/PaddleVideo_api/config_utils.py +51 -0
paddlex/repo_apis/PaddleVideo_api/video_cls/__init__.py +19 -0
paddlex/repo_apis/PaddleVideo_api/video_cls/config.py +548 -0
paddlex/repo_apis/PaddleVideo_api/video_cls/model.py +346 -0
paddlex/repo_apis/PaddleVideo_api/video_cls/register.py +70 -0
paddlex/repo_apis/PaddleVideo_api/video_cls/runner.py +204 -0
paddlex/repo_apis/PaddleVideo_api/video_det/__init__.py +19 -0
paddlex/repo_apis/PaddleVideo_api/video_det/config.py +549 -0
paddlex/repo_apis/PaddleVideo_api/video_det/model.py +298 -0
paddlex/repo_apis/PaddleVideo_api/video_det/register.py +44 -0
paddlex/repo_apis/PaddleVideo_api/video_det/runner.py +199 -0
paddlex/repo_apis/__init__.py +13 -0
paddlex/repo_apis/base/__init__.py +22 -0
paddlex/repo_apis/base/config.py +237 -0
paddlex/repo_apis/base/model.py +563 -0
paddlex/repo_apis/base/register.py +135 -0
paddlex/repo_apis/base/runner.py +390 -0
paddlex/repo_apis/base/utils/__init__.py +13 -0
paddlex/repo_apis/base/utils/arg.py +64 -0
paddlex/repo_apis/base/utils/subprocess.py +107 -0
paddlex/repo_manager/__init__.py +17 -0
paddlex/repo_manager/core.py +253 -0
paddlex/repo_manager/meta.py +180 -0
paddlex/repo_manager/repo.py +425 -0
paddlex/repo_manager/utils.py +148 -0
paddlex/utils/__init__.py +1 -12
paddlex/utils/cache.py +146 -0
paddlex/utils/config.py +216 -0
paddlex/utils/custom_device_list.py +311 -0
paddlex/utils/deps.py +249 -0
paddlex/utils/device.py +195 -0
paddlex/utils/download.py +168 -182
paddlex/utils/env.py +31 -48
paddlex/utils/errors/__init__.py +17 -0
paddlex/utils/errors/dataset_checker.py +78 -0
paddlex/utils/errors/others.py +138 -0
paddlex/utils/file_interface.py +211 -0
paddlex/utils/flags.py +70 -0
paddlex/utils/fonts/__init__.py +97 -0
paddlex/utils/func_register.py +41 -0
paddlex/utils/install.py +87 -0
paddlex/utils/interactive_get_pipeline.py +55 -0
paddlex/utils/lazy_loader.py +68 -0
paddlex/utils/logging.py +140 -33
paddlex/utils/misc.py +201 -0
paddlex/utils/pipeline_arguments.py +719 -0
paddlex/utils/result_saver.py +58 -0
paddlex/utils/subclass_register.py +99 -0
paddlex/version.py +55 -0
paddlex-3.0.0.dist-info/METADATA +1168 -0
paddlex-3.0.0.dist-info/RECORD +1093 -0
paddlex-3.0.0.dist-info/WHEEL +5 -0
paddlex-3.0.0.dist-info/entry_points.txt +2 -0
paddlex-3.0.0.dist-info/licenses/LICENSE +169 -0
paddlex-3.0.0.dist-info/top_level.txt +1 -0
PaddleClas/__init__.py +0 -16
PaddleClas/paddleclas.py +0 -375
PaddleClas/ppcls/__init__.py +0 -20
PaddleClas/ppcls/data/__init__.py +0 -15
PaddleClas/ppcls/data/imaug/__init__.py +0 -94
PaddleClas/ppcls/data/imaug/autoaugment.py +0 -264
PaddleClas/ppcls/data/imaug/batch_operators.py +0 -117
PaddleClas/ppcls/data/imaug/cutout.py +0 -41
PaddleClas/ppcls/data/imaug/fmix.py +0 -217
PaddleClas/ppcls/data/imaug/grid.py +0 -89
PaddleClas/ppcls/data/imaug/hide_and_seek.py +0 -44
PaddleClas/ppcls/data/imaug/operators.py +0 -244
PaddleClas/ppcls/data/imaug/randaugment.py +0 -106
PaddleClas/ppcls/data/imaug/random_erasing.py +0 -55
PaddleClas/ppcls/data/reader.py +0 -318
PaddleClas/ppcls/modeling/__init__.py +0 -20
PaddleClas/ppcls/modeling/architectures/__init__.py +0 -51
PaddleClas/ppcls/modeling/architectures/alexnet.py +0 -132
PaddleClas/ppcls/modeling/architectures/darknet.py +0 -161
PaddleClas/ppcls/modeling/architectures/densenet.py +0 -308
PaddleClas/ppcls/modeling/architectures/distillation_models.py +0 -65
PaddleClas/ppcls/modeling/architectures/distilled_vision_transformer.py +0 -196
PaddleClas/ppcls/modeling/architectures/dpn.py +0 -425
PaddleClas/ppcls/modeling/architectures/efficientnet.py +0 -901
PaddleClas/ppcls/modeling/architectures/ghostnet.py +0 -331
PaddleClas/ppcls/modeling/architectures/googlenet.py +0 -207
PaddleClas/ppcls/modeling/architectures/hrnet.py +0 -742
PaddleClas/ppcls/modeling/architectures/inception_v3.py +0 -481
PaddleClas/ppcls/modeling/architectures/inception_v4.py +0 -455
PaddleClas/ppcls/modeling/architectures/mixnet.py +0 -782
PaddleClas/ppcls/modeling/architectures/mobilenet_v1.py +0 -266
PaddleClas/ppcls/modeling/architectures/mobilenet_v2.py +0 -248
PaddleClas/ppcls/modeling/architectures/mobilenet_v3.py +0 -359
PaddleClas/ppcls/modeling/architectures/regnet.py +0 -383
PaddleClas/ppcls/modeling/architectures/repvgg.py +0 -339
PaddleClas/ppcls/modeling/architectures/res2net.py +0 -272
PaddleClas/ppcls/modeling/architectures/res2net_vd.py +0 -295
PaddleClas/ppcls/modeling/architectures/resnest.py +0 -705
PaddleClas/ppcls/modeling/architectures/resnet.py +0 -316
PaddleClas/ppcls/modeling/architectures/resnet_vc.py +0 -309
PaddleClas/ppcls/modeling/architectures/resnet_vd.py +0 -354
PaddleClas/ppcls/modeling/architectures/resnext.py +0 -253
PaddleClas/ppcls/modeling/architectures/resnext101_wsl.py +0 -447
PaddleClas/ppcls/modeling/architectures/resnext_vd.py +0 -266
PaddleClas/ppcls/modeling/architectures/rexnet.py +0 -240
PaddleClas/ppcls/modeling/architectures/se_resnet_vd.py +0 -378
PaddleClas/ppcls/modeling/architectures/se_resnext.py +0 -290
PaddleClas/ppcls/modeling/architectures/se_resnext_vd.py +0 -285
PaddleClas/ppcls/modeling/architectures/shufflenet_v2.py +0 -320
PaddleClas/ppcls/modeling/architectures/squeezenet.py +0 -154
PaddleClas/ppcls/modeling/architectures/vgg.py +0 -152
PaddleClas/ppcls/modeling/architectures/vision_transformer.py +0 -402
PaddleClas/ppcls/modeling/architectures/xception.py +0 -345
PaddleClas/ppcls/modeling/architectures/xception_deeplab.py +0 -386
PaddleClas/ppcls/modeling/loss.py +0 -154
PaddleClas/ppcls/modeling/utils.py +0 -53
PaddleClas/ppcls/optimizer/__init__.py +0 -19
PaddleClas/ppcls/optimizer/learning_rate.py +0 -159
PaddleClas/ppcls/optimizer/optimizer.py +0 -165
PaddleClas/ppcls/utils/__init__.py +0 -27
PaddleClas/ppcls/utils/check.py +0 -151
PaddleClas/ppcls/utils/config.py +0 -201
PaddleClas/ppcls/utils/logger.py +0 -120
PaddleClas/ppcls/utils/metrics.py +0 -107
PaddleClas/ppcls/utils/misc.py +0 -62
PaddleClas/ppcls/utils/model_zoo.py +0 -213
PaddleClas/ppcls/utils/save_load.py +0 -163
PaddleClas/setup.py +0 -55
PaddleClas/tools/__init__.py +0 -15
PaddleClas/tools/download.py +0 -50
PaddleClas/tools/ema.py +0 -58
PaddleClas/tools/eval.py +0 -112
PaddleClas/tools/export_model.py +0 -85
PaddleClas/tools/export_serving_model.py +0 -76
PaddleClas/tools/infer/__init__.py +0 -16
PaddleClas/tools/infer/infer.py +0 -94
PaddleClas/tools/infer/predict.py +0 -117
PaddleClas/tools/infer/utils.py +0 -233
PaddleClas/tools/program.py +0 -444
PaddleClas/tools/test_hubserving.py +0 -113
PaddleClas/tools/train.py +0 -141
paddlex/cls.py +0 -76
paddlex/command.py +0 -215
paddlex/cv/__init__.py +0 -17
paddlex/cv/datasets/__init__.py +0 -18
paddlex/cv/datasets/coco.py +0 -169
paddlex/cv/datasets/imagenet.py +0 -88
paddlex/cv/datasets/seg_dataset.py +0 -91
paddlex/cv/datasets/voc.py +0 -301
paddlex/cv/models/__init__.py +0 -18
paddlex/cv/models/base.py +0 -623
paddlex/cv/models/classifier.py +0 -814
paddlex/cv/models/detector.py +0 -1747
paddlex/cv/models/load_model.py +0 -126
paddlex/cv/models/segmenter.py +0 -673
paddlex/cv/models/slim/__init__.py +0 -13
paddlex/cv/models/slim/prune.py +0 -55
paddlex/cv/models/utils/__init__.py +0 -13
paddlex/cv/models/utils/det_metrics/__init__.py +0 -15
paddlex/cv/models/utils/det_metrics/coco_utils.py +0 -217
paddlex/cv/models/utils/det_metrics/metrics.py +0 -220
paddlex/cv/models/utils/ema.py +0 -48
paddlex/cv/models/utils/seg_metrics.py +0 -62
paddlex/cv/models/utils/visualize.py +0 -394
paddlex/cv/transforms/__init__.py +0 -46
paddlex/cv/transforms/batch_operators.py +0 -286
paddlex/cv/transforms/box_utils.py +0 -41
paddlex/cv/transforms/functions.py +0 -193
paddlex/cv/transforms/operators.py +0 -1402
paddlex/det.py +0 -43
paddlex/paddleseg/__init__.py +0 -17
paddlex/paddleseg/core/__init__.py +0 -20
paddlex/paddleseg/core/infer.py +0 -289
paddlex/paddleseg/core/predict.py +0 -145
paddlex/paddleseg/core/train.py +0 -258
paddlex/paddleseg/core/val.py +0 -172
paddlex/paddleseg/cvlibs/__init__.py +0 -17
paddlex/paddleseg/cvlibs/callbacks.py +0 -279
paddlex/paddleseg/cvlibs/config.py +0 -359
paddlex/paddleseg/cvlibs/manager.py +0 -142
paddlex/paddleseg/cvlibs/param_init.py +0 -91
paddlex/paddleseg/datasets/__init__.py +0 -21
paddlex/paddleseg/datasets/ade.py +0 -112
paddlex/paddleseg/datasets/cityscapes.py +0 -86
paddlex/paddleseg/datasets/cocostuff.py +0 -79
paddlex/paddleseg/datasets/dataset.py +0 -164
paddlex/paddleseg/datasets/mini_deep_globe_road_extraction.py +0 -95
paddlex/paddleseg/datasets/optic_disc_seg.py +0 -97
paddlex/paddleseg/datasets/pascal_context.py +0 -80
paddlex/paddleseg/datasets/voc.py +0 -113
paddlex/paddleseg/models/__init__.py +0 -39
paddlex/paddleseg/models/ann.py +0 -436
paddlex/paddleseg/models/attention_unet.py +0 -189
paddlex/paddleseg/models/backbones/__init__.py +0 -18
paddlex/paddleseg/models/backbones/hrnet.py +0 -815
paddlex/paddleseg/models/backbones/mobilenetv3.py +0 -365
paddlex/paddleseg/models/backbones/resnet_vd.py +0 -364
paddlex/paddleseg/models/backbones/xception_deeplab.py +0 -415
paddlex/paddleseg/models/bisenet.py +0 -311
paddlex/paddleseg/models/danet.py +0 -220
paddlex/paddleseg/models/decoupled_segnet.py +0 -233
paddlex/paddleseg/models/deeplab.py +0 -258
paddlex/paddleseg/models/dnlnet.py +0 -231
paddlex/paddleseg/models/emanet.py +0 -219
paddlex/paddleseg/models/fast_scnn.py +0 -318
paddlex/paddleseg/models/fcn.py +0 -135
paddlex/paddleseg/models/gcnet.py +0 -223
paddlex/paddleseg/models/gscnn.py +0 -357
paddlex/paddleseg/models/hardnet.py +0 -309
paddlex/paddleseg/models/isanet.py +0 -202
paddlex/paddleseg/models/layers/__init__.py +0 -19
paddlex/paddleseg/models/layers/activation.py +0 -73
paddlex/paddleseg/models/layers/attention.py +0 -146
paddlex/paddleseg/models/layers/layer_libs.py +0 -168
paddlex/paddleseg/models/layers/nonlocal2d.py +0 -155
paddlex/paddleseg/models/layers/pyramid_pool.py +0 -182
paddlex/paddleseg/models/losses/__init__.py +0 -27
paddlex/paddleseg/models/losses/binary_cross_entropy_loss.py +0 -174
paddlex/paddleseg/models/losses/bootstrapped_cross_entropy.py +0 -73
paddlex/paddleseg/models/losses/cross_entropy_loss.py +0 -94
paddlex/paddleseg/models/losses/decoupledsegnet_relax_boundary_loss.py +0 -129
paddlex/paddleseg/models/losses/dice_loss.py +0 -61
paddlex/paddleseg/models/losses/edge_attention_loss.py +0 -78
paddlex/paddleseg/models/losses/gscnn_dual_task_loss.py +0 -141
paddlex/paddleseg/models/losses/l1_loss.py +0 -76
paddlex/paddleseg/models/losses/lovasz_loss.py +0 -222
paddlex/paddleseg/models/losses/mean_square_error_loss.py +0 -65
paddlex/paddleseg/models/losses/mixed_loss.py +0 -58
paddlex/paddleseg/models/losses/ohem_cross_entropy_loss.py +0 -99
paddlex/paddleseg/models/losses/ohem_edge_attention_loss.py +0 -114
paddlex/paddleseg/models/ocrnet.py +0 -248
paddlex/paddleseg/models/pspnet.py +0 -147
paddlex/paddleseg/models/sfnet.py +0 -236
paddlex/paddleseg/models/shufflenet_slim.py +0 -268
paddlex/paddleseg/models/u2net.py +0 -574
paddlex/paddleseg/models/unet.py +0 -155
paddlex/paddleseg/models/unet_3plus.py +0 -316
paddlex/paddleseg/models/unet_plusplus.py +0 -237
paddlex/paddleseg/transforms/__init__.py +0 -16
paddlex/paddleseg/transforms/functional.py +0 -161
paddlex/paddleseg/transforms/transforms.py +0 -937
paddlex/paddleseg/utils/__init__.py +0 -22
paddlex/paddleseg/utils/config_check.py +0 -60
paddlex/paddleseg/utils/download.py +0 -163
paddlex/paddleseg/utils/env/__init__.py +0 -16
paddlex/paddleseg/utils/env/seg_env.py +0 -56
paddlex/paddleseg/utils/env/sys_env.py +0 -122
paddlex/paddleseg/utils/logger.py +0 -48
paddlex/paddleseg/utils/metrics.py +0 -146
paddlex/paddleseg/utils/progbar.py +0 -212
paddlex/paddleseg/utils/timer.py +0 -53
paddlex/paddleseg/utils/utils.py +0 -120
paddlex/paddleseg/utils/visualize.py +0 -90
paddlex/ppcls/__init__.py +0 -20
paddlex/ppcls/data/__init__.py +0 -15
paddlex/ppcls/data/imaug/__init__.py +0 -94
paddlex/ppcls/data/imaug/autoaugment.py +0 -264
paddlex/ppcls/data/imaug/batch_operators.py +0 -117
paddlex/ppcls/data/imaug/cutout.py +0 -41
paddlex/ppcls/data/imaug/fmix.py +0 -217
paddlex/ppcls/data/imaug/grid.py +0 -89
paddlex/ppcls/data/imaug/hide_and_seek.py +0 -44
paddlex/ppcls/data/imaug/operators.py +0 -256
paddlex/ppcls/data/imaug/randaugment.py +0 -106
paddlex/ppcls/data/imaug/random_erasing.py +0 -55
paddlex/ppcls/data/reader.py +0 -318
paddlex/ppcls/modeling/__init__.py +0 -20
paddlex/ppcls/modeling/architectures/__init__.py +0 -51
paddlex/ppcls/modeling/architectures/alexnet.py +0 -132
paddlex/ppcls/modeling/architectures/darknet.py +0 -161
paddlex/ppcls/modeling/architectures/densenet.py +0 -308
paddlex/ppcls/modeling/architectures/distillation_models.py +0 -65
paddlex/ppcls/modeling/architectures/distilled_vision_transformer.py +0 -196
paddlex/ppcls/modeling/architectures/dpn.py +0 -425
paddlex/ppcls/modeling/architectures/efficientnet.py +0 -901
paddlex/ppcls/modeling/architectures/ghostnet.py +0 -331
paddlex/ppcls/modeling/architectures/googlenet.py +0 -207
paddlex/ppcls/modeling/architectures/hrnet.py +0 -742
paddlex/ppcls/modeling/architectures/inception_v3.py +0 -541
paddlex/ppcls/modeling/architectures/inception_v4.py +0 -455
paddlex/ppcls/modeling/architectures/mixnet.py +0 -782
paddlex/ppcls/modeling/architectures/mobilenet_v1.py +0 -266
paddlex/ppcls/modeling/architectures/mobilenet_v2.py +0 -248
paddlex/ppcls/modeling/architectures/mobilenet_v3.py +0 -359
paddlex/ppcls/modeling/architectures/regnet.py +0 -383
paddlex/ppcls/modeling/architectures/repvgg.py +0 -339
paddlex/ppcls/modeling/architectures/res2net.py +0 -272
paddlex/ppcls/modeling/architectures/res2net_vd.py +0 -295
paddlex/ppcls/modeling/architectures/resnest.py +0 -705
paddlex/ppcls/modeling/architectures/resnet.py +0 -317
paddlex/ppcls/modeling/architectures/resnet_vc.py +0 -309
paddlex/ppcls/modeling/architectures/resnet_vd.py +0 -354
paddlex/ppcls/modeling/architectures/resnext.py +0 -259
paddlex/ppcls/modeling/architectures/resnext101_wsl.py +0 -447
paddlex/ppcls/modeling/architectures/resnext_vd.py +0 -266
paddlex/ppcls/modeling/architectures/rexnet.py +0 -240
paddlex/ppcls/modeling/architectures/se_resnet_vd.py +0 -378
paddlex/ppcls/modeling/architectures/se_resnext.py +0 -290
paddlex/ppcls/modeling/architectures/se_resnext_vd.py +0 -285
paddlex/ppcls/modeling/architectures/shufflenet_v2.py +0 -320
paddlex/ppcls/modeling/architectures/squeezenet.py +0 -154
paddlex/ppcls/modeling/architectures/vgg.py +0 -152
paddlex/ppcls/modeling/architectures/vision_transformer.py +0 -402
paddlex/ppcls/modeling/architectures/xception.py +0 -345
paddlex/ppcls/modeling/architectures/xception_deeplab.py +0 -386
paddlex/ppcls/modeling/loss.py +0 -158
paddlex/ppcls/modeling/utils.py +0 -53
paddlex/ppcls/optimizer/__init__.py +0 -19
paddlex/ppcls/optimizer/learning_rate.py +0 -159
paddlex/ppcls/optimizer/optimizer.py +0 -165
paddlex/ppcls/utils/__init__.py +0 -27
paddlex/ppcls/utils/check.py +0 -151
paddlex/ppcls/utils/config.py +0 -201
paddlex/ppcls/utils/logger.py +0 -120
paddlex/ppcls/utils/metrics.py +0 -112
paddlex/ppcls/utils/misc.py +0 -62
paddlex/ppcls/utils/model_zoo.py +0 -213
paddlex/ppcls/utils/save_load.py +0 -163
paddlex/ppdet/__init__.py +0 -16
paddlex/ppdet/core/__init__.py +0 -15
paddlex/ppdet/core/config/__init__.py +0 -13
paddlex/ppdet/core/config/schema.py +0 -248
paddlex/ppdet/core/config/yaml_helpers.py +0 -118
paddlex/ppdet/core/workspace.py +0 -279
paddlex/ppdet/data/__init__.py +0 -21
paddlex/ppdet/data/reader.py +0 -304
paddlex/ppdet/data/shm_utils.py +0 -67
paddlex/ppdet/data/source/__init__.py +0 -27
paddlex/ppdet/data/source/category.py +0 -823
paddlex/ppdet/data/source/coco.py +0 -243
paddlex/ppdet/data/source/dataset.py +0 -192
paddlex/ppdet/data/source/keypoint_coco.py +0 -656
paddlex/ppdet/data/source/mot.py +0 -360
paddlex/ppdet/data/source/voc.py +0 -204
paddlex/ppdet/data/source/widerface.py +0 -180
paddlex/ppdet/data/transform/__init__.py +0 -28
paddlex/ppdet/data/transform/autoaugment_utils.py +0 -1593
paddlex/ppdet/data/transform/batch_operators.py +0 -758
paddlex/ppdet/data/transform/gridmask_utils.py +0 -83
paddlex/ppdet/data/transform/keypoint_operators.py +0 -665
paddlex/ppdet/data/transform/mot_operators.py +0 -636
paddlex/ppdet/data/transform/op_helper.py +0 -468
paddlex/ppdet/data/transform/operators.py +0 -2103
paddlex/ppdet/engine/__init__.py +0 -29
paddlex/ppdet/engine/callbacks.py +0 -262
paddlex/ppdet/engine/env.py +0 -47
paddlex/ppdet/engine/export_utils.py +0 -118
paddlex/ppdet/engine/tracker.py +0 -425
paddlex/ppdet/engine/trainer.py +0 -535
paddlex/ppdet/metrics/__init__.py +0 -23
paddlex/ppdet/metrics/coco_utils.py +0 -184
paddlex/ppdet/metrics/json_results.py +0 -151
paddlex/ppdet/metrics/keypoint_metrics.py +0 -202
paddlex/ppdet/metrics/map_utils.py +0 -396
paddlex/ppdet/metrics/metrics.py +0 -300
paddlex/ppdet/metrics/mot_eval_utils.py +0 -192
paddlex/ppdet/metrics/mot_metrics.py +0 -184
paddlex/ppdet/metrics/widerface_utils.py +0 -393
paddlex/ppdet/model_zoo/__init__.py +0 -18
paddlex/ppdet/model_zoo/model_zoo.py +0 -86
paddlex/ppdet/model_zoo/tests/__init__.py +0 -13
paddlex/ppdet/model_zoo/tests/test_get_model.py +0 -48
paddlex/ppdet/model_zoo/tests/test_list_model.py +0 -68
paddlex/ppdet/modeling/__init__.py +0 -41
paddlex/ppdet/modeling/architectures/__init__.py +0 -40
paddlex/ppdet/modeling/architectures/cascade_rcnn.py +0 -144
paddlex/ppdet/modeling/architectures/centernet.py +0 -103
paddlex/ppdet/modeling/architectures/deepsort.py +0 -111
paddlex/ppdet/modeling/architectures/fairmot.py +0 -107
paddlex/ppdet/modeling/architectures/faster_rcnn.py +0 -106
paddlex/ppdet/modeling/architectures/fcos.py +0 -105
paddlex/ppdet/modeling/architectures/jde.py +0 -125
paddlex/ppdet/modeling/architectures/keypoint_hrhrnet.py +0 -286
paddlex/ppdet/modeling/architectures/keypoint_hrnet.py +0 -203
paddlex/ppdet/modeling/architectures/mask_rcnn.py +0 -135
paddlex/ppdet/modeling/architectures/meta_arch.py +0 -45
paddlex/ppdet/modeling/architectures/s2anet.py +0 -103
paddlex/ppdet/modeling/architectures/solov2.py +0 -110
paddlex/ppdet/modeling/architectures/ssd.py +0 -84
paddlex/ppdet/modeling/architectures/ttfnet.py +0 -98
paddlex/ppdet/modeling/architectures/yolo.py +0 -104
paddlex/ppdet/modeling/backbones/__init__.py +0 -37
paddlex/ppdet/modeling/backbones/blazenet.py +0 -322
paddlex/ppdet/modeling/backbones/darknet.py +0 -341
paddlex/ppdet/modeling/backbones/dla.py +0 -244
paddlex/ppdet/modeling/backbones/ghostnet.py +0 -476
paddlex/ppdet/modeling/backbones/hrnet.py +0 -724
paddlex/ppdet/modeling/backbones/mobilenet_v1.py +0 -410
paddlex/ppdet/modeling/backbones/mobilenet_v3.py +0 -497
paddlex/ppdet/modeling/backbones/name_adapter.py +0 -69
paddlex/ppdet/modeling/backbones/res2net.py +0 -358
paddlex/ppdet/modeling/backbones/resnet.py +0 -606
paddlex/ppdet/modeling/backbones/senet.py +0 -140
paddlex/ppdet/modeling/backbones/vgg.py +0 -216
paddlex/ppdet/modeling/bbox_utils.py +0 -464
paddlex/ppdet/modeling/heads/__init__.py +0 -41
paddlex/ppdet/modeling/heads/bbox_head.py +0 -379
paddlex/ppdet/modeling/heads/cascade_head.py +0 -285
paddlex/ppdet/modeling/heads/centernet_head.py +0 -194
paddlex/ppdet/modeling/heads/face_head.py +0 -113
paddlex/ppdet/modeling/heads/fcos_head.py +0 -270
paddlex/ppdet/modeling/heads/keypoint_hrhrnet_head.py +0 -108
paddlex/ppdet/modeling/heads/mask_head.py +0 -253
paddlex/ppdet/modeling/heads/roi_extractor.py +0 -111
paddlex/ppdet/modeling/heads/s2anet_head.py +0 -845
paddlex/ppdet/modeling/heads/solov2_head.py +0 -537
paddlex/ppdet/modeling/heads/ssd_head.py +0 -175
paddlex/ppdet/modeling/heads/ttf_head.py +0 -314
paddlex/ppdet/modeling/heads/yolo_head.py +0 -124
paddlex/ppdet/modeling/keypoint_utils.py +0 -302
paddlex/ppdet/modeling/layers.py +0 -1142
paddlex/ppdet/modeling/losses/__init__.py +0 -35
paddlex/ppdet/modeling/losses/ctfocal_loss.py +0 -67
paddlex/ppdet/modeling/losses/fairmot_loss.py +0 -41
paddlex/ppdet/modeling/losses/fcos_loss.py +0 -225
paddlex/ppdet/modeling/losses/iou_aware_loss.py +0 -48
paddlex/ppdet/modeling/losses/iou_loss.py +0 -210
paddlex/ppdet/modeling/losses/jde_loss.py +0 -182
paddlex/ppdet/modeling/losses/keypoint_loss.py +0 -228
paddlex/ppdet/modeling/losses/solov2_loss.py +0 -101
paddlex/ppdet/modeling/losses/ssd_loss.py +0 -163
paddlex/ppdet/modeling/losses/yolo_loss.py +0 -212
paddlex/ppdet/modeling/mot/__init__.py +0 -25
paddlex/ppdet/modeling/mot/matching/__init__.py +0 -19
paddlex/ppdet/modeling/mot/matching/deepsort_matching.py +0 -382
paddlex/ppdet/modeling/mot/matching/jde_matching.py +0 -145
paddlex/ppdet/modeling/mot/motion/__init__.py +0 -17
paddlex/ppdet/modeling/mot/motion/kalman_filter.py +0 -270
paddlex/ppdet/modeling/mot/tracker/__init__.py +0 -23
paddlex/ppdet/modeling/mot/tracker/base_jde_tracker.py +0 -267
paddlex/ppdet/modeling/mot/tracker/base_sde_tracker.py +0 -145
paddlex/ppdet/modeling/mot/tracker/deepsort_tracker.py +0 -165
paddlex/ppdet/modeling/mot/tracker/jde_tracker.py +0 -262
paddlex/ppdet/modeling/mot/utils.py +0 -181
paddlex/ppdet/modeling/mot/visualization.py +0 -130
paddlex/ppdet/modeling/necks/__init__.py +0 -25
paddlex/ppdet/modeling/necks/centernet_fpn.py +0 -185
paddlex/ppdet/modeling/necks/fpn.py +0 -233
paddlex/ppdet/modeling/necks/hrfpn.py +0 -131
paddlex/ppdet/modeling/necks/ttf_fpn.py +0 -243
paddlex/ppdet/modeling/necks/yolo_fpn.py +0 -1034
paddlex/ppdet/modeling/ops.py +0 -1599
paddlex/ppdet/modeling/post_process.py +0 -449
paddlex/ppdet/modeling/proposal_generator/__init__.py +0 -2
paddlex/ppdet/modeling/proposal_generator/anchor_generator.py +0 -135
paddlex/ppdet/modeling/proposal_generator/proposal_generator.py +0 -81
paddlex/ppdet/modeling/proposal_generator/rpn_head.py +0 -269
paddlex/ppdet/modeling/proposal_generator/target.py +0 -671
paddlex/ppdet/modeling/proposal_generator/target_layer.py +0 -476
paddlex/ppdet/modeling/reid/__init__.py +0 -23
paddlex/ppdet/modeling/reid/fairmot_embedding_head.py +0 -117
paddlex/ppdet/modeling/reid/jde_embedding_head.py +0 -189
paddlex/ppdet/modeling/reid/pyramidal_embedding.py +0 -151
paddlex/ppdet/modeling/reid/resnet.py +0 -320
paddlex/ppdet/modeling/shape_spec.py +0 -33
paddlex/ppdet/modeling/tests/__init__.py +0 -13
paddlex/ppdet/modeling/tests/test_architectures.py +0 -59
paddlex/ppdet/modeling/tests/test_base.py +0 -75
paddlex/ppdet/modeling/tests/test_ops.py +0 -839
paddlex/ppdet/modeling/tests/test_yolov3_loss.py +0 -420
paddlex/ppdet/optimizer.py +0 -285
paddlex/ppdet/slim/__init__.py +0 -62
paddlex/ppdet/slim/distill.py +0 -111
paddlex/ppdet/slim/prune.py +0 -85
paddlex/ppdet/slim/quant.py +0 -52
paddlex/ppdet/utils/__init__.py +0 -13
paddlex/ppdet/utils/check.py +0 -93
paddlex/ppdet/utils/checkpoint.py +0 -216
paddlex/ppdet/utils/cli.py +0 -151
paddlex/ppdet/utils/colormap.py +0 -56
paddlex/ppdet/utils/download.py +0 -477
paddlex/ppdet/utils/logger.py +0 -71
paddlex/ppdet/utils/stats.py +0 -95
paddlex/ppdet/utils/visualizer.py +0 -292
paddlex/ppdet/utils/voc_utils.py +0 -87
paddlex/seg.py +0 -38
paddlex/tools/__init__.py +0 -16
paddlex/tools/convert.py +0 -52
paddlex/tools/dataset_conversion/__init__.py +0 -24
paddlex/tools/dataset_conversion/x2coco.py +0 -379
paddlex/tools/dataset_conversion/x2imagenet.py +0 -82
paddlex/tools/dataset_conversion/x2seg.py +0 -343
paddlex/tools/dataset_conversion/x2voc.py +0 -230
paddlex/tools/dataset_split/__init__.py +0 -23
paddlex/tools/dataset_split/coco_split.py +0 -69
paddlex/tools/dataset_split/imagenet_split.py +0 -75
paddlex/tools/dataset_split/seg_split.py +0 -96
paddlex/tools/dataset_split/utils.py +0 -75
paddlex/tools/dataset_split/voc_split.py +0 -91
paddlex/tools/split.py +0 -41
paddlex/utils/checkpoint.py +0 -439
paddlex/utils/shm.py +0 -67
paddlex/utils/stats.py +0 -68
paddlex/utils/utils.py +0 -140
paddlex-2.0.0rc4.dist-info/LICENSE +0 -201
paddlex-2.0.0rc4.dist-info/METADATA +0 -29
paddlex-2.0.0rc4.dist-info/RECORD +0 -445
paddlex-2.0.0rc4.dist-info/WHEEL +0 -5
paddlex-2.0.0rc4.dist-info/entry_points.txt +0 -3
paddlex-2.0.0rc4.dist-info/top_level.txt +0 -2

paddlex/inference/pipelines/layout_parsing/pipeline_v2.py ADDED Viewed

@@ -0,0 +1,1382 @@
+# Copyright (c) 2024 PaddlePaddle Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from __future__ import annotations
+import copy
+import re
+from typing import Any, Dict, List, Optional, Tuple, Union
+import numpy as np
+from PIL import Image
+from ....utils import logging
+from ....utils.deps import pipeline_requires_extra
+from ...common.batch_sampler import ImageBatchSampler
+from ...common.reader import ReadImage
+from ...models.object_detection.result import DetResult
+from ...utils.hpi import HPIConfig
+from ...utils.pp_option import PaddlePredictorOption
+from .._parallel import AutoParallelImageSimpleInferencePipeline
+from ..base import BasePipeline
+from ..ocr.result import OCRResult
+from .result_v2 import LayoutParsingBlock, LayoutParsingRegion, LayoutParsingResultV2
+from .setting import BLOCK_LABEL_MAP, BLOCK_SETTINGS, LINE_SETTINGS, REGION_SETTINGS
+from .utils import (
+    caculate_bbox_area,
+    calculate_minimum_enclosing_bbox,
+    calculate_overlap_ratio,
+    convert_formula_res_to_ocr_format,
+    format_line,
+    gather_imgs,
+    get_bbox_intersection,
+    get_sub_regions_ocr_res,
+    group_boxes_into_lines,
+    remove_overlap_blocks,
+    shrink_supplement_region_bbox,
+    split_boxes_by_projection,
+    update_region_box,
+)
+class _LayoutParsingPipelineV2(BasePipeline):
+    """Layout Parsing Pipeline V2"""
+    def __init__(
+        self,
+        config: dict,
+        device: str = None,
+        pp_option: PaddlePredictorOption = None,
+        use_hpip: bool = False,
+        hpi_config: Optional[Union[Dict[str, Any], HPIConfig]] = None,
+    ) -> None:
+        """Initializes the layout parsing pipeline.
+        Args:
+            config (Dict): Configuration dictionary containing various settings.
+            device (str, optional): Device to run the predictions on. Defaults to None.
+            pp_option (PaddlePredictorOption, optional): PaddlePredictor options. Defaults to None.
+            use_hpip (bool, optional): Whether to use the high-performance
+                inference plugin (HPIP) by default. Defaults to False.
+            hpi_config (Optional[Union[Dict[str, Any], HPIConfig]], optional):
+                The default high-performance inference configuration dictionary.
+                Defaults to None.
+        """
+        super().__init__(
+            device=device,
+            pp_option=pp_option,
+            use_hpip=use_hpip,
+            hpi_config=hpi_config,
+        )
+        self.inintial_predictor(config)
+        self.batch_sampler = ImageBatchSampler(batch_size=config.get("batch_size", 1))
+        self.img_reader = ReadImage(format="BGR")
+    def inintial_predictor(self, config: dict) -> None:
+        """Initializes the predictor based on the provided configuration.
+        Args:
+            config (Dict): A dictionary containing the configuration for the predictor.
+        Returns:
+            None
+        """
+        self.use_doc_preprocessor = config.get("use_doc_preprocessor", True)
+        self.use_table_recognition = config.get("use_table_recognition", True)
+        self.use_seal_recognition = config.get("use_seal_recognition", True)
+        self.use_region_detection = config.get(
+            "use_region_detection",
+            True,
+        )
+        self.use_formula_recognition = config.get(
+            "use_formula_recognition",
+            True,
+        )
+        self.use_chart_recognition = config.get(
+            "use_chart_recognition",
+            False,
+        )
+        if self.use_doc_preprocessor:
+            doc_preprocessor_config = config.get("SubPipelines", {}).get(
+                "DocPreprocessor",
+                {
+                    "pipeline_config_error": "config error for doc_preprocessor_pipeline!",
+                },
+            )
+            self.doc_preprocessor_pipeline = self.create_pipeline(
+                doc_preprocessor_config,
+            )
+        if self.use_region_detection:
+            region_detection_config = config.get("SubModules", {}).get(
+                "RegionDetection",
+                {
+                    "model_config_error": "config error for block_region_detection_model!"
+                },
+            )
+            self.region_detection_model = self.create_model(
+                region_detection_config,
+            )
+        layout_det_config = config.get("SubModules", {}).get(
+            "LayoutDetection",
+            {"model_config_error": "config error for layout_det_model!"},
+        )
+        layout_kwargs = {}
+        if (threshold := layout_det_config.get("threshold", None)) is not None:
+            layout_kwargs["threshold"] = threshold
+        if (layout_nms := layout_det_config.get("layout_nms", None)) is not None:
+            layout_kwargs["layout_nms"] = layout_nms
+        if (
+            layout_unclip_ratio := layout_det_config.get("layout_unclip_ratio", None)
+        ) is not None:
+            layout_kwargs["layout_unclip_ratio"] = layout_unclip_ratio
+        if (
+            layout_merge_bboxes_mode := layout_det_config.get(
+                "layout_merge_bboxes_mode", None
+            )
+        ) is not None:
+            layout_kwargs["layout_merge_bboxes_mode"] = layout_merge_bboxes_mode
+        self.layout_det_model = self.create_model(layout_det_config, **layout_kwargs)
+        general_ocr_config = config.get("SubPipelines", {}).get(
+            "GeneralOCR",
+            {"pipeline_config_error": "config error for general_ocr_pipeline!"},
+        )
+        self.general_ocr_pipeline = self.create_pipeline(
+            general_ocr_config,
+        )
+        if self.use_seal_recognition:
+            seal_recognition_config = config.get("SubPipelines", {}).get(
+                "SealRecognition",
+                {
+                    "pipeline_config_error": "config error for seal_recognition_pipeline!",
+                },
+            )
+            self.seal_recognition_pipeline = self.create_pipeline(
+                seal_recognition_config,
+            )
+        if self.use_table_recognition:
+            table_recognition_config = config.get("SubPipelines", {}).get(
+                "TableRecognition",
+                {
+                    "pipeline_config_error": "config error for table_recognition_pipeline!",
+                },
+            )
+            self.table_recognition_pipeline = self.create_pipeline(
+                table_recognition_config,
+            )
+        if self.use_formula_recognition:
+            formula_recognition_config = config.get("SubPipelines", {}).get(
+                "FormulaRecognition",
+                {
+                    "pipeline_config_error": "config error for formula_recognition_pipeline!",
+                },
+            )
+            self.formula_recognition_pipeline = self.create_pipeline(
+                formula_recognition_config,
+            )
+        if self.use_chart_recognition:
+            chart_recognition_config = config.get("SubModules", {}).get(
+                "ChartRecognition",
+                {
+                    "model_config_error": "config error for block_region_detection_model!"
+                },
+            )
+            self.chart_recognition_model = self.create_model(
+                chart_recognition_config,
+            )
+        return
+    def get_text_paragraphs_ocr_res(
+        self,
+        overall_ocr_res: OCRResult,
+        layout_det_res: DetResult,
+    ) -> OCRResult:
+        """
+        Retrieves the OCR results for text paragraphs, excluding those of formulas, tables, and seals.
+        Args:
+            overall_ocr_res (OCRResult): The overall OCR result containing text information.
+            layout_det_res (DetResult): The detection result containing the layout information of the document.
+        Returns:
+            OCRResult: The OCR result for text paragraphs after excluding formulas, tables, and seals.
+        """
+        object_boxes = []
+        for box_info in layout_det_res["boxes"]:
+            if box_info["label"].lower() in ["formula", "table", "seal"]:
+                object_boxes.append(box_info["coordinate"])
+        object_boxes = np.array(object_boxes)
+        sub_regions_ocr_res = get_sub_regions_ocr_res(
+            overall_ocr_res, object_boxes, flag_within=False
+        )
+        return sub_regions_ocr_res
+    def check_model_settings_valid(self, input_params: dict) -> bool:
+        """
+        Check if the input parameters are valid based on the initialized models.
+        Args:
+            input_params (Dict): A dictionary containing input parameters.
+        Returns:
+            bool: True if all required models are initialized according to input parameters, False otherwise.
+        """
+        if input_params["use_doc_preprocessor"] and not self.use_doc_preprocessor:
+            logging.error(
+                "Set use_doc_preprocessor, but the models for doc preprocessor are not initialized.",
+            )
+            return False
+        if input_params["use_seal_recognition"] and not self.use_seal_recognition:
+            logging.error(
+                "Set use_seal_recognition, but the models for seal recognition are not initialized.",
+            )
+            return False
+        if input_params["use_table_recognition"] and not self.use_table_recognition:
+            logging.error(
+                "Set use_table_recognition, but the models for table recognition are not initialized.",
+            )
+            return False
+        return True
+    def standardized_data(
+        self,
+        image: list,
+        region_det_res: DetResult,
+        layout_det_res: DetResult,
+        overall_ocr_res: OCRResult,
+        formula_res_list: list,
+        text_rec_model: Any,
+        text_rec_score_thresh: Union[float, None] = None,
+    ) -> Tuple[dict, DetResult, DetResult]:
+        """
+        Reconcile layout blocks, OCR entries and page regions and build the index maps that link them.
+        The method works in place on ``layout_det_res``, ``overall_ocr_res`` and
+        ``region_det_res`` and proceeds in these steps:
+            1. Remove overlapping layout blocks and merge the formula results into the OCR result.
+            2. Match every non formula/table/seal block to the OCR entries it contains.
+            3. Relabel footnotes that end above the lowest text block, and promote a lone
+               paragraph title to "doc_title" when it is large enough.
+            4. Re-recognize OCR entries that are shared by several blocks, once per block.
+            5. Recognize text directly from blocks that ended up without any text.
+            6. If no layout block exists, turn every OCR box into a "text" block.
+            7. Assign blocks to regions, adding "SupplementaryRegion" entries for blocks
+               that no detected region covers.
+        Args:
+            image (list): The input image. It is wrapped with ``np.array`` before cropping, and
+                ``image.shape`` is read when a supplementary region is shrunk, so an object
+                exposing ``shape`` is needed on that path.
+            region_det_res (DetResult): Region detection result; its "boxes" list is sorted,
+                updated and possibly extended in place.
+            layout_det_res (DetResult): Layout detection result; each entry of "boxes" provides
+                "coordinate" and "label".
+            overall_ocr_res (OCRResult): Overall OCR result. The keys "rec_boxes", "dt_polys",
+                "rec_polys", "rec_scores", "rec_texts" and "rec_labels" are read and updated.
+            formula_res_list (list): A list of formula recognition results.
+            text_rec_model (Any): The text recognition model. It is called with a list holding one
+                cropped image and must yield results with "rec_score" and "rec_text".
+            text_rec_score_thresh (Optional[float], optional): The score threshold for text recognition.
+                When None, ``self.general_ocr_pipeline.text_rec_score_thresh`` is used. Defaults to None.
+        Returns:
+            tuple: ``(region_block_ocr_idx_map, region_det_res, layout_det_res)`` where
+                ``region_block_ocr_idx_map`` is a dict with the keys "region_to_block_map"
+                (region index -> block indexes) and "block_to_ocr_map" (block index -> OCR indexes).
+        """
+        # OCR index -> indexes of the layout blocks that matched it
+        matched_ocr_dict = {}
+        region_to_block_map = {}
+        block_to_ocr_map = {}
+        # NOTE(review): object_boxes is filled below but never read in this method.
+        object_boxes = []
+        footnote_list = []
+        paragraph_title_list = []
+        bottom_text_y_max = 0
+        max_block_area = 0.0
+        doc_title_num = 0
+        # start from an inverted box so that the first update_region_box call takes effect
+        base_region_bbox = [65535, 65535, 0, 0]
+        layout_det_res = remove_overlap_blocks(
+            layout_det_res,
+            threshold=0.5,
+            smaller=True,
+        )
+        # convert formula_res_list to OCRResult format
+        # (the return value is ignored, so overall_ocr_res is presumably updated in place)
+        convert_formula_res_to_ocr_format(formula_res_list, overall_ocr_res)
+        # match layout boxes and ocr boxes and get some information for layout_order_config
+        for box_idx, box_info in enumerate(layout_det_res["boxes"]):
+            box = box_info["coordinate"]
+            label = box_info["label"].lower()
+            object_boxes.append(box)
+            _, _, _, y2 = box
+            # update the region box and max_block_area according to the layout boxes
+            base_region_bbox = update_region_box(box, base_region_bbox)
+            max_block_area = max(max_block_area, caculate_bbox_area(box))
+            # update_layout_order_config_block_index(layout_order_config, label, box_idx)
+            # remember footnotes and paragraph titles; they are relabelled after this loop
+            if label == "footnote":
+                footnote_list.append(box_idx)
+            elif label == "paragraph_title":
+                paragraph_title_list.append(box_idx)
+            if label == "text":
+                # lowest bottom edge among the text blocks
+                bottom_text_y_max = max(y2, bottom_text_y_max)
+            if label == "doc_title":
+                doc_title_num += 1
+            if label not in ["formula", "table", "seal"]:
+                # record which OCR entries fall into this block, in both directions
+                _, matched_idxes = get_sub_regions_ocr_res(
+                    overall_ocr_res, [box], return_match_idx=True
+                )
+                block_to_ocr_map[box_idx] = matched_idxes
+                for matched_idx in matched_idxes:
+                    if matched_ocr_dict.get(matched_idx, None) is None:
+                        matched_ocr_dict[matched_idx] = [box_idx]
+                    else:
+                        matched_ocr_dict[matched_idx].append(box_idx)
+        # fix the footnote label: a footnote whose bottom edge is above the lowest text block becomes "text"
+        for footnote_idx in footnote_list:
+            if (
+                layout_det_res["boxes"][footnote_idx]["coordinate"][3]
+                < bottom_text_y_max
+            ):
+                layout_det_res["boxes"][footnote_idx]["label"] = "text"
+        # check if there is only one paragraph title and without doc_title
+        only_one_paragraph_title = len(paragraph_title_list) == 1 and doc_title_num == 0
+        if only_one_paragraph_title:
+            paragraph_title_block_area = caculate_bbox_area(
+                layout_det_res["boxes"][paragraph_title_list[0]]["coordinate"]
+            )
+            title_area_max_block_threshold = BLOCK_SETTINGS.get(
+                "title_conversion_area_ratio_threshold", 0.3
+            )
+            # promote the lone title when it is large relative to the biggest block
+            if (
+                paragraph_title_block_area
+                > max_block_area * title_area_max_block_threshold
+            ):
+                layout_det_res["boxes"][paragraph_title_list[0]]["label"] = "doc_title"
+        # Re-recognize OCR entries that span several layout blocks, one crop per block.
+        for overall_ocr_idx, layout_box_ids in matched_ocr_dict.items():
+            if len(layout_box_ids) > 1:
+                # number of crops of this OCR entry that passed the score threshold so far
+                matched_no = 0
+                # copies are taken because the original entry may be overwritten below
+                overall_ocr_box = copy.deepcopy(
+                    overall_ocr_res["rec_boxes"][overall_ocr_idx]
+                )
+                overall_ocr_dt_poly = copy.deepcopy(
+                    overall_ocr_res["dt_polys"][overall_ocr_idx]
+                )
+                for box_idx in layout_box_ids:
+                    layout_box = layout_det_res["boxes"][box_idx]["coordinate"]
+                    crop_box = get_bbox_intersection(overall_ocr_box, layout_box)
+                    # blank the text of the block's OCR entries that mostly overlap the crop;
+                    # this happens before, and regardless of, the re-recognition result
+                    for ocr_idx in block_to_ocr_map[box_idx]:
+                        ocr_box = overall_ocr_res["rec_boxes"][ocr_idx]
+                        iou = calculate_overlap_ratio(ocr_box, crop_box, "small")
+                        if iou > 0.8:
+                            overall_ocr_res["rec_texts"][ocr_idx] = ""
+                    x1, y1, x2, y2 = [int(i) for i in crop_box]
+                    crop_img = np.array(image)[y1:y2, x1:x2]
+                    crop_img_rec_res = list(text_rec_model([crop_img]))[0]
+                    crop_img_dt_poly = get_bbox_intersection(
+                        overall_ocr_dt_poly, layout_box, return_format="poly"
+                    )
+                    crop_img_rec_score = crop_img_rec_res["rec_score"]
+                    crop_img_rec_text = crop_img_rec_res["rec_text"]
+                    # fall back to the OCR pipeline's threshold when none was given
+                    text_rec_score_thresh = (
+                        text_rec_score_thresh
+                        if text_rec_score_thresh is not None
+                        else (self.general_ocr_pipeline.text_rec_score_thresh)
+                    )
+                    if crop_img_rec_score >= text_rec_score_thresh:
+                        matched_no += 1
+                        if matched_no == 1:
+                            # the first accepted crop overwrites the original OCR entry
+                            overall_ocr_res["dt_polys"][
+                                overall_ocr_idx
+                            ] = crop_img_dt_poly
+                            overall_ocr_res["rec_boxes"][overall_ocr_idx] = crop_box
+                            overall_ocr_res["rec_polys"][
+                                overall_ocr_idx
+                            ] = crop_img_dt_poly
+                            overall_ocr_res["rec_scores"][
+                                overall_ocr_idx
+                            ] = crop_img_rec_score
+                            overall_ocr_res["rec_texts"][
+                                overall_ocr_idx
+                            ] = crop_img_rec_text
+                        else:
+                            # later accepted crops are appended as new OCR entries and the
+                            # block is re-pointed from the shared entry to the new one
+                            overall_ocr_res["dt_polys"].append(crop_img_dt_poly)
+                            overall_ocr_res["rec_boxes"] = np.vstack(
+                                (overall_ocr_res["rec_boxes"], crop_box)
+                            )
+                            overall_ocr_res["rec_polys"].append(crop_img_dt_poly)
+                            overall_ocr_res["rec_scores"].append(crop_img_rec_score)
+                            overall_ocr_res["rec_texts"].append(crop_img_rec_text)
+                            overall_ocr_res["rec_labels"].append("text")
+                            block_to_ocr_map[box_idx].remove(overall_ocr_idx)
+                            block_to_ocr_map[box_idx].append(
+                                len(overall_ocr_res["rec_texts"]) - 1
+                            )
+        # use layout bbox to do ocr recognition when there is no matched ocr
+        for layout_box_idx, overall_ocr_idxes in block_to_ocr_map.items():
+            has_text = False
+            for idx in overall_ocr_idxes:
+                if overall_ocr_res["rec_texts"][idx] != "":
+                    has_text = True
+                    break
+            # blocks whose label is listed under "vision_labels" are not sent to text recognition
+            if not has_text and layout_det_res["boxes"][layout_box_idx][
+                "label"
+            ] not in BLOCK_LABEL_MAP.get("vision_labels", []):
+                crop_box = layout_det_res["boxes"][layout_box_idx]["coordinate"]
+                x1, y1, x2, y2 = [int(i) for i in crop_box]
+                crop_img = np.array(image)[y1:y2, x1:x2]
+                crop_img_rec_res = next(text_rec_model([crop_img]))
+                # intersecting the box with itself only converts it to the "poly" format
+                crop_img_dt_poly = get_bbox_intersection(
+                    crop_box, crop_box, return_format="poly"
+                )
+                crop_img_rec_score = crop_img_rec_res["rec_score"]
+                crop_img_rec_text = crop_img_rec_res["rec_text"]
+                text_rec_score_thresh = (
+                    text_rec_score_thresh
+                    if text_rec_score_thresh is not None
+                    else (self.general_ocr_pipeline.text_rec_score_thresh)
+                )
+                if crop_img_rec_score >= text_rec_score_thresh:
+                    # NOTE(review): unlike the branch above, "dt_polys" is not extended here,
+                    # so it can end up shorter than the "rec_*" lists - confirm this is intended.
+                    overall_ocr_res["rec_boxes"] = np.vstack(
+                        (overall_ocr_res["rec_boxes"], crop_box)
+                    )
+                    overall_ocr_res["rec_polys"].append(crop_img_dt_poly)
+                    overall_ocr_res["rec_scores"].append(crop_img_rec_score)
+                    overall_ocr_res["rec_texts"].append(crop_img_rec_text)
+                    overall_ocr_res["rec_labels"].append("text")
+                    block_to_ocr_map[layout_box_idx].append(
+                        len(overall_ocr_res["rec_texts"]) - 1
+                    )
+        # when there is no layout detection result but there is ocr result, convert ocr detection result to layout detection result
+        if len(layout_det_res["boxes"]) == 0 and len(overall_ocr_res["rec_boxes"]) > 0:
+            for idx, ocr_rec_box in enumerate(overall_ocr_res["rec_boxes"]):
+                base_region_bbox = update_region_box(ocr_rec_box, base_region_bbox)
+                layout_det_res["boxes"].append(
+                    {
+                        "label": "text",
+                        "coordinate": ocr_rec_box,
+                        "score": overall_ocr_res["rec_scores"][idx],
+                    }
+                )
+                # block idx and OCR idx coincide because one block is created per OCR box
+                block_to_ocr_map[idx] = [idx]
+        block_bboxes = [box["coordinate"] for box in layout_det_res["boxes"]]
+        # regions are visited from smallest to largest area, so a block goes to the
+        # smallest region that covers it
+        region_det_res["boxes"] = sorted(
+            region_det_res["boxes"],
+            key=lambda item: caculate_bbox_area(item["coordinate"]),
+        )
+        if len(region_det_res["boxes"]) == 0:
+            # no detected region: one synthetic region spanning all blocks
+            region_det_res["boxes"] = [
+                {
+                    "coordinate": base_region_bbox,
+                    "label": "SupplementaryRegion",
+                    "score": 1,
+                }
+            ]
+            # NOTE(review): this value is a range object, while the other branch stores lists.
+            region_to_block_map[0] = range(len(block_bboxes))
+        else:
+            # block indexes that have not been assigned to a region yet
+            block_idxes_set = set(range(len(block_bboxes)))
+            # match block to region
+            for region_idx, region_info in enumerate(region_det_res["boxes"]):
+                matched_idxes = []
+                region_to_block_map[region_idx] = []
+                region_bbox = region_info["coordinate"]
+                for block_idx in block_idxes_set:
+                    overlap_ratio = calculate_overlap_ratio(
+                        region_bbox, block_bboxes[block_idx], mode="small"
+                    )
+                    if overlap_ratio > REGION_SETTINGS.get(
+                        "match_block_overlap_ratio_threshold", 0.8
+                    ):
+                        region_to_block_map[region_idx].append(block_idx)
+                        matched_idxes.append(block_idx)
+                if len(matched_idxes) > 0:
+                    # removal is deferred until after the iteration over the set above
+                    for block_idx in matched_idxes:
+                        block_idxes_set.remove(block_idx)
+                    # tighten the region to the minimum box enclosing its matched blocks
+                    matched_bboxes = [block_bboxes[idx] for idx in matched_idxes]
+                    new_region_bbox = calculate_minimum_enclosing_bbox(matched_bboxes)
+                    region_det_res["boxes"][region_idx]["coordinate"] = new_region_bbox
+            # Supplement region when there is no matched block
+            if len(block_idxes_set) > 0:
+                # each pass creates one supplementary region and removes its blocks from the pool
+                while len(block_idxes_set) > 0:
+                    matched_idxes = []
+                    unmatched_bboxes = [block_bboxes[idx] for idx in block_idxes_set]
+                    supplement_region_bbox = calculate_minimum_enclosing_bbox(
+                        unmatched_bboxes
+                    )
+                    # check if the new region bbox is overlapped with other region bbox, if have, then shrink the new region bbox
+                    # (matched_idxes is overwritten by every overlapping region, so the last one wins)
+                    for region_info in region_det_res["boxes"]:
+                        region_bbox = region_info["coordinate"]
+                        overlap_ratio = calculate_overlap_ratio(
+                            supplement_region_bbox, region_bbox
+                        )
+                        if overlap_ratio > 0:
+                            supplement_region_bbox, matched_idxes = (
+                                shrink_supplement_region_bbox(
+                                    supplement_region_bbox,
+                                    region_bbox,
+                                    image.shape[1],
+                                    image.shape[0],
+                                    block_idxes_set,
+                                    block_bboxes,
+                                )
+                            )
+                    # nothing selected by shrinking: take every remaining block, which ends the loop
+                    if len(matched_idxes) == 0:
+                        matched_idxes = list(block_idxes_set)
+                    region_idx = len(region_det_res["boxes"])
+                    region_to_block_map[region_idx] = list(matched_idxes)
+                    for block_idx in matched_idxes:
+                        block_idxes_set.remove(block_idx)
+                    region_det_res["boxes"].append(
+                        {
+                            "coordinate": supplement_region_bbox,
+                            "label": "SupplementaryRegion",
+                            "score": 1,
+                        }
+                    )
+        region_block_ocr_idx_map = dict(
+            region_to_block_map=region_to_block_map,
+            block_to_ocr_map=block_to_ocr_map,
+        )
+        return region_block_ocr_idx_map, region_det_res, layout_det_res
+    def sort_line_by_projection(
+        self,
+        line: List[List[Union[List[int], str]]],
+        input_img: np.ndarray,
+        text_rec_model: Any,
+        text_rec_score_thresh: Union[float, None] = None,
+        direction: str = "vertical",
+    ) -> None:
+        """
+        Sort a line of text spans based on their vertical position within the layout bounding box.
+        Args:
+            line (list): A list of spans, where each span is a list containing a bounding box and text.
+            input_img (ndarray): The input image used for OCR.
+            general_ocr_pipeline (Any): The general OCR pipeline used for text recognition.
+        Returns:
+            list: The sorted line of text spans.
+        """
+        sort_index = 0 if direction == "horizontal" else 1
+        splited_boxes = split_boxes_by_projection(line, direction)
+        splited_lines = []
+        if len(line) != len(splited_boxes):
+            splited_boxes.sort(key=lambda span: span[0][sort_index])
+            for span in splited_boxes:
+                bbox, text, label = span
+                if label == "text":
+                    crop_img = input_img[
+                        int(bbox[1]) : int(bbox[3]),
+                        int(bbox[0]) : int(bbox[2]),
+                    ]
+                    crop_img_rec_res = list(text_rec_model([crop_img]))[0]
+                    crop_img_rec_score = crop_img_rec_res["rec_score"]
+                    crop_img_rec_text = crop_img_rec_res["rec_text"]
+                    text = (
+                        crop_img_rec_text
+                        if crop_img_rec_score >= text_rec_score_thresh
+                        else ""
+                    )
+                    span[1] = text
+                splited_lines.append(span)
+        else:
+            splited_lines = line
+        return splited_lines
+    def get_block_rec_content(
+        self,
+        image: list,
+        ocr_rec_res: dict,
+        block: LayoutParsingBlock,
+        text_rec_model: Any,
+        text_rec_score_thresh: Union[float, None] = None,
+    ) -> LayoutParsingBlock:
+        """
+        Assemble the text content of a block from its OCR entries and store it on the block.
+        The OCR boxes are grouped into lines, every line is ordered and formatted, and
+        the formatted lines are joined with the delimiter configured for the block label.
+        Args:
+            image (list): The input image, passed to ``sort_line_by_projection`` for lines
+                that contain a formula.
+            ocr_rec_res (dict): OCR entries of this block. "rec_texts" is checked for emptiness,
+                "boxes" is read for "reference" blocks, and the whole dict is handed to
+                ``group_boxes_into_lines``.
+            block (LayoutParsingBlock): The block to fill; it is modified in place.
+            text_rec_model (Any): The text recognition model, forwarded to ``sort_line_by_projection``.
+            text_rec_score_thresh (Union[float, None]): Score threshold, forwarded to
+                ``sort_line_by_projection``. Defaults to None.
+        Returns:
+            LayoutParsingBlock: The same ``block`` object. With no OCR text only ``content`` is
+                set (to ""); otherwise ``content``, ``num_of_lines``, ``direction``,
+                ``text_line_height`` and ``text_line_width`` are set, plus the segment
+                coordinates described below.
+        """
+        # no recognized text: empty content, all other block attributes are left untouched
+        if len(ocr_rec_res["rec_texts"]) == 0:
+            block.content = ""
+            return block
+        lines, text_direction, text_line_height = group_boxes_into_lines(
+            ocr_rec_res,
+            LINE_SETTINGS.get("line_height_iou_threshold", 0.8),
+        )
+        # format line
+        text_lines = []
+        need_new_line_num = 0
+        # words start coordinate and stop coordinate in the line
+        # (bbox indexes 0/2 for horizontal text, 1/3 otherwise)
+        words_start_index = 0 if text_direction == "horizontal" else 1
+        words_stop_index = words_start_index + 2
+        # bbox index used as the secondary sort key inside a line
+        lines_start_index = 1 if text_direction == "horizontal" else 3
+        line_width_list = []
+        if block.label == "reference":
+            # reference blocks take their extent from the OCR boxes instead of the block bbox
+            rec_boxes = ocr_rec_res["boxes"]
+            block_start_coordinate = min([box[words_start_index] for box in rec_boxes])
+            block_stop_coordinate = max([box[words_stop_index] for box in rec_boxes])
+        else:
+            block_start_coordinate = block.bbox[words_start_index]
+            block_stop_coordinate = block.bbox[words_stop_index]
+        for idx, line in enumerate(lines):
+            # order the spans in place along the reading direction; the start coordinate is
+            # floor-divided by 2 so that spans within the same 2-unit bucket compare equal and
+            # fall back to the secondary key (negated for non-horizontal text)
+            line.sort(
+                key=lambda span: (
+                    span[0][words_start_index] // 2,
+                    (
+                        span[0][lines_start_index]
+                        if text_direction == "horizontal"
+                        else -span[0][lines_start_index]
+                    ),
+                )
+            )
+            # extent from the start of the first span to the stop of the last span
+            line_width = line[-1][0][words_stop_index] - line[0][0][words_start_index]
+            line_width_list.append(line_width)
+            # merge formula and text
+            ocr_labels = [span[2] for span in line]
+            if "formula" in ocr_labels:
+                # rebinds the local name only; the entry stored in `lines` keeps the sorted original
+                line = self.sort_line_by_projection(
+                    line, image, text_rec_model, text_rec_score_thresh, text_direction
+                )
+            # np.max covers only the lines processed so far, not the whole block
+            line_text, need_new_line = format_line(
+                line,
+                text_direction,
+                np.max(line_width_list),
+                block_start_coordinate,
+                block_stop_coordinate,
+                line_gap_limit=text_line_height * 1.5,
+                block_label=block.label,
+            )
+            if need_new_line:
+                need_new_line_num += 1
+            # NOTE(review): because of the `elif`, a block with a single line never gets
+            # seg_end_coordinate assigned here - confirm that is intended. Both coordinates
+            # use bbox indexes 0 and 2 regardless of the text direction.
+            if idx == 0:
+                line_start_coordinate = line[0][0][0]
+                block.seg_start_coordinate = line_start_coordinate
+            elif idx == len(lines) - 1:
+                line_end_coordinate = line[-1][0][2]
+                block.seg_end_coordinate = line_end_coordinate
+            text_lines.append(line_text)
+        # labels without a configured delimiter are joined with the empty string
+        delim = LINE_SETTINGS["delimiter_map"].get(block.label, "")
+        # when more than half of the lines ask for a line break and no delimiter is configured,
+        # drop the embedded newlines and join the lines with "\n" instead
+        if need_new_line_num > len(text_lines) * 0.5 and delim == "":
+            text_lines = [text.replace("\n", "") for text in text_lines]
+            delim = "\n"
+        content = delim.join(text_lines)
+        block.content = content
+        block.num_of_lines = len(text_lines)
+        block.direction = text_direction
+        block.text_line_height = text_line_height
+        block.text_line_width = np.mean(line_width_list)
+        return block
+    def get_layout_parsing_blocks(
+        self,
+        image: list,
+        region_block_ocr_idx_map: dict,
+        region_det_res: DetResult,
+        overall_ocr_res: OCRResult,
+        layout_det_res: DetResult,
+        table_res_list: list,
+        seal_res_list: list,
+        chart_res_list: list,
+        text_rec_model: Any,
+        text_rec_score_thresh: Union[float, None] = None,
+    ) -> list:
+        """
+        Extract structured information from OCR and layout detection results.
+        Args:
+            image (list): The input image.
+            overall_ocr_res (OCRResult): An object containing the overall OCR results, including detected text boxes and recognized text. The structure is expected to have:
+                - "input_img": The image on which OCR was performed.
+                - "dt_boxes": A list of detected text box coordinates.
+                - "rec_texts": A list of recognized text corresponding to the detected boxes.
+            layout_det_res (DetResult): An object containing the layout detection results, including detected layout boxes and their labels. The structure is expected to have:
+                - "boxes": A list of dictionaries with keys "coordinate" for box coordinates and "block_label" for the type of content.
+            table_res_list (list): A list of table detection results, where each item is a dictionary containing:
+                - "block_bbox": The bounding box of the table layout.
+                - "pred_html": The predicted HTML representation of the table.
+            seal_res_list (List): A list of seal detection results. The details of each item depend on the specific application context.
+            text_rec_model (Any): A model for text recognition.
+            text_rec_score_thresh (Union[float, None]): The minimum score required for a recognized character to be considered valid. If None, use the default value specified during initialization. Default is None.
+        Returns:
+            list: A list of structured boxes where each item is a dictionary containing:
+                - "block_label": The label of the content (e.g., 'table', 'chart', 'image').
+                - The label as a key with either table HTML or image data and text.
+                - "block_bbox": The coordinates of the layout box.
+        """
+        table_index = 0
+        seal_index = 0
+        chart_index = 0
+        layout_parsing_blocks: List[LayoutParsingBlock] = []
+        for box_idx, box_info in enumerate(layout_det_res["boxes"]):
+            label = box_info["label"]
+            block_bbox = box_info["coordinate"]
+            rec_res = {"boxes": [], "rec_texts": [], "rec_labels": []}
+            block = LayoutParsingBlock(label=label, bbox=block_bbox)
+            if label == "table" and len(table_res_list) > 0:
+                block.content = table_res_list[table_index]["pred_html"]
+                table_index += 1
+            elif label == "seal" and len(seal_res_list) > 0:
+                block.content = "\n".join(seal_res_list[seal_index]["rec_texts"])
+                seal_index += 1
+            elif label == "chart" and len(chart_res_list) > 0:
+                block.content = chart_res_list[chart_index]
+                chart_index += 1
+            else:
+                if label == "formula":
+                    _, ocr_idx_list = get_sub_regions_ocr_res(
+                        overall_ocr_res, [block_bbox], return_match_idx=True
+                    )
+                    region_block_ocr_idx_map["block_to_ocr_map"][box_idx] = ocr_idx_list
+                else:
+                    ocr_idx_list = region_block_ocr_idx_map["block_to_ocr_map"].get(
+                        box_idx, []
+                    )
+                for box_no in ocr_idx_list:
+                    rec_res["boxes"].append(overall_ocr_res["rec_boxes"][box_no])
+                    rec_res["rec_texts"].append(
+                        overall_ocr_res["rec_texts"][box_no],
+                    )
+                    rec_res["rec_labels"].append(
+                        overall_ocr_res["rec_labels"][box_no],
+                    )
+                block = self.get_block_rec_content(
+                    image=image,
+                    block=block,
+                    ocr_rec_res=rec_res,
+                    text_rec_model=text_rec_model,
+                    text_rec_score_thresh=text_rec_score_thresh,
+                )
+            if (
+                label
+                in ["seal", "table", "formula", "chart"]
+                + BLOCK_LABEL_MAP["image_labels"]
+            ):
+                x_min, y_min, x_max, y_max = list(map(int, block_bbox))
+                img_path = (
+                    f"imgs/img_in_{block.label}_box_{x_min}_{y_min}_{x_max}_{y_max}.jpg"
+                )
+                img = Image.fromarray(image[y_min:y_max, x_min:x_max, ::-1])
+                block.image = {"path": img_path, "img": img}
+            layout_parsing_blocks.append(block)
+        region_list: List[LayoutParsingRegion] = []
+        for region_idx, region_info in enumerate(region_det_res["boxes"]):
+            region_bbox = region_info["coordinate"]
+            region_blocks = [
+                layout_parsing_blocks[idx]
+                for idx in region_block_ocr_idx_map["region_to_block_map"][region_idx]
+            ]
+            region = LayoutParsingRegion(
+                bbox=region_bbox,
+                blocks=region_blocks,
+                image_shape=image.shape[:2],
+            )
+            region_list.append(region)
+        region_list = sorted(
+            region_list,
+            key=lambda r: (r.weighted_distance),
+        )
+        return region_list
+    def get_layout_parsing_res(
+        self,
+        image: list,
+        region_det_res: DetResult,
+        layout_det_res: DetResult,
+        overall_ocr_res: OCRResult,
+        table_res_list: list,
+        seal_res_list: list,
+        chart_res_list: list,
+        formula_res_list: list,
+        text_rec_score_thresh: Union[float, None] = None,
+    ) -> list:
+        """
+        Retrieves the layout parsing result based on the layout detection result, OCR result, and other recognition results.
+        Args:
+            image (list): The input image.
+            layout_det_res (DetResult): The detection result containing the layout information of the document.
+            overall_ocr_res (OCRResult): The overall OCR result containing text information.
+            table_res_list (list): A list of table recognition results.
+            seal_res_list (list): A list of seal recognition results.
+            formula_res_list (list): A list of formula recognition results.
+            text_rec_score_thresh (Optional[float], optional): The score threshold for text recognition. Defaults to None.
+        Returns:
+            list: A list of dictionaries representing the layout parsing result.
+        """
+        # Standardize data
+        region_block_ocr_idx_map, region_det_res, layout_det_res = (
+            self.standardized_data(
+                image=image,
+                region_det_res=region_det_res,
+                layout_det_res=layout_det_res,
+                overall_ocr_res=overall_ocr_res,
+                formula_res_list=formula_res_list,
+                text_rec_model=self.general_ocr_pipeline.text_rec_model,
+                text_rec_score_thresh=text_rec_score_thresh,
+            )
+        )
+        # Format layout parsing block
+        region_list = self.get_layout_parsing_blocks(
+            image=image,
+            region_block_ocr_idx_map=region_block_ocr_idx_map,
+            region_det_res=region_det_res,
+            overall_ocr_res=overall_ocr_res,
+            layout_det_res=layout_det_res,
+            table_res_list=table_res_list,
+            seal_res_list=seal_res_list,
+            chart_res_list=chart_res_list,
+            text_rec_model=self.general_ocr_pipeline.text_rec_model,
+            text_rec_score_thresh=self.general_ocr_pipeline.text_rec_score_thresh,
+        )
+        parsing_res_list = []
+        for region in region_list:
+            parsing_res_list.extend(region.sort())
+        index = 1
+        for block in parsing_res_list:
+            if block.label in BLOCK_LABEL_MAP["visualize_index_labels"]:
+                block.order_index = index
+                index += 1
+        return parsing_res_list
+    def get_model_settings(
+        self,
+        use_doc_orientation_classify: Union[bool, None],
+        use_doc_unwarping: Union[bool, None],
+        use_seal_recognition: Union[bool, None],
+        use_table_recognition: Union[bool, None],
+        use_formula_recognition: Union[bool, None],
+        use_chart_recognition: Union[bool, None],
+        use_region_detection: Union[bool, None],
+    ) -> dict:
+        """
+        Get the model settings based on the provided parameters or default values.
+        Args:
+            use_doc_orientation_classify (Union[bool, None]): Enables document orientation classification if True. Defaults to system setting if None.
+            use_doc_unwarping (Union[bool, None]): Enables document unwarping if True. Defaults to system setting if None.
+            use_seal_recognition (Union[bool, None]): Enables seal recognition if True. Defaults to system setting if None.
+            use_table_recognition (Union[bool, None]): Enables table recognition if True. Defaults to system setting if None.
+            use_formula_recognition (Union[bool, None]): Enables formula recognition if True. Defaults to system setting if None.
+        Returns:
+            dict: A dictionary containing the model settings.
+        """
+        if use_doc_orientation_classify is None and use_doc_unwarping is None:
+            use_doc_preprocessor = self.use_doc_preprocessor
+        else:
+            if use_doc_orientation_classify is True or use_doc_unwarping is True:
+                use_doc_preprocessor = True
+            else:
+                use_doc_preprocessor = False
+        if use_seal_recognition is None:
+            use_seal_recognition = self.use_seal_recognition
+        if use_table_recognition is None:
+            use_table_recognition = self.use_table_recognition
+        if use_formula_recognition is None:
+            use_formula_recognition = self.use_formula_recognition
+        if use_region_detection is None:
+            use_region_detection = self.use_region_detection
+        if use_chart_recognition is None:
+            use_chart_recognition = self.use_chart_recognition
+        return dict(
+            use_doc_preprocessor=use_doc_preprocessor,
+            use_seal_recognition=use_seal_recognition,
+            use_table_recognition=use_table_recognition,
+            use_formula_recognition=use_formula_recognition,
+            use_chart_recognition=use_chart_recognition,
+            use_region_detection=use_region_detection,
+        )
+    def predict(
+        self,
+        input: Union[str, list[str], np.ndarray, list[np.ndarray]],
+        use_doc_orientation_classify: Union[bool, None] = False,
+        use_doc_unwarping: Union[bool, None] = False,
+        use_textline_orientation: Optional[bool] = None,
+        use_seal_recognition: Union[bool, None] = None,
+        use_table_recognition: Union[bool, None] = None,
+        use_formula_recognition: Union[bool, None] = None,
+        use_chart_recognition: Union[bool, None] = False,
+        use_region_detection: Union[bool, None] = None,
+        layout_threshold: Optional[Union[float, dict]] = None,
+        layout_nms: Optional[bool] = None,
+        layout_unclip_ratio: Optional[Union[float, Tuple[float, float], dict]] = None,
+        layout_merge_bboxes_mode: Optional[str] = None,
+        text_det_limit_side_len: Union[int, None] = None,
+        text_det_limit_type: Union[str, None] = None,
+        text_det_thresh: Union[float, None] = None,
+        text_det_box_thresh: Union[float, None] = None,
+        text_det_unclip_ratio: Union[float, None] = None,
+        text_rec_score_thresh: Union[float, None] = None,
+        seal_det_limit_side_len: Union[int, None] = None,
+        seal_det_limit_type: Union[str, None] = None,
+        seal_det_thresh: Union[float, None] = None,
+        seal_det_box_thresh: Union[float, None] = None,
+        seal_det_unclip_ratio: Union[float, None] = None,
+        seal_rec_score_thresh: Union[float, None] = None,
+        use_wired_table_cells_trans_to_html: bool = False,
+        use_wireless_table_cells_trans_to_html: bool = False,
+        use_table_orientation_classify: bool = True,
+        use_ocr_results_with_table_cells: bool = True,
+        use_e2e_wired_table_rec_model: bool = False,
+        use_e2e_wireless_table_rec_model: bool = True,
+        **kwargs,
+    ) -> LayoutParsingResultV2:
+        """
+        Predicts the layout parsing result for the given input.
+        Args:
+            use_doc_orientation_classify (Optional[bool]): Whether to use document orientation classification.
+            use_doc_unwarping (Optional[bool]): Whether to use document unwarping.
+            use_textline_orientation (Optional[bool]): Whether to use textline orientation prediction.
+            use_seal_recognition (Optional[bool]): Whether to use seal recognition.
+            use_table_recognition (Optional[bool]): Whether to use table recognition.
+            use_formula_recognition (Optional[bool]): Whether to use formula recognition.
+            use_region_detection (Optional[bool]): Whether to use region detection.
+            layout_threshold (Optional[float]): The threshold value to filter out low-confidence predictions. Default is None.
+            layout_nms (bool, optional): Whether to use layout-aware NMS. Defaults to False.
+            layout_unclip_ratio (Optional[Union[float, Tuple[float, float]]], optional): The ratio of unclipping the bounding box.
+                Defaults to None.
+                If it's a single number, then both width and height are used.
+                If it's a tuple of two numbers, then they are used separately for width and height respectively.
+                If it's None, then no unclipping will be performed.
+            layout_merge_bboxes_mode (Optional[str], optional): The mode for merging bounding boxes. Defaults to None.
+            text_det_limit_side_len (Optional[int]): Maximum side length for text detection.
+            text_det_limit_type (Optional[str]): Type of limit to apply for text detection.
+            text_det_thresh (Optional[float]): Threshold for text detection.
+            text_det_box_thresh (Optional[float]): Threshold for text detection boxes.
+            text_det_unclip_ratio (Optional[float]): Ratio for unclipping text detection boxes.
+            text_rec_score_thresh (Optional[float]): Score threshold for text recognition.
+            seal_det_limit_side_len (Optional[int]): Maximum side length for seal detection.
+            seal_det_limit_type (Optional[str]): Type of limit to apply for seal detection.
+            seal_det_thresh (Optional[float]): Threshold for seal detection.
+            seal_det_box_thresh (Optional[float]): Threshold for seal detection boxes.
+            seal_det_unclip_ratio (Optional[float]): Ratio for unclipping seal detection boxes.
+            seal_rec_score_thresh (Optional[float]): Score threshold for seal recognition.
+            use_wired_table_cells_trans_to_html (bool): Whether to use wired table cells trans to HTML.
+            use_wireless_table_cells_trans_to_html (bool): Whether to use wireless table cells trans to HTML.
+            use_table_orientation_classify (bool): Whether to use table orientation classification.
+            use_ocr_results_with_table_cells (bool): Whether to use OCR results processed by table cells.
+            use_e2e_wired_table_rec_model (bool): Whether to use end-to-end wired table recognition model.
+            use_e2e_wireless_table_rec_model (bool): Whether to use end-to-end wireless table recognition model.
+            **kwargs (Any): Additional settings to extend functionality.
+        Returns:
+            LayoutParsingResultV2: The predicted layout parsing result.
+        """
+        model_settings = self.get_model_settings(
+            use_doc_orientation_classify,
+            use_doc_unwarping,
+            use_seal_recognition,
+            use_table_recognition,
+            use_formula_recognition,
+            use_chart_recognition,
+            use_region_detection,
+        )
+        if not self.check_model_settings_valid(model_settings):
+            yield {"error": "the input params for model settings are invalid!"}
+        for batch_data in self.batch_sampler(input):
+            image_arrays = self.img_reader(batch_data.instances)
+            if model_settings["use_doc_preprocessor"]:
+                doc_preprocessor_results = list(
+                    self.doc_preprocessor_pipeline(
+                        image_arrays,
+                        use_doc_orientation_classify=use_doc_orientation_classify,
+                        use_doc_unwarping=use_doc_unwarping,
+                    )
+                )
+            else:
+                doc_preprocessor_results = [{"output_img": arr} for arr in image_arrays]
+            doc_preprocessor_images = [
+                item["output_img"] for item in doc_preprocessor_results
+            ]
+            layout_det_results = list(
+                self.layout_det_model(
+                    doc_preprocessor_images,
+                    threshold=layout_threshold,
+                    layout_nms=layout_nms,
+                    layout_unclip_ratio=layout_unclip_ratio,
+                    layout_merge_bboxes_mode=layout_merge_bboxes_mode,
+                )
+            )
+            imgs_in_doc = [
+                gather_imgs(img, res["boxes"])
+                for img, res in zip(doc_preprocessor_images, layout_det_results)
+            ]
+            if model_settings["use_region_detection"]:
+                region_det_results = list(
+                    self.region_detection_model(
+                        doc_preprocessor_images,
+                        layout_nms=True,
+                        layout_merge_bboxes_mode="small",
+                    ),
+                )
+            else:
+                region_det_results = [{"boxes": []} for _ in doc_preprocessor_images]
+            if model_settings["use_formula_recognition"]:
+                formula_res_all = list(
+                    self.formula_recognition_pipeline(
+                        doc_preprocessor_images,
+                        use_layout_detection=False,
+                        use_doc_orientation_classify=False,
+                        use_doc_unwarping=False,
+                        layout_det_res=layout_det_results,
+                    ),
+                )
+                formula_res_lists = [
+                    item["formula_res_list"] for item in formula_res_all
+                ]
+            else:
+                formula_res_lists = [[] for _ in doc_preprocessor_images]
+            for doc_preprocessor_image, formula_res_list in zip(
+                doc_preprocessor_images, formula_res_lists
+            ):
+                for formula_res in formula_res_list:
+                    x_min, y_min, x_max, y_max = list(map(int, formula_res["dt_polys"]))
+                    doc_preprocessor_image[y_min:y_max, x_min:x_max, :] = 255.0
+            overall_ocr_results = list(
+                self.general_ocr_pipeline(
+                    doc_preprocessor_images,
+                    use_textline_orientation=use_textline_orientation,
+                    text_det_limit_side_len=text_det_limit_side_len,
+                    text_det_limit_type=text_det_limit_type,
+                    text_det_thresh=text_det_thresh,
+                    text_det_box_thresh=text_det_box_thresh,
+                    text_det_unclip_ratio=text_det_unclip_ratio,
+                    text_rec_score_thresh=text_rec_score_thresh,
+                ),
+            )
+            for overall_ocr_res in overall_ocr_results:
+                overall_ocr_res["rec_labels"] = ["text"] * len(
+                    overall_ocr_res["rec_texts"]
+                )
+            if model_settings["use_table_recognition"]:
+                table_res_lists = []
+                for (
+                    layout_det_res,
+                    doc_preprocessor_image,
+                    overall_ocr_res,
+                    formula_res_list,
+                    imgs_in_doc_for_img,
+                ) in zip(
+                    layout_det_results,
+                    doc_preprocessor_images,
+                    overall_ocr_results,
+                    formula_res_lists,
+                    imgs_in_doc,
+                ):
+                    table_contents_for_img = copy.deepcopy(overall_ocr_res)
+                    for formula_res in formula_res_list:
+                        x_min, y_min, x_max, y_max = list(
+                            map(int, formula_res["dt_polys"])
+                        )
+                        poly_points = [
+                            (x_min, y_min),
+                            (x_max, y_min),
+                            (x_max, y_max),
+                            (x_min, y_max),
+                        ]
+                        table_contents_for_img["dt_polys"].append(poly_points)
+                        rec_formula = formula_res["rec_formula"]
+                        if not rec_formula.startswith("$") or not rec_formula.endswith(
+                            "$"
+                        ):
+                            rec_formula = f"${rec_formula}$"
+                        table_contents_for_img["rec_texts"].append(f"{rec_formula}")
+                        if table_contents_for_img["rec_boxes"].size == 0:
+                            table_contents_for_img["rec_boxes"] = np.array(
+                                [formula_res["dt_polys"]]
+                            )
+                        else:
+                            table_contents_for_img["rec_boxes"] = np.vstack(
+                                (
+                                    table_contents_for_img["rec_boxes"],
+                                    [formula_res["dt_polys"]],
+                                )
+                            )
+                        table_contents_for_img["rec_polys"].append(poly_points)
+                        table_contents_for_img["rec_scores"].append(1)
+                    for img in imgs_in_doc_for_img:
+                        img_path = img["path"]
+                        x_min, y_min, x_max, y_max = img["coordinate"]
+                        poly_points = [
+                            (x_min, y_min),
+                            (x_max, y_min),
+                            (x_max, y_max),
+                            (x_min, y_max),
+                        ]
+                        table_contents_for_img["dt_polys"].append(poly_points)
+                        table_contents_for_img["rec_texts"].append(
+                            f'<div style="text-align: center;"><img src="{img_path}" alt="Image" /></div>'
+                        )
+                        if table_contents_for_img["rec_boxes"].size == 0:
+                            table_contents_for_img["rec_boxes"] = np.array(
+                                [img["coordinate"]]
+                            )
+                        else:
+                            table_contents_for_img["rec_boxes"] = np.vstack(
+                                (table_contents_for_img["rec_boxes"], img["coordinate"])
+                            )
+                        table_contents_for_img["rec_polys"].append(poly_points)
+                        table_contents_for_img["rec_scores"].append(img["score"])
+                    table_res_all = list(
+                        self.table_recognition_pipeline(
+                            doc_preprocessor_image,
+                            use_doc_orientation_classify=False,
+                            use_doc_unwarping=False,
+                            use_layout_detection=False,
+                            use_ocr_model=False,
+                            overall_ocr_res=table_contents_for_img,
+                            layout_det_res=layout_det_res,
+                            cell_sort_by_y_projection=True,
+                            use_wired_table_cells_trans_to_html=use_wired_table_cells_trans_to_html,
+                            use_wireless_table_cells_trans_to_html=use_wireless_table_cells_trans_to_html,
+                            use_table_orientation_classify=use_table_orientation_classify,
+                            use_ocr_results_with_table_cells=use_ocr_results_with_table_cells,
+                            use_e2e_wired_table_rec_model=use_e2e_wired_table_rec_model,
+                            use_e2e_wireless_table_rec_model=use_e2e_wireless_table_rec_model,
+                        ),
+                    )
+                    single_table_res_lists = [
+                        item["table_res_list"] for item in table_res_all
+                    ]
+                    table_res_lists.extend(single_table_res_lists)
+            else:
+                table_res_lists = [[] for _ in doc_preprocessor_images]
+            if model_settings["use_seal_recognition"]:
+                seal_res_all = list(
+                    self.seal_recognition_pipeline(
+                        doc_preprocessor_images,
+                        use_doc_orientation_classify=False,
+                        use_doc_unwarping=False,
+                        use_layout_detection=False,
+                        layout_det_res=layout_det_results,
+                        seal_det_limit_side_len=seal_det_limit_side_len,
+                        seal_det_limit_type=seal_det_limit_type,
+                        seal_det_thresh=seal_det_thresh,
+                        seal_det_box_thresh=seal_det_box_thresh,
+                        seal_det_unclip_ratio=seal_det_unclip_ratio,
+                        seal_rec_score_thresh=seal_rec_score_thresh,
+                    ),
+                )
+                seal_res_lists = [item["seal_res_list"] for item in seal_res_all]
+            else:
+                seal_res_lists = [[] for _ in doc_preprocessor_images]
+            for (
+                input_path,
+                page_index,
+                doc_preprocessor_image,
+                doc_preprocessor_res,
+                layout_det_res,
+                region_det_res,
+                overall_ocr_res,
+                table_res_list,
+                seal_res_list,
+                formula_res_list,
+                imgs_in_doc_for_img,
+            ) in zip(
+                batch_data.input_paths,
+                batch_data.page_indexes,
+                doc_preprocessor_images,
+                doc_preprocessor_results,
+                layout_det_results,
+                region_det_results,
+                overall_ocr_results,
+                table_res_lists,
+                seal_res_lists,
+                formula_res_lists,
+                imgs_in_doc,
+            ):
+                chart_res_list = []
+                if model_settings["use_chart_recognition"]:
+                    chart_imgs_list = []
+                    for bbox in layout_det_res["boxes"]:
+                        if bbox["label"] == "chart":
+                            x_min, y_min, x_max, y_max = bbox["coordinate"]
+                            chart_img = doc_preprocessor_image[
+                                int(y_min) : int(y_max), int(x_min) : int(x_max), :
+                            ]
+                            chart_imgs_list.append({"image": chart_img})
+                    for chart_res_batch in self.chart_recognition_model(
+                        input=chart_imgs_list
+                    ):
+                        chart_res_list.append(chart_res_batch["result"])
+                parsing_res_list = self.get_layout_parsing_res(
+                    doc_preprocessor_image,
+                    region_det_res=region_det_res,
+                    layout_det_res=layout_det_res,
+                    overall_ocr_res=overall_ocr_res,
+                    table_res_list=table_res_list,
+                    seal_res_list=seal_res_list,
+                    chart_res_list=chart_res_list,
+                    formula_res_list=formula_res_list,
+                    text_rec_score_thresh=text_rec_score_thresh,
+                )
+                for formula_res in formula_res_list:
+                    x_min, y_min, x_max, y_max = list(map(int, formula_res["dt_polys"]))
+                    doc_preprocessor_image[y_min:y_max, x_min:x_max, :] = formula_res[
+                        "input_img"
+                    ]
+                single_img_res = {
+                    "input_path": input_path,
+                    "page_index": page_index,
+                    "doc_preprocessor_res": doc_preprocessor_res,
+                    "layout_det_res": layout_det_res,
+                    "region_det_res": region_det_res,
+                    "overall_ocr_res": overall_ocr_res,
+                    "table_res_list": table_res_list,
+                    "seal_res_list": seal_res_list,
+                    "chart_res_list": chart_res_list,
+                    "formula_res_list": formula_res_list,
+                    "parsing_res_list": parsing_res_list,
+                    "imgs_in_doc": imgs_in_doc_for_img,
+                    "model_settings": model_settings,
+                }
+                yield LayoutParsingResultV2(single_img_res)
+    def concatenate_markdown_pages(self, markdown_list: list) -> tuple:
+        """
+        Concatenate Markdown content from multiple pages into a single document.
+        Args:
+            markdown_list (list): A list containing Markdown data for each page.
+        Returns:
+            tuple: A tuple containing the processed Markdown text.
+        """
+        markdown_texts = ""
+        previous_page_last_element_paragraph_end_flag = True
+        for res in markdown_list:
+            # Get the paragraph flags for the current page
+            page_first_element_paragraph_start_flag: bool = res[
+                "page_continuation_flags"
+            ][0]
+            page_last_element_paragraph_end_flag: bool = res["page_continuation_flags"][
+                1
+            ]
+            # Determine whether to add a space or a newline
+            if (
+                not page_first_element_paragraph_start_flag
+                and not previous_page_last_element_paragraph_end_flag
+            ):
+                last_char_of_markdown = markdown_texts[-1] if markdown_texts else ""
+                first_char_of_handler = (
+                    res["markdown_texts"][0] if res["markdown_texts"] else ""
+                )
+                # Check if the last character and the first character are Chinese characters
+                last_is_chinese_char = (
+                    re.match(r"[\u4e00-\u9fff]", last_char_of_markdown)
+                    if last_char_of_markdown
+                    else False
+                )
+                first_is_chinese_char = (
+                    re.match(r"[\u4e00-\u9fff]", first_char_of_handler)
+                    if first_char_of_handler
+                    else False
+                )
+                if not (last_is_chinese_char or first_is_chinese_char):
+                    markdown_texts += " " + res["markdown_texts"]
+                else:
+                    markdown_texts += res["markdown_texts"]
+            else:
+                markdown_texts += "\n\n" + res["markdown_texts"]
+            previous_page_last_element_paragraph_end_flag = (
+                page_last_element_paragraph_end_flag
+            )
+        return markdown_texts
+@pipeline_requires_extra("ocr")
+class LayoutParsingPipelineV2(AutoParallelImageSimpleInferencePipeline):
+    """Thin wrapper that exposes ``_LayoutParsingPipelineV2`` through ``AutoParallelImageSimpleInferencePipeline``.
+    NOTE(review): the decorator presumably checks that the "ocr" optional dependencies are installed - confirm against ``pipeline_requires_extra``.
+    """
+    # Names associated with this pipeline (presumably used for pipeline lookup; confirm against the base class).
+    entities = ["PP-StructureV3"]
+    @property
+    def _pipeline_cls(self):
+        """Return the concrete pipeline class, ``_LayoutParsingPipelineV2``."""
+        return _LayoutParsingPipelineV2
+    def _get_batch_size(self, config):
+        """Return ``config["batch_size"]``, or 1 when the key is absent."""
+        return config.get("batch_size", 1)

paddlex 2.0.0rc4__py3-none-any.whl → 3.0.0__py3-none-any.whl

paddlex 2.0.0rc4py3-none-any.whl → 3.0.0py3-none-any.whl