PyPI - paddlex - Versions diffs - 2.1.0__py3-none-any.whl → 3.0.0rc0__py3-none-any.whl - Mend

paddlex 2.1.0 (py3-none-any.whl) → 3.0.0rc0 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (1708)

paddlex/.version +1 -0
paddlex/__init__.py +52 -19
paddlex/__main__.py +39 -0
paddlex/configs/modules/3d_bev_detection/BEVFusion.yaml +38 -0
paddlex/configs/modules/doc_text_orientation/PP-LCNet_x1_0_doc_ori.yaml +41 -0
paddlex/configs/modules/face_detection/BlazeFace-FPN-SSH.yaml +40 -0
paddlex/configs/modules/face_detection/BlazeFace.yaml +40 -0
paddlex/configs/modules/face_detection/PP-YOLOE_plus-S_face.yaml +40 -0
paddlex/configs/modules/face_detection/PicoDet_LCNet_x2_5_face.yaml +40 -0
paddlex/configs/modules/face_feature/MobileFaceNet.yaml +41 -0
paddlex/configs/modules/face_feature/ResNet50_face.yaml +41 -0
paddlex/configs/modules/formula_recognition/LaTeX_OCR_rec.yaml +40 -0
paddlex/configs/modules/formula_recognition/PP-FormulaNet-L.yaml +40 -0
paddlex/configs/modules/formula_recognition/PP-FormulaNet-S.yaml +40 -0
paddlex/configs/modules/formula_recognition/UniMERNet.yaml +40 -0
paddlex/configs/modules/human_detection/PP-YOLOE-L_human.yaml +42 -0
paddlex/configs/modules/human_detection/PP-YOLOE-S_human.yaml +42 -0
paddlex/configs/modules/image_anomaly_detection/STFPM.yaml +41 -0
paddlex/configs/modules/image_classification/CLIP_vit_base_patch16_224.yaml +41 -0
paddlex/configs/modules/image_classification/CLIP_vit_large_patch14_224.yaml +41 -0
paddlex/configs/modules/image_classification/ConvNeXt_base_224.yaml +41 -0
paddlex/configs/modules/image_classification/ConvNeXt_base_384.yaml +41 -0
paddlex/configs/modules/image_classification/ConvNeXt_large_224.yaml +41 -0
paddlex/configs/modules/image_classification/ConvNeXt_large_384.yaml +41 -0
paddlex/configs/modules/image_classification/ConvNeXt_small.yaml +41 -0
paddlex/configs/modules/image_classification/ConvNeXt_tiny.yaml +41 -0
paddlex/configs/modules/image_classification/FasterNet-L.yaml +40 -0
paddlex/configs/modules/image_classification/FasterNet-M.yaml +40 -0
paddlex/configs/modules/image_classification/FasterNet-S.yaml +40 -0
paddlex/configs/modules/image_classification/FasterNet-T0.yaml +40 -0
paddlex/configs/modules/image_classification/FasterNet-T1.yaml +40 -0
paddlex/configs/modules/image_classification/FasterNet-T2.yaml +40 -0
paddlex/configs/modules/image_classification/MobileNetV1_x0_25.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV1_x0_5.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV1_x0_75.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV1_x1_0.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV2_x0_25.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV2_x0_5.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV2_x1_0.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV2_x1_5.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV2_x2_0.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_large_x0_35.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_large_x0_5.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_large_x0_75.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_large_x1_0.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_large_x1_25.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_small_x0_35.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_small_x0_5.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_small_x0_75.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_small_x1_0.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_small_x1_25.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV4_conv_large.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV4_conv_medium.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV4_conv_small.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV4_hybrid_large.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV4_hybrid_medium.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNetV2-B0.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNetV2-B1.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNetV2-B2.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNetV2-B3.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNetV2-B4.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNetV2-B5.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNetV2-B6.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNet_base.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNet_small.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNet_tiny.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNetV2_base.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNetV2_large.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNetV2_small.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x0_25.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x0_35.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x0_5.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x0_75.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x1_0.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x1_5.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x2_0.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x2_5.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet101.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet101_vd.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet152.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet152_vd.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet18.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet18_vd.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet200_vd.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet34.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet34_vd.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet50.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet50_vd.yaml +41 -0
paddlex/configs/modules/image_classification/StarNet-S1.yaml +41 -0
paddlex/configs/modules/image_classification/StarNet-S2.yaml +41 -0
paddlex/configs/modules/image_classification/StarNet-S3.yaml +41 -0
paddlex/configs/modules/image_classification/StarNet-S4.yaml +41 -0
paddlex/configs/modules/image_classification/SwinTransformer_base_patch4_window12_384.yaml +41 -0
paddlex/configs/modules/image_classification/SwinTransformer_base_patch4_window7_224.yaml +41 -0
paddlex/configs/modules/image_classification/SwinTransformer_large_patch4_window12_384.yaml +41 -0
paddlex/configs/modules/image_classification/SwinTransformer_large_patch4_window7_224.yaml +41 -0
paddlex/configs/modules/image_classification/SwinTransformer_small_patch4_window7_224.yaml +41 -0
paddlex/configs/modules/image_classification/SwinTransformer_tiny_patch4_window7_224.yaml +41 -0
paddlex/configs/modules/image_feature/PP-ShiTuV2_rec.yaml +42 -0
paddlex/configs/modules/image_feature/PP-ShiTuV2_rec_CLIP_vit_base.yaml +42 -0
paddlex/configs/modules/image_feature/PP-ShiTuV2_rec_CLIP_vit_large.yaml +41 -0
paddlex/configs/modules/image_multilabel_classification/CLIP_vit_base_patch16_448_ML.yaml +41 -0
paddlex/configs/modules/image_multilabel_classification/PP-HGNetV2-B0_ML.yaml +41 -0
paddlex/configs/modules/image_multilabel_classification/PP-HGNetV2-B4_ML.yaml +41 -0
paddlex/configs/modules/image_multilabel_classification/PP-HGNetV2-B6_ML.yaml +41 -0
paddlex/configs/modules/image_multilabel_classification/PP-LCNet_x1_0_ML.yaml +41 -0
paddlex/configs/modules/image_multilabel_classification/ResNet50_ML.yaml +41 -0
paddlex/configs/modules/image_unwarping/UVDoc.yaml +12 -0
paddlex/configs/modules/instance_segmentation/Cascade-MaskRCNN-ResNet50-FPN.yaml +40 -0
paddlex/configs/modules/instance_segmentation/Cascade-MaskRCNN-ResNet50-vd-SSLDv2-FPN.yaml +40 -0
paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-H.yaml +40 -0
paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-L.yaml +40 -0
paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-M.yaml +40 -0
paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-S.yaml +40 -0
paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-X.yaml +40 -0
paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNeXt101-vd-FPN.yaml +39 -0
paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet101-FPN.yaml +40 -0
paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet101-vd-FPN.yaml +40 -0
paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet50-FPN.yaml +40 -0
paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet50-vd-FPN.yaml +40 -0
paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet50.yaml +40 -0
paddlex/configs/modules/instance_segmentation/PP-YOLOE_seg-S.yaml +40 -0
paddlex/configs/modules/instance_segmentation/SOLOv2.yaml +40 -0
paddlex/configs/modules/keypoint_detection/PP-TinyPose_128x96.yaml +40 -0
paddlex/configs/modules/keypoint_detection/PP-TinyPose_256x192.yaml +40 -0
paddlex/configs/modules/layout_detection/PP-DocLayout-L.yaml +40 -0
paddlex/configs/modules/layout_detection/PP-DocLayout-M.yaml +40 -0
paddlex/configs/modules/layout_detection/PP-DocLayout-S.yaml +40 -0
paddlex/configs/modules/layout_detection/PicoDet-L_layout_17cls.yaml +40 -0
paddlex/configs/modules/layout_detection/PicoDet-L_layout_3cls.yaml +40 -0
paddlex/configs/modules/layout_detection/PicoDet-S_layout_17cls.yaml +40 -0
paddlex/configs/modules/layout_detection/PicoDet-S_layout_3cls.yaml +40 -0
paddlex/configs/modules/layout_detection/PicoDet_layout_1x.yaml +40 -0
paddlex/configs/modules/layout_detection/PicoDet_layout_1x_table.yaml +40 -0
paddlex/configs/modules/layout_detection/RT-DETR-H_layout_17cls.yaml +40 -0
paddlex/configs/modules/layout_detection/RT-DETR-H_layout_3cls.yaml +40 -0
paddlex/configs/modules/mainbody_detection/PP-ShiTuV2_det.yaml +41 -0
paddlex/configs/modules/multilingual_speech_recognition/whisper_base.yaml +12 -0
paddlex/configs/modules/multilingual_speech_recognition/whisper_large.yaml +12 -0
paddlex/configs/modules/multilingual_speech_recognition/whisper_medium.yaml +12 -0
paddlex/configs/modules/multilingual_speech_recognition/whisper_small.yaml +12 -0
paddlex/configs/modules/multilingual_speech_recognition/whisper_tiny.yaml +12 -0
paddlex/configs/modules/object_detection/Cascade-FasterRCNN-ResNet50-FPN.yaml +41 -0
paddlex/configs/modules/object_detection/Cascade-FasterRCNN-ResNet50-vd-SSLDv2-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/CenterNet-DLA-34.yaml +41 -0
paddlex/configs/modules/object_detection/CenterNet-ResNet50.yaml +41 -0
paddlex/configs/modules/object_detection/Co-DINO-R50.yaml +40 -0
paddlex/configs/modules/object_detection/Co-DINO-Swin-L.yaml +40 -0
paddlex/configs/modules/object_detection/Co-Deformable-DETR-R50.yaml +40 -0
paddlex/configs/modules/object_detection/Co-Deformable-DETR-Swin-T.yaml +40 -0
paddlex/configs/modules/object_detection/DETR-R50.yaml +42 -0
paddlex/configs/modules/object_detection/FCOS-ResNet50.yaml +41 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNeXt101-vd-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNet101-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNet101.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNet34-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNet50-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNet50-vd-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNet50-vd-SSLDv2-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNet50.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-Swin-Tiny-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/PP-YOLOE_plus-L.yaml +40 -0
paddlex/configs/modules/object_detection/PP-YOLOE_plus-M.yaml +40 -0
paddlex/configs/modules/object_detection/PP-YOLOE_plus-S.yaml +40 -0
paddlex/configs/modules/object_detection/PP-YOLOE_plus-X.yaml +40 -0
paddlex/configs/modules/object_detection/PicoDet-L.yaml +40 -0
paddlex/configs/modules/object_detection/PicoDet-M.yaml +42 -0
paddlex/configs/modules/object_detection/PicoDet-S.yaml +40 -0
paddlex/configs/modules/object_detection/PicoDet-XS.yaml +42 -0
paddlex/configs/modules/object_detection/RT-DETR-H.yaml +40 -0
paddlex/configs/modules/object_detection/RT-DETR-L.yaml +40 -0
paddlex/configs/modules/object_detection/RT-DETR-R18.yaml +40 -0
paddlex/configs/modules/object_detection/RT-DETR-R50.yaml +40 -0
paddlex/configs/modules/object_detection/RT-DETR-X.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOX-L.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOX-M.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOX-N.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOX-S.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOX-T.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOX-X.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOv3-DarkNet53.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOv3-MobileNetV3.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOv3-ResNet50_vd_DCN.yaml +40 -0
paddlex/configs/modules/open_vocabulary_detection/GroundingDINO-T.yaml +13 -0
paddlex/configs/modules/open_vocabulary_segmentation/SAM-H_box.yaml +17 -0
paddlex/configs/modules/open_vocabulary_segmentation/SAM-H_point.yaml +15 -0
paddlex/configs/modules/pedestrian_attribute_recognition/PP-LCNet_x1_0_pedestrian_attribute.yaml +41 -0
paddlex/configs/modules/rotated_object_detection/PP-YOLOE-R-L.yaml +40 -0
paddlex/configs/modules/seal_text_detection/PP-OCRv4_mobile_seal_det.yaml +40 -0
paddlex/configs/modules/seal_text_detection/PP-OCRv4_server_seal_det.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/Deeplabv3-R101.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/Deeplabv3-R50.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/Deeplabv3_Plus-R101.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/Deeplabv3_Plus-R50.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/MaskFormer_small.yaml +42 -0
paddlex/configs/modules/semantic_segmentation/MaskFormer_tiny.yaml +42 -0
paddlex/configs/modules/semantic_segmentation/OCRNet_HRNet-W18.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/OCRNet_HRNet-W48.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/PP-LiteSeg-B.yaml +41 -0
paddlex/configs/modules/semantic_segmentation/PP-LiteSeg-T.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SeaFormer_base.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SeaFormer_large.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SeaFormer_small.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SeaFormer_tiny.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SegFormer-B0.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SegFormer-B1.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SegFormer-B2.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SegFormer-B3.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SegFormer-B4.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SegFormer-B5.yaml +40 -0
paddlex/configs/modules/small_object_detection/PP-YOLOE_plus_SOD-L.yaml +42 -0
paddlex/configs/modules/small_object_detection/PP-YOLOE_plus_SOD-S.yaml +42 -0
paddlex/configs/modules/small_object_detection/PP-YOLOE_plus_SOD-largesize-L.yaml +42 -0
paddlex/configs/modules/table_cells_detection/RT-DETR-L_wired_table_cell_det.yaml +40 -0
paddlex/configs/modules/table_cells_detection/RT-DETR-L_wireless_table_cell_det.yaml +40 -0
paddlex/configs/modules/table_classification/PP-LCNet_x1_0_table_cls.yaml +41 -0
paddlex/configs/modules/table_structure_recognition/SLANeXt_wired.yaml +39 -0
paddlex/configs/modules/table_structure_recognition/SLANeXt_wireless.yaml +39 -0
paddlex/configs/modules/table_structure_recognition/SLANet.yaml +39 -0
paddlex/configs/modules/table_structure_recognition/SLANet_plus.yaml +39 -0
paddlex/configs/modules/text_detection/PP-OCRv3_mobile_det.yaml +40 -0
paddlex/configs/modules/text_detection/PP-OCRv3_server_det.yaml +40 -0
paddlex/configs/modules/text_detection/PP-OCRv4_mobile_det.yaml +40 -0
paddlex/configs/modules/text_detection/PP-OCRv4_server_det.yaml +40 -0
paddlex/configs/modules/text_recognition/PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/PP-OCRv4_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/PP-OCRv4_server_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/PP-OCRv4_server_rec_doc.yaml +39 -0
paddlex/configs/modules/text_recognition/arabic_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/ch_RepSVTR_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/ch_SVTRv2_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/chinese_cht_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/cyrillic_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/devanagari_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/en_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/en_PP-OCRv4_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/japan_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/ka_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/korean_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/latin_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/ta_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/te_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/textline_orientation/PP-LCNet_x0_25_textline_ori.yaml +41 -0
paddlex/configs/modules/ts_anomaly_detection/AutoEncoder_ad.yaml +37 -0
paddlex/configs/modules/ts_anomaly_detection/DLinear_ad.yaml +37 -0
paddlex/configs/modules/ts_anomaly_detection/Nonstationary_ad.yaml +37 -0
paddlex/configs/modules/ts_anomaly_detection/PatchTST_ad.yaml +37 -0
paddlex/configs/modules/ts_anomaly_detection/TimesNet_ad.yaml +37 -0
paddlex/configs/modules/ts_classification/TimesNet_cls.yaml +37 -0
paddlex/configs/modules/ts_forecast/DLinear.yaml +38 -0
paddlex/configs/modules/ts_forecast/NLinear.yaml +38 -0
paddlex/configs/modules/ts_forecast/Nonstationary.yaml +38 -0
paddlex/configs/modules/ts_forecast/PatchTST.yaml +38 -0
paddlex/configs/modules/ts_forecast/RLinear.yaml +38 -0
paddlex/configs/modules/ts_forecast/TiDE.yaml +38 -0
paddlex/configs/modules/ts_forecast/TimesNet.yaml +38 -0
paddlex/configs/modules/vehicle_attribute_recognition/PP-LCNet_x1_0_vehicle_attribute.yaml +41 -0
paddlex/configs/modules/vehicle_detection/PP-YOLOE-L_vehicle.yaml +41 -0
paddlex/configs/modules/vehicle_detection/PP-YOLOE-S_vehicle.yaml +42 -0
paddlex/configs/modules/video_classification/PP-TSM-R50_8frames_uniform.yaml +42 -0
paddlex/configs/modules/video_classification/PP-TSMv2-LCNetV2_16frames_uniform.yaml +42 -0
paddlex/configs/modules/video_classification/PP-TSMv2-LCNetV2_8frames_uniform.yaml +42 -0
paddlex/configs/modules/video_detection/YOWO.yaml +40 -0
paddlex/configs/pipelines/3d_bev_detection.yaml +9 -0
paddlex/configs/pipelines/OCR.yaml +44 -0
paddlex/configs/pipelines/PP-ChatOCRv3-doc.yaml +149 -0
paddlex/configs/pipelines/PP-ChatOCRv4-doc.yaml +184 -0
paddlex/configs/pipelines/PP-ShiTuV2.yaml +18 -0
paddlex/configs/pipelines/PP-StructureV3.yaml +226 -0
paddlex/configs/pipelines/anomaly_detection.yaml +8 -0
paddlex/configs/pipelines/doc_preprocessor.yaml +15 -0
paddlex/configs/pipelines/face_recognition.yaml +18 -0
paddlex/configs/pipelines/formula_recognition.yaml +39 -0
paddlex/configs/pipelines/human_keypoint_detection.yaml +17 -0
paddlex/configs/pipelines/image_classification.yaml +10 -0
paddlex/configs/pipelines/image_multilabel_classification.yaml +9 -0
paddlex/configs/pipelines/instance_segmentation.yaml +10 -0
paddlex/configs/pipelines/layout_parsing.yaml +101 -0
paddlex/configs/pipelines/multilingual_speech_recognition.yaml +9 -0
paddlex/configs/pipelines/object_detection.yaml +10 -0
paddlex/configs/pipelines/open_vocabulary_detection.yaml +12 -0
paddlex/configs/pipelines/open_vocabulary_segmentation.yaml +13 -0
paddlex/configs/pipelines/pedestrian_attribute_recognition.yaml +15 -0
paddlex/configs/pipelines/rotated_object_detection.yaml +10 -0
paddlex/configs/pipelines/seal_recognition.yaml +51 -0
paddlex/configs/pipelines/semantic_segmentation.yaml +10 -0
paddlex/configs/pipelines/small_object_detection.yaml +10 -0
paddlex/configs/pipelines/table_recognition.yaml +56 -0
paddlex/configs/pipelines/table_recognition_v2.yaml +76 -0
paddlex/configs/pipelines/ts_anomaly_detection.yaml +8 -0
paddlex/configs/pipelines/ts_classification.yaml +8 -0
paddlex/configs/pipelines/ts_forecast.yaml +8 -0
paddlex/configs/pipelines/vehicle_attribute_recognition.yaml +15 -0
paddlex/configs/pipelines/video_classification.yaml +9 -0
paddlex/configs/pipelines/video_detection.yaml +10 -0
paddlex/engine.py +54 -0
paddlex/hpip_links.html +19 -0
paddlex/inference/__init__.py +19 -0
paddlex/inference/common/__init__.py +13 -0
paddlex/inference/common/batch_sampler/__init__.py +20 -0
paddlex/inference/common/batch_sampler/audio_batch_sampler.py +84 -0
paddlex/inference/common/batch_sampler/base_batch_sampler.py +90 -0
paddlex/inference/common/batch_sampler/det_3d_batch_sampler.py +147 -0
paddlex/inference/common/batch_sampler/image_batch_sampler.py +136 -0
paddlex/inference/common/batch_sampler/ts_batch_sampler.py +110 -0
paddlex/inference/common/batch_sampler/video_batch_sampler.py +94 -0
paddlex/inference/common/reader/__init__.py +19 -0
paddlex/inference/common/reader/audio_reader.py +46 -0
paddlex/inference/common/reader/det_3d_reader.py +239 -0
paddlex/inference/common/reader/image_reader.py +69 -0
paddlex/inference/common/reader/ts_reader.py +45 -0
paddlex/inference/common/reader/video_reader.py +42 -0
paddlex/inference/common/result/__init__.py +29 -0
paddlex/inference/common/result/base_cv_result.py +31 -0
paddlex/inference/common/result/base_result.py +70 -0
paddlex/inference/common/result/base_ts_result.py +42 -0
paddlex/inference/common/result/base_video_result.py +36 -0
paddlex/inference/common/result/mixin.py +703 -0
paddlex/inference/models/3d_bev_detection/__init__.py +15 -0
paddlex/inference/models/3d_bev_detection/predictor.py +314 -0
paddlex/inference/models/3d_bev_detection/processors.py +978 -0
paddlex/inference/models/3d_bev_detection/result.py +65 -0
paddlex/inference/models/3d_bev_detection/visualizer_3d.py +131 -0
paddlex/inference/models/__init__.py +130 -0
paddlex/inference/models/anomaly_detection/__init__.py +15 -0
paddlex/inference/models/anomaly_detection/predictor.py +145 -0
paddlex/inference/models/anomaly_detection/processors.py +46 -0
paddlex/inference/models/anomaly_detection/result.py +70 -0
paddlex/inference/models/base/__init__.py +15 -0
paddlex/inference/models/base/predictor/__init__.py +16 -0
paddlex/inference/models/base/predictor/base_predictor.py +175 -0
paddlex/inference/models/base/predictor/basic_predictor.py +139 -0
paddlex/inference/models/common/__init__.py +35 -0
paddlex/inference/models/common/static_infer.py +329 -0
paddlex/inference/models/common/tokenizer/__init__.py +17 -0
paddlex/inference/models/common/tokenizer/bert_tokenizer.py +655 -0
paddlex/inference/models/common/tokenizer/gpt_tokenizer.py +451 -0
paddlex/inference/models/common/tokenizer/tokenizer_utils.py +2141 -0
paddlex/inference/models/common/tokenizer/tokenizer_utils_base.py +3504 -0
paddlex/inference/models/common/tokenizer/utils.py +66 -0
paddlex/inference/models/common/tokenizer/vocab.py +647 -0
paddlex/inference/models/common/ts/__init__.py +15 -0
paddlex/inference/models/common/ts/funcs.py +533 -0
paddlex/inference/models/common/ts/processors.py +313 -0
paddlex/inference/models/common/vision/__init__.py +23 -0
paddlex/inference/models/common/vision/funcs.py +93 -0
paddlex/inference/models/common/vision/processors.py +270 -0
paddlex/inference/models/face_feature/__init__.py +15 -0
paddlex/inference/models/face_feature/predictor.py +65 -0
paddlex/inference/models/formula_recognition/__init__.py +15 -0
paddlex/inference/models/formula_recognition/predictor.py +203 -0
paddlex/inference/models/formula_recognition/processors.py +986 -0
paddlex/inference/models/formula_recognition/result.py +403 -0
paddlex/inference/models/image_classification/__init__.py +15 -0
paddlex/inference/models/image_classification/predictor.py +182 -0
paddlex/inference/models/image_classification/processors.py +87 -0
paddlex/inference/models/image_classification/result.py +92 -0
paddlex/inference/models/image_feature/__init__.py +15 -0
paddlex/inference/models/image_feature/predictor.py +156 -0
paddlex/inference/models/image_feature/processors.py +29 -0
paddlex/inference/models/image_feature/result.py +33 -0
paddlex/inference/models/image_multilabel_classification/__init__.py +15 -0
paddlex/inference/models/image_multilabel_classification/predictor.py +94 -0
paddlex/inference/models/image_multilabel_classification/processors.py +85 -0
paddlex/inference/models/image_multilabel_classification/result.py +95 -0
paddlex/inference/models/image_unwarping/__init__.py +15 -0
paddlex/inference/models/image_unwarping/predictor.py +105 -0
paddlex/inference/models/image_unwarping/processors.py +88 -0
paddlex/inference/models/image_unwarping/result.py +45 -0
paddlex/inference/models/instance_segmentation/__init__.py +15 -0
paddlex/inference/models/instance_segmentation/predictor.py +210 -0
paddlex/inference/models/instance_segmentation/processors.py +105 -0
paddlex/inference/models/instance_segmentation/result.py +161 -0
paddlex/inference/models/keypoint_detection/__init__.py +15 -0
paddlex/inference/models/keypoint_detection/predictor.py +188 -0
paddlex/inference/models/keypoint_detection/processors.py +359 -0
paddlex/inference/models/keypoint_detection/result.py +192 -0
paddlex/inference/models/multilingual_speech_recognition/__init__.py +15 -0
paddlex/inference/models/multilingual_speech_recognition/predictor.py +141 -0
paddlex/inference/models/multilingual_speech_recognition/processors.py +1941 -0
paddlex/inference/models/multilingual_speech_recognition/result.py +21 -0
paddlex/inference/models/object_detection/__init__.py +15 -0
paddlex/inference/models/object_detection/predictor.py +348 -0
paddlex/inference/models/object_detection/processors.py +855 -0
paddlex/inference/models/object_detection/result.py +113 -0
paddlex/inference/models/object_detection/utils.py +68 -0
paddlex/inference/models/open_vocabulary_detection/__init__.py +15 -0
paddlex/inference/models/open_vocabulary_detection/predictor.py +155 -0
paddlex/inference/models/open_vocabulary_detection/processors/__init__.py +15 -0
paddlex/inference/models/open_vocabulary_detection/processors/groundingdino_processors.py +485 -0
paddlex/inference/models/open_vocabulary_segmentation/__init__.py +15 -0
paddlex/inference/models/open_vocabulary_segmentation/predictor.py +120 -0
paddlex/inference/models/open_vocabulary_segmentation/processors/__init__.py +15 -0
paddlex/inference/models/open_vocabulary_segmentation/processors/sam_processer.py +249 -0
paddlex/inference/models/open_vocabulary_segmentation/results/__init__.py +15 -0
paddlex/inference/models/open_vocabulary_segmentation/results/sam_result.py +147 -0
paddlex/inference/models/semantic_segmentation/__init__.py +15 -0
paddlex/inference/models/semantic_segmentation/predictor.py +167 -0
paddlex/inference/models/semantic_segmentation/processors.py +114 -0
paddlex/inference/models/semantic_segmentation/result.py +72 -0
paddlex/inference/models/table_structure_recognition/__init__.py +15 -0
paddlex/inference/models/table_structure_recognition/predictor.py +171 -0
paddlex/inference/models/table_structure_recognition/processors.py +235 -0
paddlex/inference/models/table_structure_recognition/result.py +70 -0
paddlex/inference/models/text_detection/__init__.py +15 -0
paddlex/inference/models/text_detection/predictor.py +191 -0
paddlex/inference/models/text_detection/processors.py +466 -0
paddlex/inference/models/text_detection/result.py +51 -0
paddlex/inference/models/text_recognition/__init__.py +15 -0
paddlex/inference/models/text_recognition/predictor.py +106 -0
paddlex/inference/models/text_recognition/processors.py +231 -0
paddlex/inference/models/text_recognition/result.py +75 -0
paddlex/inference/models/ts_anomaly_detection/__init__.py +15 -0
paddlex/inference/models/ts_anomaly_detection/predictor.py +146 -0
paddlex/inference/models/ts_anomaly_detection/processors.py +94 -0
paddlex/inference/models/ts_anomaly_detection/result.py +72 -0
paddlex/inference/models/ts_classification/__init__.py +15 -0
paddlex/inference/models/ts_classification/predictor.py +135 -0
paddlex/inference/models/ts_classification/processors.py +117 -0
paddlex/inference/models/ts_classification/result.py +78 -0
paddlex/inference/models/ts_forecasting/__init__.py +15 -0
paddlex/inference/models/ts_forecasting/predictor.py +159 -0
paddlex/inference/models/ts_forecasting/processors.py +149 -0
paddlex/inference/models/ts_forecasting/result.py +83 -0
paddlex/inference/models/video_classification/__init__.py +15 -0
paddlex/inference/models/video_classification/predictor.py +147 -0
paddlex/inference/models/video_classification/processors.py +409 -0
paddlex/inference/models/video_classification/result.py +92 -0
paddlex/inference/models/video_detection/__init__.py +15 -0
paddlex/inference/models/video_detection/predictor.py +136 -0
paddlex/inference/models/video_detection/processors.py +450 -0
paddlex/inference/models/video_detection/result.py +104 -0
paddlex/inference/pipelines/3d_bev_detection/__init__.py +15 -0
paddlex/inference/pipelines/3d_bev_detection/pipeline.py +67 -0
paddlex/inference/pipelines/__init__.py +228 -0
paddlex/inference/pipelines/anomaly_detection/__init__.py +15 -0
paddlex/inference/pipelines/anomaly_detection/pipeline.py +62 -0
paddlex/inference/pipelines/attribute_recognition/__init__.py +15 -0
paddlex/inference/pipelines/attribute_recognition/pipeline.py +105 -0
paddlex/inference/pipelines/attribute_recognition/result.py +100 -0
paddlex/inference/pipelines/base.py +132 -0
paddlex/inference/pipelines/components/__init__.py +23 -0
paddlex/inference/pipelines/components/chat_server/__init__.py +16 -0
paddlex/inference/pipelines/components/chat_server/base.py +39 -0
paddlex/inference/pipelines/components/chat_server/openai_bot_chat.py +236 -0
paddlex/inference/pipelines/components/common/__init__.py +18 -0
paddlex/inference/pipelines/components/common/base_operator.py +36 -0
paddlex/inference/pipelines/components/common/base_result.py +65 -0
paddlex/inference/pipelines/components/common/convert_points_and_boxes.py +46 -0
paddlex/inference/pipelines/components/common/crop_image_regions.py +550 -0
paddlex/inference/pipelines/components/common/seal_det_warp.py +941 -0
paddlex/inference/pipelines/components/common/sort_boxes.py +83 -0
paddlex/inference/pipelines/components/faisser.py +352 -0
paddlex/inference/pipelines/components/prompt_engineering/__init__.py +16 -0
paddlex/inference/pipelines/components/prompt_engineering/base.py +35 -0
paddlex/inference/pipelines/components/prompt_engineering/generate_ensemble_prompt.py +127 -0
paddlex/inference/pipelines/components/prompt_engineering/generate_kie_prompt.py +148 -0
paddlex/inference/pipelines/components/retriever/__init__.py +16 -0
paddlex/inference/pipelines/components/retriever/base.py +226 -0
paddlex/inference/pipelines/components/retriever/openai_bot_retriever.py +70 -0
paddlex/inference/pipelines/components/retriever/qianfan_bot_retriever.py +163 -0
paddlex/inference/pipelines/components/utils/__init__.py +13 -0
paddlex/inference/pipelines/components/utils/mixin.py +206 -0
paddlex/inference/pipelines/doc_preprocessor/__init__.py +15 -0
paddlex/inference/pipelines/doc_preprocessor/pipeline.py +190 -0
paddlex/inference/pipelines/doc_preprocessor/result.py +103 -0
paddlex/inference/pipelines/face_recognition/__init__.py +15 -0
paddlex/inference/pipelines/face_recognition/pipeline.py +61 -0
paddlex/inference/pipelines/face_recognition/result.py +43 -0
paddlex/inference/pipelines/formula_recognition/__init__.py +15 -0
paddlex/inference/pipelines/formula_recognition/pipeline.py +303 -0
paddlex/inference/pipelines/formula_recognition/result.py +291 -0
paddlex/inference/pipelines/image_classification/__init__.py +15 -0
paddlex/inference/pipelines/image_classification/pipeline.py +71 -0
paddlex/inference/pipelines/image_multilabel_classification/__init__.py +15 -0
paddlex/inference/pipelines/image_multilabel_classification/pipeline.py +78 -0
paddlex/inference/pipelines/instance_segmentation/__init__.py +15 -0
paddlex/inference/pipelines/instance_segmentation/pipeline.py +70 -0
paddlex/inference/pipelines/keypoint_detection/__init__.py +15 -0
paddlex/inference/pipelines/keypoint_detection/pipeline.py +137 -0
paddlex/inference/pipelines/layout_parsing/__init__.py +16 -0
paddlex/inference/pipelines/layout_parsing/pipeline.py +570 -0
paddlex/inference/pipelines/layout_parsing/pipeline_v2.py +739 -0
paddlex/inference/pipelines/layout_parsing/result.py +203 -0
paddlex/inference/pipelines/layout_parsing/result_v2.py +470 -0
paddlex/inference/pipelines/layout_parsing/utils.py +2385 -0
paddlex/inference/pipelines/multilingual_speech_recognition/__init__.py +15 -0
paddlex/inference/pipelines/multilingual_speech_recognition/pipeline.py +67 -0
paddlex/inference/pipelines/object_detection/__init__.py +15 -0
paddlex/inference/pipelines/object_detection/pipeline.py +95 -0
paddlex/inference/pipelines/ocr/__init__.py +15 -0
paddlex/inference/pipelines/ocr/pipeline.py +389 -0
paddlex/inference/pipelines/ocr/result.py +248 -0
paddlex/inference/pipelines/open_vocabulary_detection/__init__.py +15 -0
paddlex/inference/pipelines/open_vocabulary_detection/pipeline.py +75 -0
paddlex/inference/pipelines/open_vocabulary_segmentation/__init__.py +15 -0
paddlex/inference/pipelines/open_vocabulary_segmentation/pipeline.py +89 -0
paddlex/inference/pipelines/pp_chatocr/__init__.py +16 -0
paddlex/inference/pipelines/pp_chatocr/pipeline_base.py +102 -0
paddlex/inference/pipelines/pp_chatocr/pipeline_v3.py +773 -0
paddlex/inference/pipelines/pp_chatocr/pipeline_v4.py +977 -0
paddlex/inference/pipelines/pp_shitu_v2/__init__.py +15 -0
paddlex/inference/pipelines/pp_shitu_v2/pipeline.py +152 -0
paddlex/inference/pipelines/pp_shitu_v2/result.py +126 -0
paddlex/inference/pipelines/rotated_object_detection/__init__.py +15 -0
paddlex/inference/pipelines/rotated_object_detection/pipeline.py +74 -0
paddlex/inference/pipelines/seal_recognition/__init__.py +15 -0
paddlex/inference/pipelines/seal_recognition/pipeline.py +271 -0
paddlex/inference/pipelines/seal_recognition/result.py +87 -0
paddlex/inference/pipelines/semantic_segmentation/__init__.py +15 -0
paddlex/inference/pipelines/semantic_segmentation/pipeline.py +74 -0
paddlex/inference/pipelines/small_object_detection/__init__.py +15 -0
paddlex/inference/pipelines/small_object_detection/pipeline.py +74 -0
paddlex/inference/pipelines/table_recognition/__init__.py +16 -0
paddlex/inference/pipelines/table_recognition/pipeline.py +462 -0
paddlex/inference/pipelines/table_recognition/pipeline_v2.py +792 -0
paddlex/inference/pipelines/table_recognition/result.py +216 -0
paddlex/inference/pipelines/table_recognition/table_recognition_post_processing.py +362 -0
paddlex/inference/pipelines/table_recognition/table_recognition_post_processing_v2.py +470 -0
paddlex/inference/pipelines/table_recognition/utils.py +44 -0
paddlex/inference/pipelines/ts_anomaly_detection/__init__.py +15 -0
paddlex/inference/pipelines/ts_anomaly_detection/pipeline.py +62 -0
paddlex/inference/pipelines/ts_classification/__init__.py +15 -0
paddlex/inference/pipelines/ts_classification/pipeline.py +62 -0
paddlex/inference/pipelines/ts_forecasting/__init__.py +15 -0
paddlex/inference/pipelines/ts_forecasting/pipeline.py +62 -0
paddlex/inference/pipelines/video_classification/__init__.py +15 -0
paddlex/inference/pipelines/video_classification/pipeline.py +68 -0
paddlex/inference/pipelines/video_detection/__init__.py +15 -0
paddlex/inference/pipelines/video_detection/pipeline.py +73 -0
paddlex/inference/serving/__init__.py +13 -0
paddlex/inference/serving/basic_serving/__init__.py +18 -0
paddlex/inference/serving/basic_serving/_app.py +209 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/__init__.py +41 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/_common/__init__.py +13 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/_common/common.py +96 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/_common/image_recognition.py +36 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/_common/ocr.py +90 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/anomaly_detection.py +64 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/doc_preprocessor.py +97 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/face_recognition.py +223 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/formula_recognition.py +97 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/human_keypoint_detection.py +78 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/image_classification.py +66 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/image_multilabel_classification.py +70 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/instance_segmentation.py +81 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/layout_parsing.py +115 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/m_3d_bev_detection.py +76 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/multilingual_speech_recognition.py +89 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/object_detection.py +74 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/ocr.py +99 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/open_vocabulary_detection.py +78 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/open_vocabulary_segmentation.py +85 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/pedestrian_attribute_recognition.py +81 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/pp_chatocrv3_doc.py +191 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/pp_chatocrv4_doc.py +221 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/pp_shituv2.py +218 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/pp_structurev3.py +136 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/rotated_object_detection.py +78 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/seal_recognition.py +103 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/semantic_segmentation.py +64 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/small_object_detection.py +69 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/table_recognition.py +105 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/table_recognition_v2.py +107 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/ts_anomaly_detection.py +62 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/ts_classification.py +61 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/ts_forecast.py +62 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/vehicle_attribute_recognition.py +81 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/video_classification.py +73 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/video_detection.py +89 -0
paddlex/inference/serving/basic_serving/_server.py +35 -0
paddlex/inference/serving/infra/__init__.py +13 -0
paddlex/inference/serving/infra/config.py +36 -0
paddlex/inference/serving/infra/models.py +72 -0
paddlex/inference/serving/infra/storage.py +175 -0
paddlex/inference/serving/infra/utils.py +259 -0
paddlex/inference/serving/schemas/__init__.py +13 -0
paddlex/inference/serving/schemas/anomaly_detection.py +39 -0
paddlex/inference/serving/schemas/doc_preprocessor.py +54 -0
paddlex/inference/serving/schemas/face_recognition.py +124 -0
paddlex/inference/serving/schemas/formula_recognition.py +56 -0
paddlex/inference/serving/schemas/human_keypoint_detection.py +55 -0
paddlex/inference/serving/schemas/image_classification.py +45 -0
paddlex/inference/serving/schemas/image_multilabel_classification.py +47 -0
paddlex/inference/serving/schemas/instance_segmentation.py +53 -0
paddlex/inference/serving/schemas/layout_parsing.py +72 -0
paddlex/inference/serving/schemas/m_3d_bev_detection.py +48 -0
paddlex/inference/serving/schemas/multilingual_speech_recognition.py +57 -0
paddlex/inference/serving/schemas/object_detection.py +52 -0
paddlex/inference/serving/schemas/ocr.py +60 -0
paddlex/inference/serving/schemas/open_vocabulary_detection.py +52 -0
paddlex/inference/serving/schemas/open_vocabulary_segmentation.py +52 -0
paddlex/inference/serving/schemas/pedestrian_attribute_recognition.py +61 -0
paddlex/inference/serving/schemas/pp_chatocrv3_doc.py +134 -0
paddlex/inference/serving/schemas/pp_chatocrv4_doc.py +151 -0
paddlex/inference/serving/schemas/pp_shituv2.py +124 -0
paddlex/inference/serving/schemas/pp_structurev3.py +84 -0
paddlex/inference/serving/schemas/rotated_object_detection.py +52 -0
paddlex/inference/serving/schemas/seal_recognition.py +62 -0
paddlex/inference/serving/schemas/semantic_segmentation.py +45 -0
paddlex/inference/serving/schemas/shared/__init__.py +13 -0
paddlex/inference/serving/schemas/shared/classification.py +23 -0
paddlex/inference/serving/schemas/shared/image_segmentation.py +28 -0
paddlex/inference/serving/schemas/shared/object_detection.py +24 -0
paddlex/inference/serving/schemas/shared/ocr.py +25 -0
paddlex/inference/serving/schemas/small_object_detection.py +52 -0
paddlex/inference/serving/schemas/table_recognition.py +64 -0
paddlex/inference/serving/schemas/table_recognition_v2.py +66 -0
paddlex/inference/serving/schemas/ts_anomaly_detection.py +37 -0
paddlex/inference/serving/schemas/ts_classification.py +38 -0
paddlex/inference/serving/schemas/ts_forecast.py +37 -0
paddlex/inference/serving/schemas/vehicle_attribute_recognition.py +61 -0
paddlex/inference/serving/schemas/video_classification.py +44 -0
paddlex/inference/serving/schemas/video_detection.py +56 -0
paddlex/inference/utils/__init__.py +13 -0
paddlex/inference/utils/benchmark.py +226 -0
paddlex/inference/utils/color_map.py +123 -0
paddlex/inference/utils/get_pipeline_path.py +27 -0
paddlex/inference/utils/io/__init__.py +36 -0
paddlex/inference/utils/io/readers.py +500 -0
paddlex/inference/utils/io/style.py +374 -0
paddlex/inference/utils/io/tablepyxl.py +149 -0
paddlex/inference/utils/io/writers.py +459 -0
paddlex/inference/utils/new_ir_blacklist.py +28 -0
paddlex/inference/utils/official_models.py +352 -0
paddlex/inference/utils/pp_option.py +256 -0
paddlex/model.py +113 -0
paddlex/modules/3d_bev_detection/__init__.py +18 -0
paddlex/modules/3d_bev_detection/dataset_checker/__init__.py +95 -0
paddlex/modules/3d_bev_detection/dataset_checker/dataset_src/__init__.py +17 -0
paddlex/modules/3d_bev_detection/dataset_checker/dataset_src/analyse_dataset.py +106 -0
paddlex/modules/3d_bev_detection/dataset_checker/dataset_src/check_dataset.py +102 -0
paddlex/modules/3d_bev_detection/evaluator.py +46 -0
paddlex/modules/3d_bev_detection/exportor.py +22 -0
paddlex/modules/3d_bev_detection/model_list.py +18 -0
paddlex/modules/3d_bev_detection/trainer.py +70 -0
paddlex/modules/__init__.py +138 -0
paddlex/modules/anomaly_detection/__init__.py +18 -0
paddlex/modules/anomaly_detection/dataset_checker/__init__.py +95 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/analyse_dataset.py +79 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/check_dataset.py +87 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/convert_dataset.py +230 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/split_dataset.py +87 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/utils/visualizer.py +71 -0
paddlex/modules/anomaly_detection/evaluator.py +58 -0
paddlex/modules/anomaly_detection/exportor.py +22 -0
paddlex/modules/anomaly_detection/model_list.py +16 -0
paddlex/modules/anomaly_detection/trainer.py +71 -0
paddlex/modules/base/__init__.py +18 -0
paddlex/modules/base/build_model.py +34 -0
paddlex/modules/base/dataset_checker/__init__.py +16 -0
paddlex/modules/base/dataset_checker/dataset_checker.py +169 -0
paddlex/modules/base/dataset_checker/utils.py +110 -0
paddlex/modules/base/evaluator.py +170 -0
paddlex/modules/base/exportor.py +146 -0
paddlex/modules/base/trainer.py +134 -0
paddlex/modules/face_recognition/__init__.py +18 -0
paddlex/modules/face_recognition/dataset_checker/__init__.py +71 -0
paddlex/modules/face_recognition/dataset_checker/dataset_src/__init__.py +16 -0
paddlex/modules/face_recognition/dataset_checker/dataset_src/check_dataset.py +174 -0
paddlex/modules/face_recognition/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/face_recognition/dataset_checker/dataset_src/utils/visualizer.py +156 -0
paddlex/modules/face_recognition/evaluator.py +52 -0
paddlex/modules/face_recognition/exportor.py +22 -0
paddlex/modules/face_recognition/model_list.py +15 -0
paddlex/modules/face_recognition/trainer.py +75 -0
paddlex/modules/formula_recognition/__init__.py +18 -0
paddlex/modules/formula_recognition/dataset_checker/__init__.py +113 -0
paddlex/modules/formula_recognition/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/formula_recognition/dataset_checker/dataset_src/analyse_dataset.py +157 -0
paddlex/modules/formula_recognition/dataset_checker/dataset_src/check_dataset.py +80 -0
paddlex/modules/formula_recognition/dataset_checker/dataset_src/convert_dataset.py +94 -0
paddlex/modules/formula_recognition/dataset_checker/dataset_src/split_dataset.py +81 -0
paddlex/modules/formula_recognition/evaluator.py +77 -0
paddlex/modules/formula_recognition/exportor.py +22 -0
paddlex/modules/formula_recognition/model_list.py +20 -0
paddlex/modules/formula_recognition/trainer.py +121 -0
paddlex/modules/general_recognition/__init__.py +18 -0
paddlex/modules/general_recognition/dataset_checker/__init__.py +107 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/analyse_dataset.py +98 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/check_dataset.py +100 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/convert_dataset.py +99 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/split_dataset.py +82 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/utils/visualizer.py +150 -0
paddlex/modules/general_recognition/evaluator.py +31 -0
paddlex/modules/general_recognition/exportor.py +22 -0
paddlex/modules/general_recognition/model_list.py +19 -0
paddlex/modules/general_recognition/trainer.py +52 -0
paddlex/modules/image_classification/__init__.py +18 -0
paddlex/modules/image_classification/dataset_checker/__init__.py +104 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/analyse_dataset.py +93 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/check_dataset.py +131 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/convert_dataset.py +51 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/split_dataset.py +81 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/utils/visualizer.py +156 -0
paddlex/modules/image_classification/evaluator.py +43 -0
paddlex/modules/image_classification/exportor.py +22 -0
paddlex/modules/image_classification/model_list.py +99 -0
paddlex/modules/image_classification/trainer.py +82 -0
paddlex/modules/image_unwarping/__init__.py +13 -0
paddlex/modules/image_unwarping/model_list.py +17 -0
paddlex/modules/instance_segmentation/__init__.py +18 -0
paddlex/modules/instance_segmentation/dataset_checker/__init__.py +108 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/analyse_dataset.py +78 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/check_dataset.py +92 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/convert_dataset.py +241 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/split_dataset.py +119 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/utils/visualizer.py +221 -0
paddlex/modules/instance_segmentation/evaluator.py +32 -0
paddlex/modules/instance_segmentation/exportor.py +22 -0
paddlex/modules/instance_segmentation/model_list.py +33 -0
paddlex/modules/instance_segmentation/trainer.py +31 -0
paddlex/modules/keypoint_detection/__init__.py +18 -0
paddlex/modules/keypoint_detection/dataset_checker/__init__.py +56 -0
paddlex/modules/keypoint_detection/dataset_checker/dataset_src/__init__.py +15 -0
paddlex/modules/keypoint_detection/dataset_checker/dataset_src/check_dataset.py +86 -0
paddlex/modules/keypoint_detection/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/keypoint_detection/dataset_checker/dataset_src/utils/visualizer.py +119 -0
paddlex/modules/keypoint_detection/evaluator.py +41 -0
paddlex/modules/keypoint_detection/exportor.py +22 -0
paddlex/modules/keypoint_detection/model_list.py +16 -0
paddlex/modules/keypoint_detection/trainer.py +39 -0
paddlex/modules/multilabel_classification/__init__.py +18 -0
paddlex/modules/multilabel_classification/dataset_checker/__init__.py +106 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/analyse_dataset.py +95 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/check_dataset.py +131 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/convert_dataset.py +117 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/split_dataset.py +81 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/utils/visualizer.py +153 -0
paddlex/modules/multilabel_classification/evaluator.py +43 -0
paddlex/modules/multilabel_classification/exportor.py +22 -0
paddlex/modules/multilabel_classification/model_list.py +24 -0
paddlex/modules/multilabel_classification/trainer.py +85 -0
paddlex/modules/multilingual_speech_recognition/__init__.py +18 -0
paddlex/modules/multilingual_speech_recognition/dataset_checker.py +27 -0
paddlex/modules/multilingual_speech_recognition/evaluator.py +27 -0
paddlex/modules/multilingual_speech_recognition/exportor.py +27 -0
paddlex/modules/multilingual_speech_recognition/model_list.py +22 -0
paddlex/modules/multilingual_speech_recognition/trainer.py +40 -0
paddlex/modules/object_detection/__init__.py +18 -0
paddlex/modules/object_detection/dataset_checker/__init__.py +115 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/analyse_dataset.py +80 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/check_dataset.py +86 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/convert_dataset.py +433 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/split_dataset.py +119 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/utils/visualizer.py +192 -0
paddlex/modules/object_detection/evaluator.py +52 -0
paddlex/modules/object_detection/exportor.py +22 -0
paddlex/modules/object_detection/model_list.py +84 -0
paddlex/modules/object_detection/trainer.py +99 -0
paddlex/modules/open_vocabulary_detection/__init__.py +18 -0
paddlex/modules/open_vocabulary_detection/dataset_checker.py +29 -0
paddlex/modules/open_vocabulary_detection/evaluator.py +29 -0
paddlex/modules/open_vocabulary_detection/exportor.py +29 -0
paddlex/modules/open_vocabulary_detection/model_list.py +18 -0
paddlex/modules/open_vocabulary_detection/trainer.py +42 -0
paddlex/modules/open_vocabulary_segmentation/__init__.py +18 -0
paddlex/modules/open_vocabulary_segmentation/dataset_checker.py +29 -0
paddlex/modules/open_vocabulary_segmentation/evaluator.py +29 -0
paddlex/modules/open_vocabulary_segmentation/exportor.py +29 -0
paddlex/modules/open_vocabulary_segmentation/model_list.py +19 -0
paddlex/modules/open_vocabulary_segmentation/trainer.py +42 -0
paddlex/modules/semantic_segmentation/__init__.py +18 -0
paddlex/modules/semantic_segmentation/dataset_checker/__init__.py +110 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/analyse_dataset.py +73 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/check_dataset.py +80 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/convert_dataset.py +162 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/split_dataset.py +87 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/utils/visualizer.py +71 -0
paddlex/modules/semantic_segmentation/evaluator.py +58 -0
paddlex/modules/semantic_segmentation/exportor.py +31 -0
paddlex/modules/semantic_segmentation/model_list.py +37 -0
paddlex/modules/semantic_segmentation/trainer.py +73 -0
paddlex/modules/table_recognition/__init__.py +18 -0
paddlex/modules/table_recognition/dataset_checker/__init__.py +98 -0
paddlex/modules/table_recognition/dataset_checker/dataset_src/__init__.py +18 -0
paddlex/modules/table_recognition/dataset_checker/dataset_src/analyse_dataset.py +58 -0
paddlex/modules/table_recognition/dataset_checker/dataset_src/check_dataset.py +86 -0
paddlex/modules/table_recognition/dataset_checker/dataset_src/split_dataset.py +79 -0
paddlex/modules/table_recognition/evaluator.py +43 -0
paddlex/modules/table_recognition/exportor.py +22 -0
paddlex/modules/table_recognition/model_list.py +21 -0
paddlex/modules/table_recognition/trainer.py +70 -0
paddlex/modules/text_detection/__init__.py +18 -0
paddlex/modules/text_detection/dataset_checker/__init__.py +109 -0
paddlex/modules/text_detection/dataset_checker/dataset_src/__init__.py +18 -0
paddlex/modules/text_detection/dataset_checker/dataset_src/analyse_dataset.py +217 -0
paddlex/modules/text_detection/dataset_checker/dataset_src/check_dataset.py +106 -0
paddlex/modules/text_detection/dataset_checker/dataset_src/split_dataset.py +140 -0
paddlex/modules/text_detection/evaluator.py +41 -0
paddlex/modules/text_detection/exportor.py +22 -0
paddlex/modules/text_detection/model_list.py +24 -0
paddlex/modules/text_detection/trainer.py +68 -0
paddlex/modules/text_recognition/__init__.py +18 -0
paddlex/modules/text_recognition/dataset_checker/__init__.py +126 -0
paddlex/modules/text_recognition/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/text_recognition/dataset_checker/dataset_src/analyse_dataset.py +161 -0
paddlex/modules/text_recognition/dataset_checker/dataset_src/check_dataset.py +107 -0
paddlex/modules/text_recognition/dataset_checker/dataset_src/convert_dataset.py +94 -0
paddlex/modules/text_recognition/dataset_checker/dataset_src/split_dataset.py +81 -0
paddlex/modules/text_recognition/evaluator.py +64 -0
paddlex/modules/text_recognition/exportor.py +22 -0
paddlex/modules/text_recognition/model_list.py +34 -0
paddlex/modules/text_recognition/trainer.py +106 -0
paddlex/modules/ts_anomaly_detection/__init__.py +19 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/__init__.py +112 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/analyse_dataset.py +27 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/check_dataset.py +64 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/convert_dataset.py +78 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/split_dataset.py +63 -0
paddlex/modules/ts_anomaly_detection/evaluator.py +67 -0
paddlex/modules/ts_anomaly_detection/exportor.py +45 -0
paddlex/modules/ts_anomaly_detection/model_list.py +22 -0
paddlex/modules/ts_anomaly_detection/trainer.py +113 -0
paddlex/modules/ts_classification/__init__.py +19 -0
paddlex/modules/ts_classification/dataset_checker/__init__.py +112 -0
paddlex/modules/ts_classification/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/ts_classification/dataset_checker/dataset_src/analyse_dataset.py +74 -0
paddlex/modules/ts_classification/dataset_checker/dataset_src/check_dataset.py +64 -0
paddlex/modules/ts_classification/dataset_checker/dataset_src/convert_dataset.py +78 -0
paddlex/modules/ts_classification/dataset_checker/dataset_src/split_dataset.py +88 -0
paddlex/modules/ts_classification/evaluator.py +66 -0
paddlex/modules/ts_classification/exportor.py +45 -0
paddlex/modules/ts_classification/model_list.py +18 -0
paddlex/modules/ts_classification/trainer.py +108 -0
paddlex/modules/ts_forecast/__init__.py +19 -0
paddlex/modules/ts_forecast/dataset_checker/__init__.py +112 -0
paddlex/modules/ts_forecast/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/ts_forecast/dataset_checker/dataset_src/analyse_dataset.py +27 -0
paddlex/modules/ts_forecast/dataset_checker/dataset_src/check_dataset.py +64 -0
paddlex/modules/ts_forecast/dataset_checker/dataset_src/convert_dataset.py +77 -0
paddlex/modules/ts_forecast/dataset_checker/dataset_src/split_dataset.py +63 -0
paddlex/modules/ts_forecast/evaluator.py +66 -0
paddlex/modules/ts_forecast/exportor.py +45 -0
paddlex/modules/ts_forecast/model_list.py +24 -0
paddlex/modules/ts_forecast/trainer.py +108 -0
paddlex/modules/video_classification/__init__.py +18 -0
paddlex/modules/video_classification/dataset_checker/__init__.py +93 -0
paddlex/modules/video_classification/dataset_checker/dataset_src/__init__.py +18 -0
paddlex/modules/video_classification/dataset_checker/dataset_src/analyse_dataset.py +93 -0
paddlex/modules/video_classification/dataset_checker/dataset_src/check_dataset.py +121 -0
paddlex/modules/video_classification/dataset_checker/dataset_src/split_dataset.py +82 -0
paddlex/modules/video_classification/evaluator.py +44 -0
paddlex/modules/video_classification/exportor.py +22 -0
paddlex/modules/video_classification/model_list.py +19 -0
paddlex/modules/video_classification/trainer.py +88 -0
paddlex/modules/video_detection/__init__.py +18 -0
paddlex/modules/video_detection/dataset_checker/__init__.py +86 -0
paddlex/modules/video_detection/dataset_checker/dataset_src/__init__.py +17 -0
paddlex/modules/video_detection/dataset_checker/dataset_src/analyse_dataset.py +101 -0
paddlex/modules/video_detection/dataset_checker/dataset_src/check_dataset.py +134 -0
paddlex/modules/video_detection/evaluator.py +42 -0
paddlex/modules/video_detection/exportor.py +22 -0
paddlex/modules/video_detection/model_list.py +15 -0
paddlex/modules/video_detection/trainer.py +82 -0
paddlex/ops/__init__.py +149 -0
paddlex/ops/iou3d_nms/iou3d_cpu.cpp +264 -0
paddlex/ops/iou3d_nms/iou3d_cpu.h +27 -0
paddlex/ops/iou3d_nms/iou3d_nms.cpp +204 -0
paddlex/ops/iou3d_nms/iou3d_nms.h +33 -0
paddlex/ops/iou3d_nms/iou3d_nms_api.cpp +108 -0
paddlex/ops/iou3d_nms/iou3d_nms_kernel.cu +482 -0
paddlex/ops/setup.py +37 -0
paddlex/ops/voxel/voxelize_op.cc +191 -0
paddlex/ops/voxel/voxelize_op.cu +346 -0
paddlex/paddle2onnx_requirements.txt +1 -0
paddlex/paddlex_cli.py +464 -0
paddlex/repo_apis/Paddle3D_api/__init__.py +17 -0
paddlex/repo_apis/Paddle3D_api/bev_fusion/__init__.py +18 -0
paddlex/repo_apis/Paddle3D_api/bev_fusion/config.py +118 -0
paddlex/repo_apis/Paddle3D_api/bev_fusion/model.py +238 -0
paddlex/repo_apis/Paddle3D_api/bev_fusion/register.py +55 -0
paddlex/repo_apis/Paddle3D_api/bev_fusion/runner.py +104 -0
paddlex/repo_apis/Paddle3D_api/pp3d_config.py +144 -0
paddlex/repo_apis/PaddleClas_api/__init__.py +17 -0
paddlex/repo_apis/PaddleClas_api/cls/__init__.py +19 -0
paddlex/repo_apis/PaddleClas_api/cls/config.py +594 -0
paddlex/repo_apis/PaddleClas_api/cls/model.py +355 -0
paddlex/repo_apis/PaddleClas_api/cls/register.py +908 -0
paddlex/repo_apis/PaddleClas_api/cls/runner.py +219 -0
paddlex/repo_apis/PaddleClas_api/shitu_rec/__init__.py +18 -0
paddlex/repo_apis/PaddleClas_api/shitu_rec/config.py +141 -0
paddlex/repo_apis/PaddleClas_api/shitu_rec/model.py +23 -0
paddlex/repo_apis/PaddleClas_api/shitu_rec/register.py +68 -0
paddlex/repo_apis/PaddleClas_api/shitu_rec/runner.py +55 -0
paddlex/repo_apis/PaddleDetection_api/__init__.py +17 -0
paddlex/repo_apis/PaddleDetection_api/config_helper.py +280 -0
paddlex/repo_apis/PaddleDetection_api/instance_seg/__init__.py +18 -0
paddlex/repo_apis/PaddleDetection_api/instance_seg/config.py +458 -0
paddlex/repo_apis/PaddleDetection_api/instance_seg/model.py +403 -0
paddlex/repo_apis/PaddleDetection_api/instance_seg/register.py +263 -0
paddlex/repo_apis/PaddleDetection_api/instance_seg/runner.py +226 -0
paddlex/repo_apis/PaddleDetection_api/object_det/__init__.py +19 -0
paddlex/repo_apis/PaddleDetection_api/object_det/config.py +539 -0
paddlex/repo_apis/PaddleDetection_api/object_det/model.py +430 -0
paddlex/repo_apis/PaddleDetection_api/object_det/official_categories.py +220 -0
paddlex/repo_apis/PaddleDetection_api/object_det/register.py +1106 -0
paddlex/repo_apis/PaddleDetection_api/object_det/runner.py +226 -0
paddlex/repo_apis/PaddleNLP_api/__init__.py +13 -0
paddlex/repo_apis/PaddleOCR_api/__init__.py +21 -0
paddlex/repo_apis/PaddleOCR_api/config_utils.py +53 -0
paddlex/repo_apis/PaddleOCR_api/formula_rec/__init__.py +16 -0
paddlex/repo_apis/PaddleOCR_api/formula_rec/config.py +570 -0
paddlex/repo_apis/PaddleOCR_api/formula_rec/model.py +402 -0
paddlex/repo_apis/PaddleOCR_api/formula_rec/register.py +73 -0
paddlex/repo_apis/PaddleOCR_api/formula_rec/runner.py +240 -0
paddlex/repo_apis/PaddleOCR_api/table_rec/__init__.py +16 -0
paddlex/repo_apis/PaddleOCR_api/table_rec/config.py +64 -0
paddlex/repo_apis/PaddleOCR_api/table_rec/model.py +126 -0
paddlex/repo_apis/PaddleOCR_api/table_rec/register.py +71 -0
paddlex/repo_apis/PaddleOCR_api/table_rec/runner.py +51 -0
paddlex/repo_apis/PaddleOCR_api/text_det/__init__.py +16 -0
paddlex/repo_apis/PaddleOCR_api/text_det/config.py +62 -0
paddlex/repo_apis/PaddleOCR_api/text_det/model.py +72 -0
paddlex/repo_apis/PaddleOCR_api/text_det/register.py +90 -0
paddlex/repo_apis/PaddleOCR_api/text_det/runner.py +53 -0
paddlex/repo_apis/PaddleOCR_api/text_rec/__init__.py +16 -0
paddlex/repo_apis/PaddleOCR_api/text_rec/config.py +563 -0
paddlex/repo_apis/PaddleOCR_api/text_rec/model.py +402 -0
paddlex/repo_apis/PaddleOCR_api/text_rec/register.py +199 -0
paddlex/repo_apis/PaddleOCR_api/text_rec/runner.py +240 -0
paddlex/repo_apis/PaddleSeg_api/__init__.py +16 -0
paddlex/repo_apis/PaddleSeg_api/base_seg_config.py +134 -0
paddlex/repo_apis/PaddleSeg_api/seg/__init__.py +16 -0
paddlex/repo_apis/PaddleSeg_api/seg/config.py +186 -0
paddlex/repo_apis/PaddleSeg_api/seg/model.py +491 -0
paddlex/repo_apis/PaddleSeg_api/seg/register.py +273 -0
paddlex/repo_apis/PaddleSeg_api/seg/runner.py +262 -0
paddlex/repo_apis/PaddleTS_api/__init__.py +19 -0
paddlex/repo_apis/PaddleTS_api/ts_ad/__init__.py +16 -0
paddlex/repo_apis/PaddleTS_api/ts_ad/config.py +89 -0
paddlex/repo_apis/PaddleTS_api/ts_ad/register.py +146 -0
paddlex/repo_apis/PaddleTS_api/ts_ad/runner.py +158 -0
paddlex/repo_apis/PaddleTS_api/ts_base/__init__.py +13 -0
paddlex/repo_apis/PaddleTS_api/ts_base/config.py +246 -0
paddlex/repo_apis/PaddleTS_api/ts_base/model.py +276 -0
paddlex/repo_apis/PaddleTS_api/ts_base/runner.py +158 -0
paddlex/repo_apis/PaddleTS_api/ts_cls/__init__.py +16 -0
paddlex/repo_apis/PaddleTS_api/ts_cls/config.py +73 -0
paddlex/repo_apis/PaddleTS_api/ts_cls/register.py +59 -0
paddlex/repo_apis/PaddleTS_api/ts_cls/runner.py +158 -0
paddlex/repo_apis/PaddleTS_api/ts_fc/__init__.py +16 -0
paddlex/repo_apis/PaddleTS_api/ts_fc/config.py +137 -0
paddlex/repo_apis/PaddleTS_api/ts_fc/register.py +186 -0
paddlex/repo_apis/PaddleVideo_api/__init__.py +17 -0
paddlex/repo_apis/PaddleVideo_api/config_utils.py +51 -0
paddlex/repo_apis/PaddleVideo_api/video_cls/__init__.py +19 -0
paddlex/repo_apis/PaddleVideo_api/video_cls/config.py +547 -0
paddlex/repo_apis/PaddleVideo_api/video_cls/model.py +346 -0
paddlex/repo_apis/PaddleVideo_api/video_cls/register.py +71 -0
paddlex/repo_apis/PaddleVideo_api/video_cls/runner.py +205 -0
paddlex/repo_apis/PaddleVideo_api/video_det/__init__.py +19 -0
paddlex/repo_apis/PaddleVideo_api/video_det/config.py +548 -0
paddlex/repo_apis/PaddleVideo_api/video_det/model.py +298 -0
paddlex/repo_apis/PaddleVideo_api/video_det/register.py +45 -0
paddlex/repo_apis/PaddleVideo_api/video_det/runner.py +200 -0
paddlex/repo_apis/__init__.py +13 -0
paddlex/repo_apis/base/__init__.py +23 -0
paddlex/repo_apis/base/config.py +238 -0
paddlex/repo_apis/base/model.py +571 -0
paddlex/repo_apis/base/register.py +135 -0
paddlex/repo_apis/base/runner.py +391 -0
paddlex/repo_apis/base/utils/__init__.py +13 -0
paddlex/repo_apis/base/utils/arg.py +64 -0
paddlex/repo_apis/base/utils/subprocess.py +107 -0
paddlex/repo_manager/__init__.py +24 -0
paddlex/repo_manager/core.py +271 -0
paddlex/repo_manager/meta.py +170 -0
paddlex/repo_manager/repo.py +415 -0
paddlex/repo_manager/requirements.txt +21 -0
paddlex/repo_manager/utils.py +359 -0
paddlex/serving_requirements.txt +9 -0
paddlex/utils/__init__.py +1 -12
paddlex/utils/cache.py +148 -0
paddlex/utils/config.py +215 -0
paddlex/utils/custom_device_whitelist.py +457 -0
paddlex/utils/device.py +151 -0
paddlex/utils/download.py +168 -182
paddlex/utils/env.py +11 -50
paddlex/utils/errors/__init__.py +17 -0
paddlex/utils/errors/dataset_checker.py +78 -0
paddlex/utils/errors/others.py +152 -0
paddlex/utils/file_interface.py +212 -0
paddlex/utils/flags.py +65 -0
paddlex/utils/fonts/__init__.py +67 -0
paddlex/utils/func_register.py +41 -0
paddlex/utils/interactive_get_pipeline.py +55 -0
paddlex/utils/lazy_loader.py +68 -0
paddlex/utils/logging.py +131 -33
paddlex/utils/misc.py +201 -0
paddlex/utils/pipeline_arguments.py +711 -0
paddlex/utils/result_saver.py +59 -0
paddlex/utils/subclass_register.py +101 -0
paddlex/version.py +54 -0
paddlex-3.0.0rc0.dist-info/LICENSE +169 -0
paddlex-3.0.0rc0.dist-info/METADATA +1035 -0
paddlex-3.0.0rc0.dist-info/RECORD +1015 -0
paddlex-3.0.0rc0.dist-info/WHEEL +5 -0
paddlex-3.0.0rc0.dist-info/entry_points.txt +2 -0
paddlex-3.0.0rc0.dist-info/top_level.txt +1 -0
PaddleClas/__init__.py +0 -16
PaddleClas/deploy/__init__.py +0 -1
PaddleClas/deploy/paddleserving/__init__.py +0 -0
PaddleClas/deploy/paddleserving/classification_web_service.py +0 -74
PaddleClas/deploy/paddleserving/cpu_utilization.py +0 -4
PaddleClas/deploy/paddleserving/pipeline_http_client.py +0 -20
PaddleClas/deploy/paddleserving/pipeline_rpc_client.py +0 -33
PaddleClas/deploy/paddleserving/recognition/__init__.py +0 -0
PaddleClas/deploy/paddleserving/recognition/pipeline_http_client.py +0 -21
PaddleClas/deploy/paddleserving/recognition/pipeline_rpc_client.py +0 -34
PaddleClas/deploy/paddleserving/recognition/recognition_web_service.py +0 -209
PaddleClas/deploy/python/__init__.py +0 -0
PaddleClas/deploy/python/build_gallery.py +0 -214
PaddleClas/deploy/python/det_preprocess.py +0 -205
PaddleClas/deploy/python/postprocess.py +0 -161
PaddleClas/deploy/python/predict_cls.py +0 -142
PaddleClas/deploy/python/predict_det.py +0 -158
PaddleClas/deploy/python/predict_rec.py +0 -138
PaddleClas/deploy/python/predict_system.py +0 -144
PaddleClas/deploy/python/preprocess.py +0 -337
PaddleClas/deploy/utils/__init__.py +0 -5
PaddleClas/deploy/utils/config.py +0 -197
PaddleClas/deploy/utils/draw_bbox.py +0 -61
PaddleClas/deploy/utils/encode_decode.py +0 -31
PaddleClas/deploy/utils/get_image_list.py +0 -49
PaddleClas/deploy/utils/logger.py +0 -120
PaddleClas/deploy/utils/predictor.py +0 -71
PaddleClas/deploy/vector_search/__init__.py +0 -1
PaddleClas/deploy/vector_search/interface.py +0 -272
PaddleClas/deploy/vector_search/test.py +0 -34
PaddleClas/hubconf.py +0 -788
PaddleClas/paddleclas.py +0 -552
PaddleClas/ppcls/__init__.py +0 -20
PaddleClas/ppcls/arch/__init__.py +0 -127
PaddleClas/ppcls/arch/backbone/__init__.py +0 -80
PaddleClas/ppcls/arch/backbone/base/__init__.py +0 -0
PaddleClas/ppcls/arch/backbone/base/theseus_layer.py +0 -126
PaddleClas/ppcls/arch/backbone/legendary_models/__init__.py +0 -6
PaddleClas/ppcls/arch/backbone/legendary_models/esnet.py +0 -355
PaddleClas/ppcls/arch/backbone/legendary_models/hrnet.py +0 -744
PaddleClas/ppcls/arch/backbone/legendary_models/inception_v3.py +0 -539
PaddleClas/ppcls/arch/backbone/legendary_models/mobilenet_v1.py +0 -234
PaddleClas/ppcls/arch/backbone/legendary_models/mobilenet_v3.py +0 -561
PaddleClas/ppcls/arch/backbone/legendary_models/pp_lcnet.py +0 -399
PaddleClas/ppcls/arch/backbone/legendary_models/resnet.py +0 -534
PaddleClas/ppcls/arch/backbone/legendary_models/vgg.py +0 -231
PaddleClas/ppcls/arch/backbone/model_zoo/__init__.py +0 -0
PaddleClas/ppcls/arch/backbone/model_zoo/alexnet.py +0 -168
PaddleClas/ppcls/arch/backbone/model_zoo/cspnet.py +0 -376
PaddleClas/ppcls/arch/backbone/model_zoo/darknet.py +0 -197
PaddleClas/ppcls/arch/backbone/model_zoo/densenet.py +0 -344
PaddleClas/ppcls/arch/backbone/model_zoo/distilled_vision_transformer.py +0 -272
PaddleClas/ppcls/arch/backbone/model_zoo/dla.py +0 -528
PaddleClas/ppcls/arch/backbone/model_zoo/dpn.py +0 -451
PaddleClas/ppcls/arch/backbone/model_zoo/efficientnet.py +0 -976
PaddleClas/ppcls/arch/backbone/model_zoo/ghostnet.py +0 -363
PaddleClas/ppcls/arch/backbone/model_zoo/googlenet.py +0 -229
PaddleClas/ppcls/arch/backbone/model_zoo/gvt.py +0 -693
PaddleClas/ppcls/arch/backbone/model_zoo/hardnet.py +0 -293
PaddleClas/ppcls/arch/backbone/model_zoo/inception_v4.py +0 -477
PaddleClas/ppcls/arch/backbone/model_zoo/levit.py +0 -589
PaddleClas/ppcls/arch/backbone/model_zoo/mixnet.py +0 -815
PaddleClas/ppcls/arch/backbone/model_zoo/mobilenet_v2.py +0 -287
PaddleClas/ppcls/arch/backbone/model_zoo/rednet.py +0 -203
PaddleClas/ppcls/arch/backbone/model_zoo/regnet.py +0 -431
PaddleClas/ppcls/arch/backbone/model_zoo/repvgg.py +0 -422
PaddleClas/ppcls/arch/backbone/model_zoo/res2net.py +0 -264
PaddleClas/ppcls/arch/backbone/model_zoo/res2net_vd.py +0 -305
PaddleClas/ppcls/arch/backbone/model_zoo/resnest.py +0 -740
PaddleClas/ppcls/arch/backbone/model_zoo/resnet_vc.py +0 -309
PaddleClas/ppcls/arch/backbone/model_zoo/resnext.py +0 -298
PaddleClas/ppcls/arch/backbone/model_zoo/resnext101_wsl.py +0 -490
PaddleClas/ppcls/arch/backbone/model_zoo/resnext_vd.py +0 -317
PaddleClas/ppcls/arch/backbone/model_zoo/rexnet.py +0 -281
PaddleClas/ppcls/arch/backbone/model_zoo/se_resnet_vd.py +0 -390
PaddleClas/ppcls/arch/backbone/model_zoo/se_resnext.py +0 -364
PaddleClas/ppcls/arch/backbone/model_zoo/se_resnext_vd.py +0 -309
PaddleClas/ppcls/arch/backbone/model_zoo/shufflenet_v2.py +0 -362
PaddleClas/ppcls/arch/backbone/model_zoo/squeezenet.py +0 -194
PaddleClas/ppcls/arch/backbone/model_zoo/swin_transformer.py +0 -857
PaddleClas/ppcls/arch/backbone/model_zoo/tnt.py +0 -385
PaddleClas/ppcls/arch/backbone/model_zoo/vision_transformer.py +0 -495
PaddleClas/ppcls/arch/backbone/model_zoo/xception.py +0 -377
PaddleClas/ppcls/arch/backbone/model_zoo/xception_deeplab.py +0 -421
PaddleClas/ppcls/arch/backbone/variant_models/__init__.py +0 -3
PaddleClas/ppcls/arch/backbone/variant_models/pp_lcnet_variant.py +0 -29
PaddleClas/ppcls/arch/backbone/variant_models/resnet_variant.py +0 -23
PaddleClas/ppcls/arch/backbone/variant_models/vgg_variant.py +0 -28
PaddleClas/ppcls/arch/gears/__init__.py +0 -32
PaddleClas/ppcls/arch/gears/arcmargin.py +0 -72
PaddleClas/ppcls/arch/gears/circlemargin.py +0 -59
PaddleClas/ppcls/arch/gears/cosmargin.py +0 -55
PaddleClas/ppcls/arch/gears/fc.py +0 -35
PaddleClas/ppcls/arch/gears/identity_head.py +0 -9
PaddleClas/ppcls/arch/gears/vehicle_neck.py +0 -52
PaddleClas/ppcls/arch/utils.py +0 -53
PaddleClas/ppcls/data/__init__.py +0 -144
PaddleClas/ppcls/data/dataloader/DistributedRandomIdentitySampler.py +0 -90
PaddleClas/ppcls/data/dataloader/__init__.py +0 -9
PaddleClas/ppcls/data/dataloader/common_dataset.py +0 -84
PaddleClas/ppcls/data/dataloader/dali.py +0 -319
PaddleClas/ppcls/data/dataloader/icartoon_dataset.py +0 -36
PaddleClas/ppcls/data/dataloader/imagenet_dataset.py +0 -38
PaddleClas/ppcls/data/dataloader/logo_dataset.py +0 -46
PaddleClas/ppcls/data/dataloader/mix_dataset.py +0 -49
PaddleClas/ppcls/data/dataloader/mix_sampler.py +0 -79
PaddleClas/ppcls/data/dataloader/multilabel_dataset.py +0 -59
PaddleClas/ppcls/data/dataloader/pk_sampler.py +0 -105
PaddleClas/ppcls/data/dataloader/vehicle_dataset.py +0 -138
PaddleClas/ppcls/data/postprocess/__init__.py +0 -41
PaddleClas/ppcls/data/postprocess/topk.py +0 -85
PaddleClas/ppcls/data/preprocess/__init__.py +0 -100
PaddleClas/ppcls/data/preprocess/batch_ops/__init__.py +0 -1
PaddleClas/ppcls/data/preprocess/batch_ops/batch_operators.py +0 -231
PaddleClas/ppcls/data/preprocess/ops/__init__.py +0 -1
PaddleClas/ppcls/data/preprocess/ops/autoaugment.py +0 -264
PaddleClas/ppcls/data/preprocess/ops/cutout.py +0 -41
PaddleClas/ppcls/data/preprocess/ops/fmix.py +0 -217
PaddleClas/ppcls/data/preprocess/ops/functional.py +0 -138
PaddleClas/ppcls/data/preprocess/ops/grid.py +0 -89
PaddleClas/ppcls/data/preprocess/ops/hide_and_seek.py +0 -44
PaddleClas/ppcls/data/preprocess/ops/operators.py +0 -384
PaddleClas/ppcls/data/preprocess/ops/randaugment.py +0 -106
PaddleClas/ppcls/data/preprocess/ops/random_erasing.py +0 -90
PaddleClas/ppcls/data/preprocess/ops/timm_autoaugment.py +0 -877
PaddleClas/ppcls/data/utils/__init__.py +0 -13
PaddleClas/ppcls/data/utils/get_image_list.py +0 -49
PaddleClas/ppcls/engine/__init__.py +0 -0
PaddleClas/ppcls/engine/engine.py +0 -436
PaddleClas/ppcls/engine/evaluation/__init__.py +0 -16
PaddleClas/ppcls/engine/evaluation/classification.py +0 -143
PaddleClas/ppcls/engine/evaluation/retrieval.py +0 -169
PaddleClas/ppcls/engine/slim/__init__.py +0 -16
PaddleClas/ppcls/engine/slim/prune.py +0 -66
PaddleClas/ppcls/engine/slim/quant.py +0 -55
PaddleClas/ppcls/engine/train/__init__.py +0 -14
PaddleClas/ppcls/engine/train/train.py +0 -79
PaddleClas/ppcls/engine/train/utils.py +0 -72
PaddleClas/ppcls/loss/__init__.py +0 -65
PaddleClas/ppcls/loss/celoss.py +0 -67
PaddleClas/ppcls/loss/centerloss.py +0 -54
PaddleClas/ppcls/loss/comfunc.py +0 -45
PaddleClas/ppcls/loss/deephashloss.py +0 -92
PaddleClas/ppcls/loss/distanceloss.py +0 -43
PaddleClas/ppcls/loss/distillationloss.py +0 -141
PaddleClas/ppcls/loss/dmlloss.py +0 -46
PaddleClas/ppcls/loss/emlloss.py +0 -97
PaddleClas/ppcls/loss/googlenetloss.py +0 -41
PaddleClas/ppcls/loss/msmloss.py +0 -78
PaddleClas/ppcls/loss/multilabelloss.py +0 -43
PaddleClas/ppcls/loss/npairsloss.py +0 -38
PaddleClas/ppcls/loss/pairwisecosface.py +0 -55
PaddleClas/ppcls/loss/supconloss.py +0 -108
PaddleClas/ppcls/loss/trihardloss.py +0 -82
PaddleClas/ppcls/loss/triplet.py +0 -137
PaddleClas/ppcls/metric/__init__.py +0 -51
PaddleClas/ppcls/metric/metrics.py +0 -308
PaddleClas/ppcls/optimizer/__init__.py +0 -72
PaddleClas/ppcls/optimizer/learning_rate.py +0 -326
PaddleClas/ppcls/optimizer/optimizer.py +0 -207
PaddleClas/ppcls/utils/__init__.py +0 -27
PaddleClas/ppcls/utils/check.py +0 -151
PaddleClas/ppcls/utils/config.py +0 -210
PaddleClas/ppcls/utils/download.py +0 -319
PaddleClas/ppcls/utils/ema.py +0 -63
PaddleClas/ppcls/utils/logger.py +0 -137
PaddleClas/ppcls/utils/metrics.py +0 -107
PaddleClas/ppcls/utils/misc.py +0 -63
PaddleClas/ppcls/utils/model_zoo.py +0 -213
PaddleClas/ppcls/utils/profiler.py +0 -111
PaddleClas/ppcls/utils/save_load.py +0 -136
PaddleClas/setup.py +0 -58
PaddleClas/tools/__init__.py +0 -15
PaddleClas/tools/eval.py +0 -31
PaddleClas/tools/export_model.py +0 -34
PaddleClas/tools/infer.py +0 -31
PaddleClas/tools/train.py +0 -32
paddlex/cls.py +0 -82
paddlex/command.py +0 -215
paddlex/cv/__init__.py +0 -17
paddlex/cv/datasets/__init__.py +0 -18
paddlex/cv/datasets/coco.py +0 -208
paddlex/cv/datasets/imagenet.py +0 -88
paddlex/cv/datasets/seg_dataset.py +0 -91
paddlex/cv/datasets/voc.py +0 -445
paddlex/cv/models/__init__.py +0 -18
paddlex/cv/models/base.py +0 -631
paddlex/cv/models/classifier.py +0 -989
paddlex/cv/models/detector.py +0 -2292
paddlex/cv/models/load_model.py +0 -148
paddlex/cv/models/segmenter.py +0 -768
paddlex/cv/models/slim/__init__.py +0 -13
paddlex/cv/models/slim/prune.py +0 -55
paddlex/cv/models/utils/__init__.py +0 -13
paddlex/cv/models/utils/det_metrics/__init__.py +0 -15
paddlex/cv/models/utils/det_metrics/coco_utils.py +0 -476
paddlex/cv/models/utils/det_metrics/metrics.py +0 -220
paddlex/cv/models/utils/infer_nets.py +0 -45
paddlex/cv/models/utils/seg_metrics.py +0 -62
paddlex/cv/models/utils/visualize.py +0 -399
paddlex/cv/transforms/__init__.py +0 -46
paddlex/cv/transforms/batch_operators.py +0 -286
paddlex/cv/transforms/box_utils.py +0 -41
paddlex/cv/transforms/functions.py +0 -193
paddlex/cv/transforms/operators.py +0 -1402
paddlex/deploy.py +0 -268
paddlex/det.py +0 -49
paddlex/paddleseg/__init__.py +0 -17
paddlex/paddleseg/core/__init__.py +0 -20
paddlex/paddleseg/core/infer.py +0 -289
paddlex/paddleseg/core/predict.py +0 -145
paddlex/paddleseg/core/train.py +0 -258
paddlex/paddleseg/core/val.py +0 -172
paddlex/paddleseg/cvlibs/__init__.py +0 -17
paddlex/paddleseg/cvlibs/callbacks.py +0 -279
paddlex/paddleseg/cvlibs/config.py +0 -359
paddlex/paddleseg/cvlibs/manager.py +0 -142
paddlex/paddleseg/cvlibs/param_init.py +0 -91
paddlex/paddleseg/datasets/__init__.py +0 -21
paddlex/paddleseg/datasets/ade.py +0 -112
paddlex/paddleseg/datasets/cityscapes.py +0 -86
paddlex/paddleseg/datasets/cocostuff.py +0 -79
paddlex/paddleseg/datasets/dataset.py +0 -164
paddlex/paddleseg/datasets/mini_deep_globe_road_extraction.py +0 -95
paddlex/paddleseg/datasets/optic_disc_seg.py +0 -97
paddlex/paddleseg/datasets/pascal_context.py +0 -80
paddlex/paddleseg/datasets/voc.py +0 -113
paddlex/paddleseg/models/__init__.py +0 -39
paddlex/paddleseg/models/ann.py +0 -436
paddlex/paddleseg/models/attention_unet.py +0 -189
paddlex/paddleseg/models/backbones/__init__.py +0 -18
paddlex/paddleseg/models/backbones/hrnet.py +0 -815
paddlex/paddleseg/models/backbones/mobilenetv3.py +0 -365
paddlex/paddleseg/models/backbones/resnet_vd.py +0 -364
paddlex/paddleseg/models/backbones/xception_deeplab.py +0 -415
paddlex/paddleseg/models/bisenet.py +0 -311
paddlex/paddleseg/models/danet.py +0 -220
paddlex/paddleseg/models/decoupled_segnet.py +0 -233
paddlex/paddleseg/models/deeplab.py +0 -258
paddlex/paddleseg/models/dnlnet.py +0 -231
paddlex/paddleseg/models/emanet.py +0 -219
paddlex/paddleseg/models/fast_scnn.py +0 -318
paddlex/paddleseg/models/fcn.py +0 -135
paddlex/paddleseg/models/gcnet.py +0 -223
paddlex/paddleseg/models/gscnn.py +0 -357
paddlex/paddleseg/models/hardnet.py +0 -309
paddlex/paddleseg/models/isanet.py +0 -202
paddlex/paddleseg/models/layers/__init__.py +0 -19
paddlex/paddleseg/models/layers/activation.py +0 -73
paddlex/paddleseg/models/layers/attention.py +0 -146
paddlex/paddleseg/models/layers/layer_libs.py +0 -168
paddlex/paddleseg/models/layers/nonlocal2d.py +0 -155
paddlex/paddleseg/models/layers/pyramid_pool.py +0 -182
paddlex/paddleseg/models/losses/__init__.py +0 -27
paddlex/paddleseg/models/losses/binary_cross_entropy_loss.py +0 -174
paddlex/paddleseg/models/losses/bootstrapped_cross_entropy.py +0 -73
paddlex/paddleseg/models/losses/cross_entropy_loss.py +0 -94
paddlex/paddleseg/models/losses/decoupledsegnet_relax_boundary_loss.py +0 -129
paddlex/paddleseg/models/losses/dice_loss.py +0 -61
paddlex/paddleseg/models/losses/edge_attention_loss.py +0 -78
paddlex/paddleseg/models/losses/gscnn_dual_task_loss.py +0 -141
paddlex/paddleseg/models/losses/l1_loss.py +0 -76
paddlex/paddleseg/models/losses/lovasz_loss.py +0 -222
paddlex/paddleseg/models/losses/mean_square_error_loss.py +0 -65
paddlex/paddleseg/models/losses/mixed_loss.py +0 -58
paddlex/paddleseg/models/losses/ohem_cross_entropy_loss.py +0 -99
paddlex/paddleseg/models/losses/ohem_edge_attention_loss.py +0 -114
paddlex/paddleseg/models/ocrnet.py +0 -248
paddlex/paddleseg/models/pspnet.py +0 -147
paddlex/paddleseg/models/sfnet.py +0 -236
paddlex/paddleseg/models/shufflenet_slim.py +0 -268
paddlex/paddleseg/models/u2net.py +0 -574
paddlex/paddleseg/models/unet.py +0 -155
paddlex/paddleseg/models/unet_3plus.py +0 -316
paddlex/paddleseg/models/unet_plusplus.py +0 -237
paddlex/paddleseg/transforms/__init__.py +0 -16
paddlex/paddleseg/transforms/functional.py +0 -161
paddlex/paddleseg/transforms/transforms.py +0 -937
paddlex/paddleseg/utils/__init__.py +0 -22
paddlex/paddleseg/utils/config_check.py +0 -60
paddlex/paddleseg/utils/download.py +0 -163
paddlex/paddleseg/utils/env/__init__.py +0 -16
paddlex/paddleseg/utils/env/seg_env.py +0 -56
paddlex/paddleseg/utils/env/sys_env.py +0 -122
paddlex/paddleseg/utils/logger.py +0 -48
paddlex/paddleseg/utils/metrics.py +0 -146
paddlex/paddleseg/utils/progbar.py +0 -212
paddlex/paddleseg/utils/timer.py +0 -53
paddlex/paddleseg/utils/utils.py +0 -120
paddlex/paddleseg/utils/visualize.py +0 -90
paddlex/ppcls/__init__.py +0 -20
paddlex/ppcls/arch/__init__.py +0 -127
paddlex/ppcls/arch/backbone/__init__.py +0 -80
paddlex/ppcls/arch/backbone/base/__init__.py +0 -0
paddlex/ppcls/arch/backbone/base/theseus_layer.py +0 -130
paddlex/ppcls/arch/backbone/legendary_models/__init__.py +0 -6
paddlex/ppcls/arch/backbone/legendary_models/esnet.py +0 -355
paddlex/ppcls/arch/backbone/legendary_models/hrnet.py +0 -748
paddlex/ppcls/arch/backbone/legendary_models/inception_v3.py +0 -539
paddlex/ppcls/arch/backbone/legendary_models/mobilenet_v1.py +0 -234
paddlex/ppcls/arch/backbone/legendary_models/mobilenet_v3.py +0 -561
paddlex/ppcls/arch/backbone/legendary_models/pp_lcnet.py +0 -399
paddlex/ppcls/arch/backbone/legendary_models/resnet.py +0 -534
paddlex/ppcls/arch/backbone/legendary_models/vgg.py +0 -235
paddlex/ppcls/arch/backbone/model_zoo/__init__.py +0 -0
paddlex/ppcls/arch/backbone/model_zoo/alexnet.py +0 -168
paddlex/ppcls/arch/backbone/model_zoo/cspnet.py +0 -376
paddlex/ppcls/arch/backbone/model_zoo/darknet.py +0 -197
paddlex/ppcls/arch/backbone/model_zoo/densenet.py +0 -344
paddlex/ppcls/arch/backbone/model_zoo/distilled_vision_transformer.py +0 -272
paddlex/ppcls/arch/backbone/model_zoo/dla.py +0 -528
paddlex/ppcls/arch/backbone/model_zoo/dpn.py +0 -451
paddlex/ppcls/arch/backbone/model_zoo/efficientnet.py +0 -976
paddlex/ppcls/arch/backbone/model_zoo/ghostnet.py +0 -363
paddlex/ppcls/arch/backbone/model_zoo/googlenet.py +0 -229
paddlex/ppcls/arch/backbone/model_zoo/gvt.py +0 -693
paddlex/ppcls/arch/backbone/model_zoo/hardnet.py +0 -293
paddlex/ppcls/arch/backbone/model_zoo/inception_v4.py +0 -477
paddlex/ppcls/arch/backbone/model_zoo/levit.py +0 -589
paddlex/ppcls/arch/backbone/model_zoo/mixnet.py +0 -815
paddlex/ppcls/arch/backbone/model_zoo/mobilenet_v2.py +0 -287
paddlex/ppcls/arch/backbone/model_zoo/rednet.py +0 -203
paddlex/ppcls/arch/backbone/model_zoo/regnet.py +0 -431
paddlex/ppcls/arch/backbone/model_zoo/repvgg.py +0 -422
paddlex/ppcls/arch/backbone/model_zoo/res2net.py +0 -264
paddlex/ppcls/arch/backbone/model_zoo/res2net_vd.py +0 -305
paddlex/ppcls/arch/backbone/model_zoo/resnest.py +0 -740
paddlex/ppcls/arch/backbone/model_zoo/resnet_vc.py +0 -309
paddlex/ppcls/arch/backbone/model_zoo/resnext.py +0 -298
paddlex/ppcls/arch/backbone/model_zoo/resnext101_wsl.py +0 -490
paddlex/ppcls/arch/backbone/model_zoo/resnext_vd.py +0 -317
paddlex/ppcls/arch/backbone/model_zoo/rexnet.py +0 -281
paddlex/ppcls/arch/backbone/model_zoo/se_resnet_vd.py +0 -390
paddlex/ppcls/arch/backbone/model_zoo/se_resnext.py +0 -364
paddlex/ppcls/arch/backbone/model_zoo/se_resnext_vd.py +0 -309
paddlex/ppcls/arch/backbone/model_zoo/shufflenet_v2.py +0 -362
paddlex/ppcls/arch/backbone/model_zoo/squeezenet.py +0 -194
paddlex/ppcls/arch/backbone/model_zoo/swin_transformer.py +0 -857
paddlex/ppcls/arch/backbone/model_zoo/tnt.py +0 -385
paddlex/ppcls/arch/backbone/model_zoo/vision_transformer.py +0 -495
paddlex/ppcls/arch/backbone/model_zoo/xception.py +0 -377
paddlex/ppcls/arch/backbone/model_zoo/xception_deeplab.py +0 -421
paddlex/ppcls/arch/backbone/variant_models/__init__.py +0 -3
paddlex/ppcls/arch/backbone/variant_models/pp_lcnet_variant.py +0 -29
paddlex/ppcls/arch/backbone/variant_models/resnet_variant.py +0 -23
paddlex/ppcls/arch/backbone/variant_models/vgg_variant.py +0 -28
paddlex/ppcls/arch/gears/__init__.py +0 -32
paddlex/ppcls/arch/gears/arcmargin.py +0 -72
paddlex/ppcls/arch/gears/circlemargin.py +0 -59
paddlex/ppcls/arch/gears/cosmargin.py +0 -55
paddlex/ppcls/arch/gears/fc.py +0 -35
paddlex/ppcls/arch/gears/identity_head.py +0 -9
paddlex/ppcls/arch/gears/vehicle_neck.py +0 -52
paddlex/ppcls/arch/utils.py +0 -53
paddlex/ppcls/data/__init__.py +0 -144
paddlex/ppcls/data/dataloader/DistributedRandomIdentitySampler.py +0 -90
paddlex/ppcls/data/dataloader/__init__.py +0 -9
paddlex/ppcls/data/dataloader/common_dataset.py +0 -84
paddlex/ppcls/data/dataloader/dali.py +0 -319
paddlex/ppcls/data/dataloader/icartoon_dataset.py +0 -36
paddlex/ppcls/data/dataloader/imagenet_dataset.py +0 -38
paddlex/ppcls/data/dataloader/logo_dataset.py +0 -46
paddlex/ppcls/data/dataloader/mix_dataset.py +0 -49
paddlex/ppcls/data/dataloader/mix_sampler.py +0 -79
paddlex/ppcls/data/dataloader/multilabel_dataset.py +0 -59
paddlex/ppcls/data/dataloader/pk_sampler.py +0 -105
paddlex/ppcls/data/dataloader/vehicle_dataset.py +0 -138
paddlex/ppcls/data/postprocess/__init__.py +0 -41
paddlex/ppcls/data/postprocess/topk.py +0 -85
paddlex/ppcls/data/preprocess/__init__.py +0 -100
paddlex/ppcls/data/preprocess/batch_ops/__init__.py +0 -0
paddlex/ppcls/data/preprocess/batch_ops/batch_operators.py +0 -231
paddlex/ppcls/data/preprocess/ops/__init__.py +0 -0
paddlex/ppcls/data/preprocess/ops/autoaugment.py +0 -264
paddlex/ppcls/data/preprocess/ops/cutout.py +0 -41
paddlex/ppcls/data/preprocess/ops/fmix.py +0 -217
paddlex/ppcls/data/preprocess/ops/functional.py +0 -141
paddlex/ppcls/data/preprocess/ops/grid.py +0 -89
paddlex/ppcls/data/preprocess/ops/hide_and_seek.py +0 -44
paddlex/ppcls/data/preprocess/ops/operators.py +0 -384
paddlex/ppcls/data/preprocess/ops/randaugment.py +0 -106
paddlex/ppcls/data/preprocess/ops/random_erasing.py +0 -90
paddlex/ppcls/data/preprocess/ops/timm_autoaugment.py +0 -877
paddlex/ppcls/data/utils/__init__.py +0 -13
paddlex/ppcls/data/utils/get_image_list.py +0 -49
paddlex/ppcls/engine/__init__.py +0 -0
paddlex/ppcls/engine/engine.py +0 -436
paddlex/ppcls/engine/evaluation/__init__.py +0 -16
paddlex/ppcls/engine/evaluation/classification.py +0 -143
paddlex/ppcls/engine/evaluation/retrieval.py +0 -169
paddlex/ppcls/engine/slim/__init__.py +0 -16
paddlex/ppcls/engine/slim/prune.py +0 -66
paddlex/ppcls/engine/slim/quant.py +0 -55
paddlex/ppcls/engine/train/__init__.py +0 -14
paddlex/ppcls/engine/train/train.py +0 -79
paddlex/ppcls/engine/train/utils.py +0 -72
paddlex/ppcls/loss/__init__.py +0 -65
paddlex/ppcls/loss/celoss.py +0 -67
paddlex/ppcls/loss/centerloss.py +0 -54
paddlex/ppcls/loss/comfunc.py +0 -45
paddlex/ppcls/loss/deephashloss.py +0 -96
paddlex/ppcls/loss/distanceloss.py +0 -43
paddlex/ppcls/loss/distillationloss.py +0 -141
paddlex/ppcls/loss/dmlloss.py +0 -46
paddlex/ppcls/loss/emlloss.py +0 -97
paddlex/ppcls/loss/googlenetloss.py +0 -42
paddlex/ppcls/loss/msmloss.py +0 -78
paddlex/ppcls/loss/multilabelloss.py +0 -43
paddlex/ppcls/loss/npairsloss.py +0 -38
paddlex/ppcls/loss/pairwisecosface.py +0 -59
paddlex/ppcls/loss/supconloss.py +0 -108
paddlex/ppcls/loss/trihardloss.py +0 -82
paddlex/ppcls/loss/triplet.py +0 -137
paddlex/ppcls/metric/__init__.py +0 -51
paddlex/ppcls/metric/metrics.py +0 -308
paddlex/ppcls/optimizer/__init__.py +0 -72
paddlex/ppcls/optimizer/learning_rate.py +0 -326
paddlex/ppcls/optimizer/optimizer.py +0 -208
paddlex/ppcls/utils/__init__.py +0 -27
paddlex/ppcls/utils/check.py +0 -151
paddlex/ppcls/utils/config.py +0 -210
paddlex/ppcls/utils/download.py +0 -319
paddlex/ppcls/utils/ema.py +0 -63
paddlex/ppcls/utils/logger.py +0 -137
paddlex/ppcls/utils/metrics.py +0 -112
paddlex/ppcls/utils/misc.py +0 -63
paddlex/ppcls/utils/model_zoo.py +0 -213
paddlex/ppcls/utils/profiler.py +0 -111
paddlex/ppcls/utils/save_load.py +0 -136
paddlex/ppdet/__init__.py +0 -16
paddlex/ppdet/core/__init__.py +0 -15
paddlex/ppdet/core/config/__init__.py +0 -13
paddlex/ppdet/core/config/schema.py +0 -248
paddlex/ppdet/core/config/yaml_helpers.py +0 -118
paddlex/ppdet/core/workspace.py +0 -278
paddlex/ppdet/data/__init__.py +0 -21
paddlex/ppdet/data/crop_utils/__init__.py +0 -13
paddlex/ppdet/data/crop_utils/annotation_cropper.py +0 -585
paddlex/ppdet/data/crop_utils/chip_box_utils.py +0 -170
paddlex/ppdet/data/reader.py +0 -302
paddlex/ppdet/data/shm_utils.py +0 -67
paddlex/ppdet/data/source/__init__.py +0 -29
paddlex/ppdet/data/source/category.py +0 -904
paddlex/ppdet/data/source/coco.py +0 -251
paddlex/ppdet/data/source/dataset.py +0 -197
paddlex/ppdet/data/source/keypoint_coco.py +0 -669
paddlex/ppdet/data/source/mot.py +0 -636
paddlex/ppdet/data/source/sniper_coco.py +0 -191
paddlex/ppdet/data/source/voc.py +0 -231
paddlex/ppdet/data/source/widerface.py +0 -180
paddlex/ppdet/data/transform/__init__.py +0 -28
paddlex/ppdet/data/transform/atss_assigner.py +0 -270
paddlex/ppdet/data/transform/autoaugment_utils.py +0 -1591
paddlex/ppdet/data/transform/batch_operators.py +0 -1080
paddlex/ppdet/data/transform/gridmask_utils.py +0 -86
paddlex/ppdet/data/transform/keypoint_operators.py +0 -868
paddlex/ppdet/data/transform/mot_operators.py +0 -628
paddlex/ppdet/data/transform/op_helper.py +0 -498
paddlex/ppdet/data/transform/operators.py +0 -3025
paddlex/ppdet/engine/__init__.py +0 -30
paddlex/ppdet/engine/callbacks.py +0 -340
paddlex/ppdet/engine/env.py +0 -50
paddlex/ppdet/engine/export_utils.py +0 -177
paddlex/ppdet/engine/tracker.py +0 -538
paddlex/ppdet/engine/trainer.py +0 -723
paddlex/ppdet/metrics/__init__.py +0 -29
paddlex/ppdet/metrics/coco_utils.py +0 -184
paddlex/ppdet/metrics/json_results.py +0 -149
paddlex/ppdet/metrics/keypoint_metrics.py +0 -401
paddlex/ppdet/metrics/map_utils.py +0 -444
paddlex/ppdet/metrics/mcmot_metrics.py +0 -470
paddlex/ppdet/metrics/metrics.py +0 -434
paddlex/ppdet/metrics/mot_metrics.py +0 -1236
paddlex/ppdet/metrics/munkres.py +0 -428
paddlex/ppdet/metrics/widerface_utils.py +0 -393
paddlex/ppdet/model_zoo/__init__.py +0 -18
paddlex/ppdet/model_zoo/model_zoo.py +0 -84
paddlex/ppdet/modeling/__init__.py +0 -45
paddlex/ppdet/modeling/architectures/__init__.py +0 -51
paddlex/ppdet/modeling/architectures/blazeface.py +0 -91
paddlex/ppdet/modeling/architectures/cascade_rcnn.py +0 -144
paddlex/ppdet/modeling/architectures/centernet.py +0 -108
paddlex/ppdet/modeling/architectures/deepsort.py +0 -69
paddlex/ppdet/modeling/architectures/detr.py +0 -93
paddlex/ppdet/modeling/architectures/fairmot.py +0 -100
paddlex/ppdet/modeling/architectures/faster_rcnn.py +0 -106
paddlex/ppdet/modeling/architectures/fcos.py +0 -105
paddlex/ppdet/modeling/architectures/gfl.py +0 -87
paddlex/ppdet/modeling/architectures/jde.py +0 -111
paddlex/ppdet/modeling/architectures/keypoint_hrhrnet.py +0 -287
paddlex/ppdet/modeling/architectures/keypoint_hrnet.py +0 -267
paddlex/ppdet/modeling/architectures/mask_rcnn.py +0 -135
paddlex/ppdet/modeling/architectures/meta_arch.py +0 -128
paddlex/ppdet/modeling/architectures/picodet.py +0 -91
paddlex/ppdet/modeling/architectures/s2anet.py +0 -102
paddlex/ppdet/modeling/architectures/solov2.py +0 -110
paddlex/ppdet/modeling/architectures/sparse_rcnn.py +0 -99
paddlex/ppdet/modeling/architectures/ssd.py +0 -93
paddlex/ppdet/modeling/architectures/tood.py +0 -78
paddlex/ppdet/modeling/architectures/ttfnet.py +0 -98
paddlex/ppdet/modeling/architectures/yolo.py +0 -124
paddlex/ppdet/modeling/assigners/__init__.py +0 -23
paddlex/ppdet/modeling/assigners/atss_assigner.py +0 -211
paddlex/ppdet/modeling/assigners/simota_assigner.py +0 -262
paddlex/ppdet/modeling/assigners/task_aligned_assigner.py +0 -158
paddlex/ppdet/modeling/assigners/utils.py +0 -195
paddlex/ppdet/modeling/backbones/__init__.py +0 -49
paddlex/ppdet/modeling/backbones/blazenet.py +0 -323
paddlex/ppdet/modeling/backbones/darknet.py +0 -340
paddlex/ppdet/modeling/backbones/dla.py +0 -244
paddlex/ppdet/modeling/backbones/esnet.py +0 -290
paddlex/ppdet/modeling/backbones/ghostnet.py +0 -470
paddlex/ppdet/modeling/backbones/hardnet.py +0 -224
paddlex/ppdet/modeling/backbones/hrnet.py +0 -727
paddlex/ppdet/modeling/backbones/lcnet.py +0 -259
paddlex/ppdet/modeling/backbones/lite_hrnet.py +0 -886
paddlex/ppdet/modeling/backbones/mobilenet_v1.py +0 -418
paddlex/ppdet/modeling/backbones/mobilenet_v3.py +0 -483
paddlex/ppdet/modeling/backbones/name_adapter.py +0 -69
paddlex/ppdet/modeling/backbones/res2net.py +0 -358
paddlex/ppdet/modeling/backbones/resnet.py +0 -613
paddlex/ppdet/modeling/backbones/senet.py +0 -139
paddlex/ppdet/modeling/backbones/shufflenet_v2.py +0 -246
paddlex/ppdet/modeling/backbones/swin_transformer.py +0 -743
paddlex/ppdet/modeling/backbones/vgg.py +0 -210
paddlex/ppdet/modeling/bbox_utils.py +0 -778
paddlex/ppdet/modeling/heads/__init__.py +0 -53
paddlex/ppdet/modeling/heads/bbox_head.py +0 -377
paddlex/ppdet/modeling/heads/cascade_head.py +0 -284
paddlex/ppdet/modeling/heads/centernet_head.py +0 -292
paddlex/ppdet/modeling/heads/detr_head.py +0 -368
paddlex/ppdet/modeling/heads/face_head.py +0 -110
paddlex/ppdet/modeling/heads/fcos_head.py +0 -259
paddlex/ppdet/modeling/heads/gfl_head.py +0 -487
paddlex/ppdet/modeling/heads/keypoint_hrhrnet_head.py +0 -108
paddlex/ppdet/modeling/heads/mask_head.py +0 -250
paddlex/ppdet/modeling/heads/pico_head.py +0 -278
paddlex/ppdet/modeling/heads/roi_extractor.py +0 -111
paddlex/ppdet/modeling/heads/s2anet_head.py +0 -1056
paddlex/ppdet/modeling/heads/simota_head.py +0 -506
paddlex/ppdet/modeling/heads/solov2_head.py +0 -560
paddlex/ppdet/modeling/heads/sparsercnn_head.py +0 -375
paddlex/ppdet/modeling/heads/ssd_head.py +0 -215
paddlex/ppdet/modeling/heads/tood_head.py +0 -366
paddlex/ppdet/modeling/heads/ttf_head.py +0 -316
paddlex/ppdet/modeling/heads/yolo_head.py +0 -124
paddlex/ppdet/modeling/initializer.py +0 -317
paddlex/ppdet/modeling/keypoint_utils.py +0 -342
paddlex/ppdet/modeling/layers.py +0 -1430
paddlex/ppdet/modeling/losses/__init__.py +0 -43
paddlex/ppdet/modeling/losses/ctfocal_loss.py +0 -68
paddlex/ppdet/modeling/losses/detr_loss.py +0 -233
paddlex/ppdet/modeling/losses/fairmot_loss.py +0 -41
paddlex/ppdet/modeling/losses/fcos_loss.py +0 -225
paddlex/ppdet/modeling/losses/gfocal_loss.py +0 -217
paddlex/ppdet/modeling/losses/iou_aware_loss.py +0 -47
paddlex/ppdet/modeling/losses/iou_loss.py +0 -210
paddlex/ppdet/modeling/losses/jde_loss.py +0 -193
paddlex/ppdet/modeling/losses/keypoint_loss.py +0 -229
paddlex/ppdet/modeling/losses/solov2_loss.py +0 -101
paddlex/ppdet/modeling/losses/sparsercnn_loss.py +0 -425
paddlex/ppdet/modeling/losses/ssd_loss.py +0 -170
paddlex/ppdet/modeling/losses/varifocal_loss.py +0 -152
paddlex/ppdet/modeling/losses/yolo_loss.py +0 -212
paddlex/ppdet/modeling/mot/__init__.py +0 -25
paddlex/ppdet/modeling/mot/matching/__init__.py +0 -19
paddlex/ppdet/modeling/mot/matching/deepsort_matching.py +0 -382
paddlex/ppdet/modeling/mot/matching/jde_matching.py +0 -144
paddlex/ppdet/modeling/mot/motion/__init__.py +0 -17
paddlex/ppdet/modeling/mot/motion/kalman_filter.py +0 -270
paddlex/ppdet/modeling/mot/tracker/__init__.py +0 -23
paddlex/ppdet/modeling/mot/tracker/base_jde_tracker.py +0 -297
paddlex/ppdet/modeling/mot/tracker/base_sde_tracker.py +0 -156
paddlex/ppdet/modeling/mot/tracker/deepsort_tracker.py +0 -188
paddlex/ppdet/modeling/mot/tracker/jde_tracker.py +0 -277
paddlex/ppdet/modeling/mot/utils.py +0 -263
paddlex/ppdet/modeling/mot/visualization.py +0 -150
paddlex/ppdet/modeling/necks/__init__.py +0 -30
paddlex/ppdet/modeling/necks/bifpn.py +0 -302
paddlex/ppdet/modeling/necks/blazeface_fpn.py +0 -216
paddlex/ppdet/modeling/necks/centernet_fpn.py +0 -426
paddlex/ppdet/modeling/necks/csp_pan.py +0 -364
paddlex/ppdet/modeling/necks/fpn.py +0 -231
paddlex/ppdet/modeling/necks/hrfpn.py +0 -126
paddlex/ppdet/modeling/necks/ttf_fpn.py +0 -242
paddlex/ppdet/modeling/necks/yolo_fpn.py +0 -988
paddlex/ppdet/modeling/ops.py +0 -1611
paddlex/ppdet/modeling/post_process.py +0 -731
paddlex/ppdet/modeling/proposal_generator/__init__.py +0 -2
paddlex/ppdet/modeling/proposal_generator/anchor_generator.py +0 -135
paddlex/ppdet/modeling/proposal_generator/proposal_generator.py +0 -77
paddlex/ppdet/modeling/proposal_generator/rpn_head.py +0 -260
paddlex/ppdet/modeling/proposal_generator/target.py +0 -681
paddlex/ppdet/modeling/proposal_generator/target_layer.py +0 -491
paddlex/ppdet/modeling/reid/__init__.py +0 -25
paddlex/ppdet/modeling/reid/fairmot_embedding_head.py +0 -225
paddlex/ppdet/modeling/reid/jde_embedding_head.py +0 -214
paddlex/ppdet/modeling/reid/pplcnet_embedding.py +0 -282
paddlex/ppdet/modeling/reid/pyramidal_embedding.py +0 -144
paddlex/ppdet/modeling/reid/resnet.py +0 -310
paddlex/ppdet/modeling/shape_spec.py +0 -25
paddlex/ppdet/modeling/transformers/__init__.py +0 -25
paddlex/ppdet/modeling/transformers/deformable_transformer.py +0 -517
paddlex/ppdet/modeling/transformers/detr_transformer.py +0 -353
paddlex/ppdet/modeling/transformers/matchers.py +0 -127
paddlex/ppdet/modeling/transformers/position_encoding.py +0 -108
paddlex/ppdet/modeling/transformers/utils.py +0 -110
paddlex/ppdet/optimizer.py +0 -335
paddlex/ppdet/slim/__init__.py +0 -82
paddlex/ppdet/slim/distill.py +0 -110
paddlex/ppdet/slim/prune.py +0 -85
paddlex/ppdet/slim/quant.py +0 -84
paddlex/ppdet/slim/unstructured_prune.py +0 -66
paddlex/ppdet/utils/__init__.py +0 -13
paddlex/ppdet/utils/check.py +0 -112
paddlex/ppdet/utils/checkpoint.py +0 -226
paddlex/ppdet/utils/cli.py +0 -151
paddlex/ppdet/utils/colormap.py +0 -58
paddlex/ppdet/utils/download.py +0 -558
paddlex/ppdet/utils/logger.py +0 -70
paddlex/ppdet/utils/profiler.py +0 -111
paddlex/ppdet/utils/stats.py +0 -94
paddlex/ppdet/utils/visualizer.py +0 -321
paddlex/ppdet/utils/voc_utils.py +0 -86
paddlex/seg.py +0 -41
paddlex/tools/__init__.py +0 -17
paddlex/tools/anchor_clustering/__init__.py +0 -15
paddlex/tools/anchor_clustering/yolo_cluster.py +0 -178
paddlex/tools/convert.py +0 -52
paddlex/tools/dataset_conversion/__init__.py +0 -24
paddlex/tools/dataset_conversion/x2coco.py +0 -379
paddlex/tools/dataset_conversion/x2imagenet.py +0 -82
paddlex/tools/dataset_conversion/x2seg.py +0 -343
paddlex/tools/dataset_conversion/x2voc.py +0 -230
paddlex/tools/dataset_split/__init__.py +0 -23
paddlex/tools/dataset_split/coco_split.py +0 -69
paddlex/tools/dataset_split/imagenet_split.py +0 -75
paddlex/tools/dataset_split/seg_split.py +0 -96
paddlex/tools/dataset_split/utils.py +0 -75
paddlex/tools/dataset_split/voc_split.py +0 -91
paddlex/tools/split.py +0 -41
paddlex/utils/checkpoint.py +0 -492
paddlex/utils/shm.py +0 -67
paddlex/utils/stats.py +0 -68
paddlex/utils/utils.py +0 -229
paddlex-2.1.0.data/data/paddlex_restful/restful/templates/paddlex_restful_demo.html +0 -5205
paddlex-2.1.0.dist-info/LICENSE +0 -201
paddlex-2.1.0.dist-info/METADATA +0 -32
paddlex-2.1.0.dist-info/RECORD +0 -698
paddlex-2.1.0.dist-info/WHEEL +0 -5
paddlex-2.1.0.dist-info/entry_points.txt +0 -4
paddlex-2.1.0.dist-info/top_level.txt +0 -3
paddlex_restful/__init__.py +0 -15
paddlex_restful/command.py +0 -63
paddlex_restful/restful/__init__.py +0 -15
paddlex_restful/restful/app.py +0 -969
paddlex_restful/restful/dataset/__init__.py +0 -13
paddlex_restful/restful/dataset/cls_dataset.py +0 -159
paddlex_restful/restful/dataset/dataset.py +0 -266
paddlex_restful/restful/dataset/datasetbase.py +0 -86
paddlex_restful/restful/dataset/det_dataset.py +0 -190
paddlex_restful/restful/dataset/ins_seg_dataset.py +0 -312
paddlex_restful/restful/dataset/operate.py +0 -155
paddlex_restful/restful/dataset/seg_dataset.py +0 -222
paddlex_restful/restful/dataset/utils.py +0 -267
paddlex_restful/restful/demo.py +0 -202
paddlex_restful/restful/dir.py +0 -45
paddlex_restful/restful/model.py +0 -312
paddlex_restful/restful/project/__init__.py +0 -13
paddlex_restful/restful/project/evaluate/__init__.py +0 -13
paddlex_restful/restful/project/evaluate/classification.py +0 -126
paddlex_restful/restful/project/evaluate/detection.py +0 -789
paddlex_restful/restful/project/evaluate/draw_pred_result.py +0 -181
paddlex_restful/restful/project/evaluate/segmentation.py +0 -122
paddlex_restful/restful/project/operate.py +0 -931
paddlex_restful/restful/project/project.py +0 -143
paddlex_restful/restful/project/prune/__init__.py +0 -13
paddlex_restful/restful/project/prune/classification.py +0 -32
paddlex_restful/restful/project/prune/detection.py +0 -48
paddlex_restful/restful/project/prune/segmentation.py +0 -34
paddlex_restful/restful/project/task.py +0 -884
paddlex_restful/restful/project/train/__init__.py +0 -13
paddlex_restful/restful/project/train/classification.py +0 -141
paddlex_restful/restful/project/train/detection.py +0 -263
paddlex_restful/restful/project/train/params.py +0 -432
paddlex_restful/restful/project/train/params_v2.py +0 -326
paddlex_restful/restful/project/train/segmentation.py +0 -191
paddlex_restful/restful/project/visualize.py +0 -244
paddlex_restful/restful/system.py +0 -102
paddlex_restful/restful/templates/paddlex_restful_demo.html +0 -5205
paddlex_restful/restful/utils.py +0 -841
paddlex_restful/restful/workspace.py +0 -343
paddlex_restful/restful/workspace_pb2.py +0 -1411

paddlex/inference/pipelines/layout_parsing/utils.py ADDED Viewed

@@ -0,0 +1,2385 @@
+# Copyright (c) 2024 PaddlePaddle Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+__all__ = [
+    "get_sub_regions_ocr_res",
+    "get_layout_ordering",
+    "get_single_block_parsing_res",
+    "get_show_color",
+    "sorted_layout_boxes",
+]
+import numpy as np
+from PIL import Image
+import uuid
+import re
+from pathlib import Path
+from copy import deepcopy
+from typing import Optional, Union, List, Tuple, Dict, Any
+from ..ocr.result import OCRResult
+from ...models.object_detection.result import DetResult
+from ..components import convert_points_to_boxes
+def get_overlap_boxes_idx(src_boxes: np.ndarray, ref_boxes: np.ndarray) -> List:
+    """
+    Get the indices of source boxes that overlap with reference boxes based on a specified threshold.
+    Args:
+        src_boxes (np.ndarray): A 2D numpy array of source bounding boxes.
+        ref_boxes (np.ndarray): A 2D numpy array of reference bounding boxes.
+    Returns:
+        match_idx_list (list): A list of indices of source boxes that overlap with reference boxes.
+    """
+    match_idx_list = []
+    src_boxes_num = len(src_boxes)
+    if src_boxes_num > 0 and len(ref_boxes) > 0:
+        for rno in range(len(ref_boxes)):
+            ref_box = ref_boxes[rno]
+            x1 = np.maximum(ref_box[0], src_boxes[:, 0])
+            y1 = np.maximum(ref_box[1], src_boxes[:, 1])
+            x2 = np.minimum(ref_box[2], src_boxes[:, 2])
+            y2 = np.minimum(ref_box[3], src_boxes[:, 3])
+            pub_w = x2 - x1
+            pub_h = y2 - y1
+            match_idx = np.where((pub_w > 3) & (pub_h > 3))[0]
+            match_idx_list.extend(match_idx)
+    return match_idx_list
+def get_sub_regions_ocr_res(
+    overall_ocr_res: OCRResult,
+    object_boxes: List,
+    flag_within: bool = True,
+    return_match_idx: bool = False,
+) -> OCRResult:
+    """
+    Filters OCR results to only include text boxes within specified object boxes based on a flag.
+    Args:
+        overall_ocr_res (OCRResult): The original OCR result containing all text boxes.
+        object_boxes (list): A list of bounding boxes for the objects of interest.
+        flag_within (bool): If True, only include text boxes within the object boxes. If False, exclude text boxes within the object boxes.
+        return_match_idx (bool): If True, return the list of matching indices.
+    Returns:
+        OCRResult: A filtered OCR result containing only the relevant text boxes.
+    """
+    sub_regions_ocr_res = {}
+    sub_regions_ocr_res["rec_polys"] = []
+    sub_regions_ocr_res["rec_texts"] = []
+    sub_regions_ocr_res["rec_scores"] = []
+    sub_regions_ocr_res["rec_boxes"] = []
+    overall_text_boxes = overall_ocr_res["rec_boxes"]
+    match_idx_list = get_overlap_boxes_idx(overall_text_boxes, object_boxes)
+    match_idx_list = list(set(match_idx_list))
+    for box_no in range(len(overall_text_boxes)):
+        if flag_within:
+            if box_no in match_idx_list:
+                flag_match = True
+            else:
+                flag_match = False
+        else:
+            if box_no not in match_idx_list:
+                flag_match = True
+            else:
+                flag_match = False
+        if flag_match:
+            sub_regions_ocr_res["rec_polys"].append(
+                overall_ocr_res["rec_polys"][box_no]
+            )
+            sub_regions_ocr_res["rec_texts"].append(
+                overall_ocr_res["rec_texts"][box_no]
+            )
+            sub_regions_ocr_res["rec_scores"].append(
+                overall_ocr_res["rec_scores"][box_no]
+            )
+            sub_regions_ocr_res["rec_boxes"].append(
+                overall_ocr_res["rec_boxes"][box_no]
+            )
+    for key in ["rec_polys", "rec_scores", "rec_boxes"]:
+        sub_regions_ocr_res[key] = np.array(sub_regions_ocr_res[key])
+    return (
+        (sub_regions_ocr_res, match_idx_list)
+        if return_match_idx
+        else sub_regions_ocr_res
+    )
+def sorted_layout_boxes(res, w):
+    """
+    Sort text boxes in order from top to bottom, left to right
+    Args:
+        res: List of dictionaries containing layout information.
+        w: Width of image.
+    Returns:
+        List of dictionaries containing sorted layout information.
+    """
+    num_boxes = len(res)
+    if num_boxes == 1:
+        return res
+    # Sort on the y axis first or sort it on the x axis
+    sorted_boxes = sorted(res, key=lambda x: (x["block_bbox"][1], x["block_bbox"][0]))
+    _boxes = list(sorted_boxes)
+    new_res = []
+    res_left = []
+    res_right = []
+    i = 0
+    while True:
+        if i >= num_boxes:
+            break
+        # Check that the bbox is on the left
+        elif (
+            _boxes[i]["block_bbox"][0] < w / 4
+            and _boxes[i]["block_bbox"][2] < 3 * w / 5
+        ):
+            res_left.append(_boxes[i])
+            i += 1
+        elif _boxes[i]["block_bbox"][0] > 2 * w / 5:
+            res_right.append(_boxes[i])
+            i += 1
+        else:
+            new_res += res_left
+            new_res += res_right
+            new_res.append(_boxes[i])
+            res_left = []
+            res_right = []
+            i += 1
+    res_left = sorted(res_left, key=lambda x: (x["block_bbox"][1]))
+    res_right = sorted(res_right, key=lambda x: (x["block_bbox"][1]))
+    if res_left:
+        new_res += res_left
+    if res_right:
+        new_res += res_right
+    return new_res
+def _calculate_overlap_area_div_minbox_area_ratio(
+    bbox1: Union[list, tuple],
+    bbox2: Union[list, tuple],
+) -> float:
+    """
+    Calculate the ratio of the overlap area between bbox1 and bbox2
+    to the area of the smaller bounding box.
+    Args:
+        bbox1 (list or tuple): Coordinates of the first bounding box [x_min, y_min, x_max, y_max].
+        bbox2 (list or tuple): Coordinates of the second bounding box [x_min, y_min, x_max, y_max].
+    Returns:
+        float: The ratio of the overlap area to the area of the smaller bounding box.
+    """
+    bbox1 = list(map(int, bbox1))
+    bbox2 = list(map(int, bbox2))
+    x_left = max(bbox1[0], bbox2[0])
+    y_top = max(bbox1[1], bbox2[1])
+    x_right = min(bbox1[2], bbox2[2])
+    y_bottom = min(bbox1[3], bbox2[3])
+    if x_right <= x_left or y_bottom <= y_top:
+        return 0.0
+    intersection_area = (x_right - x_left) * (y_bottom - y_top)
+    area_bbox1 = (bbox1[2] - bbox1[0]) * (bbox1[3] - bbox1[1])
+    area_bbox2 = (bbox2[2] - bbox2[0]) * (bbox2[3] - bbox2[1])
+    min_box_area = min(area_bbox1, area_bbox2)
+    if min_box_area <= 0:
+        return 0.0
+    return intersection_area / min_box_area
+def _whether_y_overlap_exceeds_threshold(
+    bbox1: Union[list, tuple],
+    bbox2: Union[list, tuple],
+    overlap_ratio_threshold: float = 0.6,
+) -> bool:
+    """
+    Determines whether the vertical overlap between two bounding boxes exceeds a given threshold.
+    Args:
+        bbox1 (list or tuple): The first bounding box defined as (left, top, right, bottom).
+        bbox2 (list or tuple): The second bounding box defined as (left, top, right, bottom).
+        overlap_ratio_threshold (float): The threshold ratio to determine if the overlap is significant.
+                                         Defaults to 0.6.
+    Returns:
+        bool: True if the vertical overlap divided by the minimum height of the two bounding boxes
+              exceeds the overlap_ratio_threshold, otherwise False.
+    """
+    _, y1_0, _, y1_1 = bbox1
+    _, y2_0, _, y2_1 = bbox2
+    overlap = max(0, min(y1_1, y2_1) - max(y1_0, y2_0))
+    min_height = min(y1_1 - y1_0, y2_1 - y2_0)
+    return (overlap / min_height) > overlap_ratio_threshold
+def _adjust_span_text(span: List[str], prepend: bool = False, append: bool = False):
+    """
+    Adjust the text of a span by prepending or appending a newline.
+    Args:
+        span (list): A list where the second element is the text of the span.
+        prepend (bool): If True, prepend a newline to the text.
+        append (bool): If True, append a newline to the text.
+    Returns:
+        None: The function modifies the span in place.
+    """
+    if prepend:
+        span[1] = "\n" + span[1]
+    if append:
+        span[1] = span[1] + "\n"
+    return span
+def _format_line(
+    line: List[List[Union[List[int], str]]],
+    layout_min: int,
+    layout_max: int,
+    is_reference: bool = False,
+) -> None:
+    """
+    Format a line of text spans based on layout constraints.
+    Args:
+        line (list): A list of spans, where each span is a list containing a bounding box and text.
+        layout_min (int): The minimum x-coordinate of the layout bounding box.
+        layout_max (int): The maximum x-coordinate of the layout bounding box.
+        is_reference (bool): A flag indicating whether the line is a reference line, which affects formatting rules.
+    Returns:
+        None: The function modifies the line in place.
+    """
+    first_span = line[0]
+    end_span = line[-1]
+    if not is_reference:
+        if first_span[0][0] - layout_min > 10:
+            first_span = _adjust_span_text(first_span, prepend=True)
+        if layout_max - end_span[0][2] > 10:
+            end_span = _adjust_span_text(end_span, append=True)
+    else:
+        if first_span[0][0] - layout_min < 5:
+            first_span = _adjust_span_text(first_span, prepend=True)
+        if layout_max - end_span[0][2] > 20:
+            end_span = _adjust_span_text(end_span, append=True)
+    line[0] = first_span
+    line[-1] = end_span
+    return line
+def split_boxes_if_x_contained(boxes, offset=1e-5):
+    """
+    Check if there is any complete containment in the x-direction
+    between the bounding boxes and split the containing box accordingly.
+    Args:
+        boxes (list of lists): Each element is a list containing an ndarray of length 4, a description, and a label.
+        offset (float): A small offset value to ensure that the split boxes are not too close to the original boxes.
+    Returns:
+        A new list of boxes, including split boxes, with the same `rec_text` and `label` attributes.
+    """
+    def is_x_contained(box_a, box_b):
+        """Check if box_a completely contains box_b in the x-direction."""
+        return box_a[0][0] <= box_b[0][0] and box_a[0][2] >= box_b[0][2]
+    new_boxes = []
+    for i in range(len(boxes)):
+        box_a = boxes[i]
+        is_split = False
+        for j in range(len(boxes)):
+            if i == j:
+                continue
+            box_b = boxes[j]
+            if is_x_contained(box_a, box_b):
+                is_split = True
+                # Split box_a based on the x-coordinates of box_b
+                if box_a[0][0] < box_b[0][0]:
+                    w = box_b[0][0] - offset - box_a[0][0]
+                    if w > 1:
+                        new_boxes.append(
+                            [
+                                np.array(
+                                    [
+                                        box_a[0][0],
+                                        box_a[0][1],
+                                        box_b[0][0] - offset,
+                                        box_a[0][3],
+                                    ]
+                                ),
+                                box_a[1],
+                                box_a[2],
+                            ]
+                        )
+                if box_a[0][2] > box_b[0][2]:
+                    w = box_a[0][2] - box_b[0][2] + offset
+                    if w > 1:
+                        box_a = [
+                            np.array(
+                                [
+                                    box_b[0][2] + offset,
+                                    box_a[0][1],
+                                    box_a[0][2],
+                                    box_a[0][3],
+                                ]
+                            ),
+                            box_a[1],
+                            box_a[2],
+                        ]
+            if j == len(boxes) - 1 and is_split:
+                new_boxes.append(box_a)
+        if not is_split:
+            new_boxes.append(box_a)
+    return new_boxes
+def _sort_line_by_x_projection(
+    input_img: np.ndarray,
+    general_ocr_pipeline: Any,
+    line: List[List[Union[List[int], str]]],
+) -> None:
+    """
+    Sort a line of text spans based on their vertical position within the layout bounding box.
+    Args:
+        input_img (ndarray): The input image used for OCR.
+        general_ocr_pipeline (Any): The general OCR pipeline used for text recognition.
+        line (list): A list of spans, where each span is a list containing a bounding box and text.
+    Returns:
+        list: The sorted line of text spans.
+    """
+    splited_boxes = split_boxes_if_x_contained(line)
+    splited_lines = []
+    if len(line) != len(splited_boxes):
+        splited_boxes.sort(key=lambda span: span[0][0])
+        text_rec_model = general_ocr_pipeline.text_rec_model
+        for span in splited_boxes:
+            if span[2] == "text":
+                crop_img = input_img[
+                    int(span[0][1]) : int(span[0][3]),
+                    int(span[0][0]) : int(span[0][2]),
+                ]
+                span[1] = next(text_rec_model([crop_img]))["rec_text"]
+            splited_lines.append(span)
+    else:
+        splited_lines = line
+    return splited_lines
+def _sort_ocr_res_by_y_projection(
+    input_img: np.ndarray,
+    general_ocr_pipeline: Any,
+    label: Any,
+    block_bbox: Tuple[int, int, int, int],
+    ocr_res: Dict[str, List[Any]],
+    line_height_iou_threshold: float = 0.7,
+) -> Dict[str, List[Any]]:
+    """
+    Sorts OCR results based on their spatial arrangement, grouping them into lines and blocks.
+    Args:
+        input_img (ndarray): The input image used for OCR.
+        general_ocr_pipeline (Any): The general OCR pipeline used for text recognition.
+        label (Any): The label associated with the OCR results. It's not used in the function but might be
+                     relevant for other parts of the calling context.
+        block_bbox (Tuple[int, int, int, int]): A tuple representing the layout bounding box, defined as
+                                                 (left, top, right, bottom).
+        ocr_res (Dict[str, List[Any]]): A dictionary containing OCR results with the following keys:
+            - "boxes": A list of bounding boxes, each defined as [left, top, right, bottom].
+            - "rec_texts": A corresponding list of recognized text strings for each box.
+        line_height_iou_threshold (float): The threshold for determining whether two boxes belong to
+                                           the same line based on their vertical overlap. Defaults to 0.7.
+    Returns:
+        Dict[str, List[Any]]: A dictionary with the same structure as `ocr_res`, but with boxes and texts sorted
+                              and grouped into lines and blocks.
+    """
+    assert (
+        ocr_res["boxes"] and ocr_res["rec_texts"]
+    ), "OCR results must contain 'boxes' and 'rec_texts'"
+    boxes = ocr_res["boxes"]
+    rec_texts = ocr_res["rec_texts"]
+    rec_labels = ocr_res["rec_labels"]
+    x_min, _, x_max, _ = block_bbox
+    inline_x_min = min([box[0] for box in boxes])
+    inline_x_max = max([box[2] for box in boxes])
+    spans = list(zip(boxes, rec_texts, rec_labels))
+    spans.sort(key=lambda span: span[0][1])
+    spans = [list(span) for span in spans]
+    lines = []
+    current_line = [spans[0]]
+    current_y0, current_y1 = spans[0][0][1], spans[0][0][3]
+    for span in spans[1:]:
+        y0, y1 = span[0][1], span[0][3]
+        if _whether_y_overlap_exceeds_threshold(
+            (0, current_y0, 0, current_y1),
+            (0, y0, 0, y1),
+            line_height_iou_threshold,
+        ):
+            current_line.append(span)
+            current_y0 = min(current_y0, y0)
+            current_y1 = max(current_y1, y1)
+        else:
+            lines.append(current_line)
+            current_line = [span]
+            current_y0, current_y1 = y0, y1
+    if current_line:
+        lines.append(current_line)
+    new_lines = []
+    for line in lines:
+        line.sort(key=lambda span: span[0][0])
+        ocr_labels = [span[2] for span in line]
+        if "formula" in ocr_labels:
+            line = _sort_line_by_x_projection(input_img, general_ocr_pipeline, line)
+        if label == "reference":
+            line = _format_line(line, inline_x_min, inline_x_max, is_reference=True)
+        elif label != "content":
+            line = _format_line(line, x_min, x_max)
+        new_lines.append(line)
+    ocr_res["boxes"] = [span[0] for line in new_lines for span in line]
+    if label == "content":
+        ocr_res["rec_texts"] = [
+            "".join(f"{span[1]} " for span in line).rstrip() for line in new_lines
+        ]
+    else:
+        ocr_res["rec_texts"] = [span[1] + " " for line in new_lines for span in line]
+    return ocr_res, len(new_lines)
+def _process_text(input_text: str) -> str:
+    """
+    Process the input text to handle spaces.
+    The function removes multiple consecutive spaces between Chinese characters and ensures that
+    only a single space is retained between Chinese and non-Chinese characters.
+    Args:
+        input_text (str): The text to be processed.
+    Returns:
+        str: The processed text with properly formatted spaces.
+    """
+    def handle_spaces_(text: str) -> str:
+        """
+        Handle spaces in the text by removing multiple consecutive spaces and inserting a single space
+        between Chinese and non-Chinese characters.
+        Args:
+            text (str): The text to handle spaces for.
+        Returns:
+            str: The text with properly formatted spaces.
+        """
+        spaces = re.finditer(r"\s+", text)
+        processed_text = list(text)
+        for space in reversed(list(spaces)):
+            start, end = space.span()
+            prev_char = processed_text[start - 1] if start > 0 else ""
+            next_char = processed_text[end] if end < len(processed_text) else ""
+            is_prev_chinese = (
+                re.match(r"[\u4e00-\u9fff]", prev_char) if prev_char else False
+            )
+            is_next_chinese = (
+                re.match(r"[\u4e00-\u9fff]", next_char) if next_char else False
+            )
+            if is_prev_chinese and is_next_chinese:
+                processed_text[start:end] = []
+            else:
+                processed_text[start:end] = [" "]
+        return "".join(processed_text)
+    text_without_spaces = handle_spaces_(input_text)
+    final_text = re.sub(r"\s+", " ", text_without_spaces).strip()
+    return final_text
+def get_single_block_parsing_res(
+    general_ocr_pipeline: Any,
+    overall_ocr_res: OCRResult,
+    layout_det_res: DetResult,
+    table_res_list: list,
+    seal_res_list: list,
+) -> OCRResult:
+    """
+    Extract structured information from OCR and layout detection results.
+    Args:
+        overall_ocr_res (OCRResult): An object containing the overall OCR results, including detected text boxes and recognized text. The structure is expected to have:
+            - "input_img": The image on which OCR was performed.
+            - "dt_boxes": A list of detected text box coordinates.
+            - "rec_texts": A list of recognized text corresponding to the detected boxes.
+        layout_det_res (DetResult): An object containing the layout detection results, including detected layout boxes and their labels. The structure is expected to have:
+            - "boxes": A list of dictionaries with keys "coordinate" for box coordinates and "block_label" for the type of content.
+        table_res_list (list): A list of table detection results, where each item is a dictionary containing:
+            - "block_bbox": The bounding box of the table layout.
+            - "pred_html": The predicted HTML representation of the table.
+        seal_res_list (List): A list of seal detection results. The details of each item depend on the specific application context.
+    Returns:
+        list: A list of structured boxes where each item is a dictionary containing:
+            - "block_label": The label of the content (e.g., 'table', 'chart', 'image').
+            - The label as a key with either table HTML or image data and text.
+            - "block_bbox": The coordinates of the layout box.
+    """
+    single_block_layout_parsing_res = []
+    input_img = overall_ocr_res["doc_preprocessor_res"]["output_img"]
+    seal_index = 0
+    with_doc_title = False
+    max_block_area = 0.0
+    paragraph_title_indexs = []
+    layout_det_res_list, _ = _remove_overlap_blocks(
+        deepcopy(layout_det_res["boxes"]),
+        threshold=0.5,
+        smaller=True,
+    )
+    for box_idx, box_info in enumerate(layout_det_res_list):
+        block_bbox = box_info["coordinate"]
+        label = box_info["label"]
+        rec_res = {"boxes": [], "rec_texts": [], "rec_labels": [], "flag": False}
+        seg_start_coordinate = float("inf")
+        seg_end_coordinate = float("-inf")
+        num_of_lines = 1
+        if label == "doc_title":
+            with_doc_title = True
+        elif label == "paragraph_title":
+            paragraph_title_indexs.append(box_idx)
+        block_area = (block_bbox[2] - block_bbox[0]) * (block_bbox[3] - block_bbox[1])
+        max_block_area = max(max_block_area, block_area)
+        if label == "table":
+            for table_res in table_res_list:
+                if len(table_res["cell_box_list"]) == 0:
+                    continue
+                if (
+                    _calculate_overlap_area_div_minbox_area_ratio(
+                        block_bbox, table_res["cell_box_list"][0]
+                    )
+                    > 0.5
+                ):
+                    single_block_layout_parsing_res.append(
+                        {
+                            "block_label": label,
+                            "block_content": table_res["pred_html"],
+                            "block_bbox": block_bbox,
+                        },
+                    )
+                    break
+        elif label == "seal":
+            if len(seal_res_list) > 0:
+                single_block_layout_parsing_res.append(
+                    {
+                        "block_label": label,
+                        "block_content": _process_text(
+                            ", ".join(seal_res_list[seal_index]["rec_texts"])
+                        ),
+                        "block_bbox": block_bbox,
+                    },
+                )
+                seal_index += 1
+        else:
+            overall_text_boxes = overall_ocr_res["rec_boxes"]
+            for box_no in range(len(overall_text_boxes)):
+                if (
+                    _calculate_overlap_area_div_minbox_area_ratio(
+                        block_bbox, overall_text_boxes[box_no]
+                    )
+                    > 0.5
+                ):
+                    rec_res["boxes"].append(overall_text_boxes[box_no])
+                    rec_res["rec_texts"].append(
+                        overall_ocr_res["rec_texts"][box_no],
+                    )
+                    rec_res["rec_labels"].append(
+                        overall_ocr_res["rec_labels"][box_no],
+                    )
+                    rec_res["flag"] = True
+            if rec_res["flag"]:
+                rec_res, num_of_lines = _sort_ocr_res_by_y_projection(
+                    input_img, general_ocr_pipeline, label, block_bbox, rec_res, 0.7
+                )
+                seg_start_coordinate = rec_res["boxes"][0][0]
+                seg_end_coordinate = rec_res["boxes"][-1][2]
+                if label == "formula":
+                    rec_res["rec_texts"] = [
+                        rec_res_text.replace("$", "")
+                        for rec_res_text in rec_res["rec_texts"]
+                    ]
+            if label in ["chart", "image"]:
+                x_min, y_min, x_max, y_max = list(map(int, block_bbox))
+                img_path = f"imgs/img_in_table_box_{x_min}_{y_min}_{x_max}_{y_max}.jpg"
+                img = Image.fromarray(input_img[y_min:y_max, x_min:x_max, ::-1])
+                single_block_layout_parsing_res.append(
+                    {
+                        "block_label": label,
+                        "block_content": _process_text("".join(rec_res["rec_texts"])),
+                        "block_image": {img_path: img},
+                        "block_bbox": block_bbox,
+                    },
+                )
+            else:
+                if label in ["doc_title"]:
+                    content = " ".join(rec_res["rec_texts"])
+                elif label in ["content"]:
+                    content = "\n".join(rec_res["rec_texts"])
+                else:
+                    content = "".join(rec_res["rec_texts"])
+                    if label != "reference":
+                        content = _process_text(content)
+                single_block_layout_parsing_res.append(
+                    {
+                        "block_label": label,
+                        "block_content": content,
+                        "block_bbox": block_bbox,
+                        "seg_start_coordinate": seg_start_coordinate,
+                        "seg_end_coordinate": seg_end_coordinate,
+                        "num_of_lines": num_of_lines,
+                        "block_area": block_area,
+                    },
+                )
+    if (
+        not with_doc_title
+        and len(paragraph_title_indexs) == 1
+        and single_block_layout_parsing_res[paragraph_title_indexs[0]].get(
+            "block_area", 0
+        )
+        > max_block_area * 0.3
+    ):
+        single_block_layout_parsing_res[paragraph_title_indexs[0]][
+            "block_label"
+        ] = "doc_title"
+    if len(layout_det_res_list) == 0:
+        for ocr_rec_box, ocr_rec_text in zip(
+            overall_ocr_res["rec_boxes"], overall_ocr_res["rec_texts"]
+        ):
+            single_block_layout_parsing_res.append(
+                {
+                    "block_label": "text",
+                    "block_content": ocr_rec_text,
+                    "block_bbox": ocr_rec_box,
+                    "seg_start_coordinate": ocr_rec_box[0],
+                    "seg_end_coordinate": ocr_rec_box[2],
+                },
+            )
+    single_block_layout_parsing_res = get_layout_ordering(
+        single_block_layout_parsing_res,
+        no_mask_labels=[
+            "text",
+            "formula",
+            "algorithm",
+            "reference",
+            "content",
+            "abstract",
+        ],
+    )
+    return single_block_layout_parsing_res
+def _projection_by_bboxes(boxes: np.ndarray, axis: int) -> np.ndarray:
+    """
+    Build a coverage histogram of bounding boxes along one axis.
+    Args:
+        boxes: A (N, 4) array of boxes given as [x_min, y_min, x_max, y_max]. The
+            coordinates are used as slice bounds, so they must be integers.
+        axis: 0 to project onto the x-axis, 1 to project onto the y-axis.
+    Returns:
+        A 1D integer array whose entry at position p counts the boxes whose
+        half-open interval [min, max) along the chosen axis contains p. Its
+        length equals the largest coordinate found along that axis.
+    """
+    assert axis in [0, 1]
+    # Columns `axis` and `axis + 2` hold the (min, max) pair of the chosen axis
+    spans = boxes[:, axis::2]
+    histogram = np.zeros(np.max(spans), dtype=int)
+    for lower, upper in spans:
+        histogram[lower:upper] += 1
+    return histogram
+def _split_projection_profile(arr_values: np.ndarray, min_value: float, min_gap: float):
+    """
+    Split the projection profile into segments based on specified thresholds.
+    Args:
+        arr_values: 1D array representing the projection profile.
+        min_value: Positions whose value is strictly greater than this are significant.
+        min_gap: Two consecutive significant positions belong to different segments
+            when their index difference is strictly greater than this.
+    Returns:
+        None when no position is significant; otherwise a tuple
+        (segment_starts, segment_ends) of equally long index arrays describing the
+        half-open ranges [start, end) of each segment.
+    """
+    # Identify indices where the projection exceeds the minimum value
+    significant_indices = np.where(arr_values > min_value)[0]
+    if not len(significant_indices):
+        return
+    # Calculate gaps between significant indices
+    index_diffs = significant_indices[1:] - significant_indices[:-1]
+    gap_indices = np.where(index_diffs > min_gap)[0]
+    # A segment starts at the first significant index and right after every gap
+    segment_starts = np.insert(
+        significant_indices[gap_indices + 1],
+        0,
+        significant_indices[0],
+    )
+    # A segment ends one past its last significant index. The +1 is applied to
+    # every segment, not only the last one: callers select boxes with
+    # `start <= coordinate < end`, so an inclusive end would drop a box that
+    # begins on the last covered position of a non-final segment.
+    segment_ends = (
+        np.append(
+            significant_indices[gap_indices],
+            significant_indices[-1],
+        )
+        + 1
+    )
+    return segment_starts, segment_ends
+def _recursive_yx_cut(
+    boxes: np.ndarray, indices: List[int], res: List[int], min_gap: int = 1
+):
+    """
+    Recursively project and segment bounding boxes, starting with Y-axis and followed by X-axis.
+    Args:
+        boxes: A (N, 4) integer array of bounding boxes [x_min, y_min, x_max, y_max].
+        indices: Original position of each row of `boxes`; must have the same length.
+        res: Output list; the original indices are appended to it in reading order.
+        min_gap (int): Minimum gap width to consider a separation between segments on the
+            X-axis. The Y-axis split always uses a gap of 1. The value is forwarded to
+            every recursion level. Defaults to 1.
+    Returns:
+        None: This function modifies the `res` list in place.
+    """
+    assert len(boxes) == len(
+        indices
+    ), "The length of boxes and indices must be the same."
+    # Sort by y_min for Y-axis projection
+    y_sorted_indices = boxes[:, 1].argsort()
+    y_sorted_boxes = boxes[y_sorted_indices]
+    y_sorted_indices = np.array(indices)[y_sorted_indices]
+    # Perform Y-axis projection
+    y_projection = _projection_by_bboxes(boxes=y_sorted_boxes, axis=1)
+    y_intervals = _split_projection_profile(y_projection, 0, 1)
+    if not y_intervals:
+        return
+    # Process each segment defined by Y-axis projection
+    for y_start, y_end in zip(*y_intervals):
+        # A box belongs to the interval that contains its y_min
+        y_interval_indices = (y_start <= y_sorted_boxes[:, 1]) & (
+            y_sorted_boxes[:, 1] < y_end
+        )
+        y_boxes_chunk = y_sorted_boxes[y_interval_indices]
+        y_indices_chunk = y_sorted_indices[y_interval_indices]
+        # Sort by x_min for X-axis projection
+        x_sorted_indices = y_boxes_chunk[:, 0].argsort()
+        x_sorted_boxes_chunk = y_boxes_chunk[x_sorted_indices]
+        x_sorted_indices_chunk = y_indices_chunk[x_sorted_indices]
+        # Perform X-axis projection
+        x_projection = _projection_by_bboxes(boxes=x_sorted_boxes_chunk, axis=0)
+        x_intervals = _split_projection_profile(x_projection, 0, min_gap)
+        if not x_intervals:
+            continue
+        # If X-axis cannot be further segmented, add current indices to results
+        if len(x_intervals[0]) == 1:
+            res.extend(x_sorted_indices_chunk)
+            continue
+        # Recursively process each segment defined by X-axis projection
+        for x_start, x_end in zip(*x_intervals):
+            x_interval_indices = (x_start <= x_sorted_boxes_chunk[:, 0]) & (
+                x_sorted_boxes_chunk[:, 0] < x_end
+            )
+            # Forward min_gap so nested levels use the caller's threshold
+            # instead of silently falling back to the default of 1
+            _recursive_yx_cut(
+                x_sorted_boxes_chunk[x_interval_indices],
+                x_sorted_indices_chunk[x_interval_indices],
+                res,
+                min_gap,
+            )
+def _recursive_xy_cut(
+    boxes: np.ndarray, indices: List[int], res: List[int], min_gap: int = 1
+):
+    """
+    Recursively performs X-axis projection followed by Y-axis projection to segment bounding boxes.
+    Args:
+        boxes: A (N, 4) integer array of bounding boxes [x_min, y_min, x_max, y_max].
+        indices: Original position of each row of `boxes`; must have the same length.
+        res: Output list; the original indices are appended to it in reading order.
+        min_gap (int): Minimum gap width to consider a separation between segments on the
+            Y-axis. The X-axis split always uses a gap of 1. The value is forwarded to
+            every recursion level. Defaults to 1.
+    Returns:
+        None: This function modifies the `res` list in place.
+    """
+    # Ensure boxes and indices have the same length
+    assert len(boxes) == len(
+        indices
+    ), "The length of boxes and indices must be the same."
+    # Sort by x_min to prepare for X-axis projection
+    x_sorted_indices = boxes[:, 0].argsort()
+    x_sorted_boxes = boxes[x_sorted_indices]
+    x_sorted_indices = np.array(indices)[x_sorted_indices]
+    # Perform X-axis projection
+    x_projection = _projection_by_bboxes(boxes=x_sorted_boxes, axis=0)
+    x_intervals = _split_projection_profile(x_projection, 0, 1)
+    if not x_intervals:
+        return
+    # Process each segment defined by X-axis projection
+    for x_start, x_end in zip(*x_intervals):
+        # A box belongs to the interval that contains its x_min
+        x_interval_indices = (x_start <= x_sorted_boxes[:, 0]) & (
+            x_sorted_boxes[:, 0] < x_end
+        )
+        x_boxes_chunk = x_sorted_boxes[x_interval_indices]
+        x_indices_chunk = x_sorted_indices[x_interval_indices]
+        # Sort selected boxes by y_min to prepare for Y-axis projection
+        y_sorted_indices = x_boxes_chunk[:, 1].argsort()
+        y_sorted_boxes_chunk = x_boxes_chunk[y_sorted_indices]
+        y_sorted_indices_chunk = x_indices_chunk[y_sorted_indices]
+        # Perform Y-axis projection
+        y_projection = _projection_by_bboxes(boxes=y_sorted_boxes_chunk, axis=1)
+        y_intervals = _split_projection_profile(y_projection, 0, min_gap)
+        if not y_intervals:
+            continue
+        # If Y-axis cannot be further segmented, add current indices to results
+        if len(y_intervals[0]) == 1:
+            res.extend(y_sorted_indices_chunk)
+            continue
+        # Recursively process each segment defined by Y-axis projection
+        for y_start, y_end in zip(*y_intervals):
+            y_interval_indices = (y_start <= y_sorted_boxes_chunk[:, 1]) & (
+                y_sorted_boxes_chunk[:, 1] < y_end
+            )
+            # Forward min_gap so nested levels use the caller's threshold
+            # instead of silently falling back to the default of 1
+            _recursive_xy_cut(
+                y_sorted_boxes_chunk[y_interval_indices],
+                y_sorted_indices_chunk[y_interval_indices],
+                res,
+                min_gap,
+            )
+def sort_by_xycut(
+    block_bboxes: Union[np.ndarray, List[List[int]]],
+    direction: int = 0,
+    min_gap: int = 1,
+) -> List[int]:
+    """
+    Sort bounding boxes using recursive XY cut method based on the specified direction.
+    Args:
+        block_bboxes (Union[np.ndarray, List[List[int]]]): An array or list of bounding boxes,
+                                                           where each box is represented as
+                                                           [x_min, y_min, x_max, y_max].
+                                                           Coordinates are truncated to int.
+        direction (int): Direction for the initial cut. Use 1 for Y-axis first and 0 for X-axis first.
+                         Any value other than 1 selects X-axis first. Defaults to 0.
+        min_gap (int): Minimum gap width to consider a separation between segments. Defaults to 1.
+    Returns:
+        List[int]: A list of indices (plain Python ints) representing the order of sorted
+                   bounding boxes. Empty input yields an empty list.
+    """
+    block_bboxes = np.asarray(block_bboxes).astype(int)
+    res = []
+    # An empty input is a 1-D array of shape (0,); the column indexing done by
+    # the recursive helpers would raise IndexError on it, so stop here.
+    if block_bboxes.size == 0:
+        return res
+    recursive_cut = _recursive_yx_cut if direction == 1 else _recursive_xy_cut
+    recursive_cut(
+        block_bboxes,
+        np.arange(len(block_bboxes)).tolist(),
+        res,
+        min_gap,
+    )
+    # The helpers append numpy integers; hand back builtin ints as annotated
+    return [int(index) for index in res]
+def gather_imgs(original_img, layout_det_objs):
+    """
+    Crop every detected "image" or "chart" region out of the page image.
+    Args:
+        original_img: Page image indexed as [row, column, channel]; the channel axis is
+            reversed before the crop is handed to `Image.fromarray`.
+        layout_det_objs: Iterable of detection dicts with "label", "coordinate"
+            ([x_min, y_min, x_max, y_max]) and "score" entries.
+    Returns:
+        A list with one dict per image/chart detection holding the keys "path",
+        "img", "coordinate" (integer tuple) and "score".
+    """
+    collected = []
+    for obj in layout_det_objs:
+        if obj["label"] not in ("image", "chart"):
+            continue
+        x_min, y_min, x_max, y_max = (int(value) for value in obj["coordinate"])
+        crop_path = f"imgs/img_in_table_box_{x_min}_{y_min}_{x_max}_{y_max}.jpg"
+        crop = Image.fromarray(original_img[y_min:y_max, x_min:x_max, ::-1])
+        entry = {
+            "path": crop_path,
+            "img": crop,
+            "coordinate": (x_min, y_min, x_max, y_max),
+            "score": obj["score"],
+        }
+        collected.append(entry)
+    return collected
+def _get_minbox_if_overlap_by_ratio(
+    bbox1: Union[List[int], Tuple[int, int, int, int]],
+    bbox2: Union[List[int], Tuple[int, int, int, int]],
+    ratio: float,
+    smaller: bool = True,
+) -> Optional[int]:
+    """
+    Determine if the overlap between two bounding boxes exceeds a given ratio and
+    report WHICH box (not the box itself) is the smaller (or larger) one.
+    Args:
+        bbox1 (Union[List[int], Tuple[int, int, int, int]]): Coordinates of the first bounding box [x_min, y_min, x_max, y_max].
+        bbox2 (Union[List[int], Tuple[int, int, int, int]]): Coordinates of the second bounding box [x_min, y_min, x_max, y_max].
+        ratio (float): The overlap ratio threshold; the overlap must be strictly greater.
+        smaller (bool): If True, select the smaller bounding box; otherwise, select the larger one.
+    Returns:
+        Optional[int]: 1 if `bbox1` is selected, 2 if `bbox2` is selected, or None if the
+            overlap ratio is not exceeded. When both areas are equal, 1 is returned
+            regardless of `smaller`.
+    """
+    # Calculate the areas of both bounding boxes
+    area1 = (bbox1[2] - bbox1[0]) * (bbox1[3] - bbox1[1])
+    area2 = (bbox2[2] - bbox2[0]) * (bbox2[3] - bbox2[1])
+    # Calculate the overlap ratio using a helper function
+    overlap_ratio = _calculate_overlap_area_div_minbox_area_ratio(bbox1, bbox2)
+    # Check if the overlap ratio exceeds the threshold
+    if overlap_ratio > ratio:
+        if (area1 <= area2 and smaller) or (area1 >= area2 and not smaller):
+            return 1
+        return 2
+    return None
+def _remove_overlap_blocks(
+    blocks: List[Dict[str, List[int]]], threshold: float = 0.65, smaller: bool = True
+) -> Tuple[List[Dict[str, List[int]]], List[Dict[str, List[int]]]]:
+    """
+    Drop one block out of every pair whose overlap ratio exceeds a threshold.
+    Args:
+        blocks (List[Dict[str, List[int]]]): Block dictionaries; the box of each block is
+            read from its 'coordinate' key. The list is modified in place.
+        threshold (float): Overlap ratio above which a pair counts as overlapping.
+        smaller (bool): If True, the smaller block of an overlapping pair is removed;
+            otherwise the larger one.
+    Returns:
+        Tuple[List[Dict[str, List[int]]], List[Dict[str, List[int]]]]:
+            The same `blocks` list with the dropped entries removed, and the list of
+            dropped blocks ordered from the highest original index to the lowest.
+    """
+    to_drop = set()
+    total = len(blocks)
+    for first in range(total):
+        # A block that has already lost a comparison takes part in no further pair
+        if first in to_drop:
+            continue
+        for second in range(first + 1, total):
+            if second in to_drop:
+                continue
+            which = _get_minbox_if_overlap_by_ratio(
+                blocks[first]["coordinate"],
+                blocks[second]["coordinate"],
+                threshold,
+                smaller=smaller,
+            )
+            if which is None:
+                continue
+            if which == 1:
+                # The outer block is dropped, so its remaining pairs are skipped
+                to_drop.add(first)
+                break
+            to_drop.add(second)
+    # Pop from the back so that earlier positions stay valid while removing
+    removed = [blocks.pop(position) for position in sorted(to_drop, reverse=True)]
+    return blocks, removed
+def _get_text_median_width(blocks: List[Dict[str, Any]]) -> float:
+    """
+    Calculate the median width of blocks labeled as "text".
+    Args:
+        blocks (List[Dict[str, Any]]): List of block dictionaries. Blocks whose
+            'block_label' equals "text" must provide a 'block_bbox'
+            ([x_min, y_min, x_max, y_max]); blocks without a 'block_label' are ignored.
+    Returns:
+        float: The median width of text blocks, or infinity if no text blocks are found.
+    """
+    widths = [
+        block["block_bbox"][2] - block["block_bbox"][0]
+        for block in blocks
+        if block.get("block_label") == "text"
+    ]
+    return np.median(widths) if widths else float("inf")
+def _get_layout_property(
+    blocks: List[Dict[str, Any]],
+    median_width: float,
+    no_mask_labels: List[str],
+    threshold: float = 0.8,
+) -> Tuple[List[Dict[str, Any]], bool]:
+    """
+    Determine the layout (single or double column) of text blocks.
+    Args:
+        blocks (List[Dict[str, Any]]): List of block dictionaries containing 'block_label'
+            and 'block_bbox'. The list is sorted in place by (x_min, width), and every
+            block whose label is in `no_mask_labels` receives a 'layout' key.
+        median_width (float): Median width of text blocks.
+        no_mask_labels (List[str]): Labels of blocks to be considered for layout analysis.
+        threshold (float): Horizontal coverage ratio above which another block counts
+            as strongly covered by the current one.
+    Returns:
+        Tuple[List[Dict[str, Any]], bool]: Updated list of blocks with layout information and a boolean
+        indicating if the double layout area is greater than the single layout area.
+    """
+    blocks.sort(
+        key=lambda x: (
+            x["block_bbox"][0],
+            (x["block_bbox"][2] - x["block_bbox"][0]),
+        ),
+    )
+    check_single_layout = {}
+    page_min_x, page_max_x = float("inf"), 0
+    double_label_area = 0
+    single_label_area = 0
+    # Horizontal extent of the page as spanned by all blocks
+    for block in blocks:
+        page_min_x = min(page_min_x, block["block_bbox"][0])
+        page_max_x = max(page_max_x, block["block_bbox"][2])
+    page_width = page_max_x - page_min_x
+    for i, block in enumerate(blocks):
+        if block["block_label"] not in no_mask_labels:
+            continue
+        x_min_i, _, x_max_i, _ = block["block_bbox"]
+        layout_length = x_max_i - x_min_i
+        cover_count, cover_with_threshold_count = 0, 0
+        match_block_with_threshold_indexes = []
+        for j, other_block in enumerate(blocks):
+            if i == j or other_block["block_label"] not in no_mask_labels:
+                continue
+            x_min_j, _, x_max_j, _ = other_block["block_bbox"]
+            other_width = x_max_j - x_min_j
+            # A zero-width block cannot be covered and would divide by zero
+            if other_width == 0:
+                continue
+            x_match_min, x_match_max = max(
+                x_min_i,
+                x_min_j,
+            ), min(x_max_i, x_max_j)
+            # Fraction of the other block's width covered by the current block
+            match_block_iou = (x_match_max - x_match_min) / other_width
+            if match_block_iou > 0:
+                cover_count += 1
+                if match_block_iou > threshold:
+                    cover_with_threshold_count += 1
+                    match_block_with_threshold_indexes.append(
+                        (j, match_block_iou),
+                    )
+                # Only the part of the current block to the right of this match
+                # is compared with the remaining blocks
+                x_min_i = x_match_max
+                if x_min_i >= x_max_i:
+                    break
+        if (
+            layout_length > median_width * 1.3
+            and (cover_with_threshold_count >= 2 or cover_count >= 2)
+        ) or layout_length > 0.6 * page_width:
+            block["layout"] = "double"
+            double_label_area += (block["block_bbox"][2] - block["block_bbox"][0]) * (
+                block["block_bbox"][3] - block["block_bbox"][1]
+            )
+        else:
+            block["layout"] = "single"
+            check_single_layout[i] = match_block_with_threshold_indexes
+    # Check single-layout block: promote it when its last strong match is a
+    # double-layout block covered by more than 90%
+    for i, single_layout in check_single_layout.items():
+        if single_layout:
+            index, match_iou = single_layout[-1]
+            block_area = (blocks[i]["block_bbox"][2] - blocks[i]["block_bbox"][0]) * (
+                blocks[i]["block_bbox"][3] - blocks[i]["block_bbox"][1]
+            )
+            if match_iou > 0.9 and blocks[index]["layout"] == "double":
+                blocks[i]["layout"] = "double"
+                double_label_area += block_area
+            else:
+                single_label_area += block_area
+    return blocks, (double_label_area > single_label_area)
+def _get_bbox_direction(input_bbox: List[float], ratio: float = 1.0) -> bool:
+    """
+    Classify a bounding box as horizontal or vertical.
+    Args:
+        input_bbox (List[float]): Bounding box [x_min, y_min, x_max, y_max].
+        ratio (float): Factor applied to the width before it is compared with the
+            height. Default is 1.0.
+    Returns:
+        bool: True when width * ratio is at least the height (horizontal), False otherwise.
+    """
+    left, top, right, bottom = (
+        input_bbox[0],
+        input_bbox[1],
+        input_bbox[2],
+        input_bbox[3],
+    )
+    scaled_width = (right - left) * ratio
+    return scaled_width >= bottom - top
+def _get_projection_iou(
+    input_bbox: List[float], match_bbox: List[float], is_horizontal: bool = True
+) -> float:
+    """
+    Measure how much two boxes overlap once projected onto a single axis.
+    The overlap length is divided by the shorter of the two projected extents,
+    not by their union.
+    Args:
+        input_bbox (List[float]): First bounding box [x_min, y_min, x_max, y_max].
+        match_bbox (List[float]): Second bounding box [x_min, y_min, x_max, y_max].
+        is_horizontal (bool): If true, compare the x extents; otherwise the y extents.
+    Returns:
+        float: Overlap ratio. 0 when the projections do not overlap, and 0.0 when the
+            shorter extent is not positive.
+    """
+    # Positions of the (min, max) coordinates for the selected axis
+    low = 0 if is_horizontal else 1
+    high = low + 2
+    shared_start = max(input_bbox[low], match_bbox[low])
+    shared_end = min(input_bbox[high], match_bbox[high])
+    overlap = max(0, shared_end - shared_start)
+    shortest_extent = min(
+        input_bbox[high] - input_bbox[low],
+        match_bbox[high] - match_bbox[low],
+    )
+    if shortest_extent > 0:
+        return overlap / shortest_extent
+    return 0.0
+def _get_sub_category(
+    blocks: List[Dict[str, Any]], title_labels: List[str]
+) -> Tuple[List[Dict[str, Any]], List[float]]:
+    """
+    Determine the layout of title and text blocks and collect pre_cuts.
+    Args:
+        blocks (List[Dict[str, Any]]): List of block dictionaries.
+        title_labels (List[str]): List of labels considered as titles.
+    Returns:
+        List[Dict[str, Any]]: Updated list of blocks with title-text layout information.
+        Dict[float]: Dict of pre_cuts coordinates.
+    """
+    sub_title_labels = ["paragraph_title"]
+    vision_labels = ["image", "table", "chart", "figure"]
+    vision_title_labels = ["figure_title", "chart_title", "table_title"]
+    all_labels = title_labels + sub_title_labels + vision_labels + vision_title_labels
+    special_pre_cut_labels = sub_title_labels
+    # single doc title is irregular,pre cut not applicable
+    num_doc_title = 0
+    for block in blocks:
+        if block["block_label"] == "doc_title":
+            num_doc_title += 1
+            if num_doc_title == 2:
+                special_pre_cut_labels = title_labels + sub_title_labels
+                break
+    if len(blocks) == 0:
+        return blocks, {}
+    min_x = min(block["block_bbox"][0] for block in blocks)
+    min_y = min(block["block_bbox"][1] for block in blocks)
+    max_x = max(block["block_bbox"][2] for block in blocks)
+    max_y = max(block["block_bbox"][3] for block in blocks)
+    region_bbox = (min_x, min_y, max_x, max_y)
+    region_x_center = (region_bbox[0] + region_bbox[2]) / 2
+    region_y_center = (region_bbox[1] + region_bbox[3]) / 2
+    region_width = region_bbox[2] - region_bbox[0]
+    region_height = region_bbox[3] - region_bbox[1]
+    pre_cuts = {}
+    for i, block1 in enumerate(blocks):
+        block1.setdefault("title_text", [])
+        block1.setdefault("sub_title", [])
+        block1.setdefault("vision_footnote", [])
+        block1.setdefault("sub_label", block1["block_label"])
+        if block1["block_label"] not in all_labels:
+            continue
+        bbox1 = block1["block_bbox"]
+        x1, y1, x2, y2 = bbox1
+        is_horizontal_1 = _get_bbox_direction(block1["block_bbox"])
+        left_up_title_text_distance = float("inf")
+        left_up_title_text_index = -1
+        left_up_title_text_direction = None
+        right_down_title_text_distance = float("inf")
+        right_down_title_text_index = -1
+        right_down_title_text_direction = None
+        # pre-cuts
+        # Condition 1: Length is greater than half of the layout region
+        if is_horizontal_1:
+            block_length = x2 - x1
+            required_length = region_width / 2
+        else:
+            block_length = y2 - y1
+            required_length = region_height / 2
+        if block1["block_label"] in special_pre_cut_labels:
+            length_condition = True
+        else:
+            length_condition = block_length > required_length
+        # Condition 2: Centered check (must be within ±20 in both horizontal and vertical directions)
+        block_x_center = (x1 + x2) / 2
+        block_y_center = (y1 + y2) / 2
+        tolerance_len = block_length // 5
+        if block1["block_label"] in special_pre_cut_labels:
+            tolerance_len = block_length // 10
+        if is_horizontal_1:
+            is_centered = abs(block_x_center - region_x_center) <= tolerance_len
+        else:
+            is_centered = abs(block_y_center - region_y_center) <= tolerance_len
+        # Condition 3: Check for surrounding text
+        has_left_text = False
+        has_right_text = False
+        has_above_text = False
+        has_below_text = False
+        for block2 in blocks:
+            if block2["block_label"] != "text":
+                continue
+            bbox2 = block2["block_bbox"]
+            x1_2, y1_2, x2_2, y2_2 = bbox2
+            if is_horizontal_1:
+                if x2_2 <= x1 and not (y2_2 <= y1 or y1_2 >= y2):
+                    has_left_text = True
+                if x1_2 >= x2 and not (y2_2 <= y1 or y1_2 >= y2):
+                    has_right_text = True
+            else:
+                if y2_2 <= y1 and not (x2_2 <= x1 or x1_2 >= x2):
+                    has_above_text = True
+                if y1_2 >= y2 and not (x2_2 <= x1 or x1_2 >= x2):
+                    has_below_text = True
+            if (is_horizontal_1 and has_left_text and has_right_text) or (
+                not is_horizontal_1 and has_above_text and has_below_text
+            ):
+                break
+        no_text_on_sides = (
+            not (has_left_text or has_right_text)
+            if is_horizontal_1
+            else not (has_above_text or has_below_text)
+        )
+        # Add coordinates if all conditions are met
+        if is_centered and length_condition and no_text_on_sides:
+            if is_horizontal_1:
+                pre_cuts.setdefault("y", []).append(y1)
+            else:
+                pre_cuts.setdefault("x", []).append(x1)
+        for j, block2 in enumerate(blocks):
+            if i == j:
+                continue
+            bbox2 = block2["block_bbox"]
+            x1_prime, y1_prime, x2_prime, y2_prime = bbox2
+            is_horizontal_2 = _get_bbox_direction(bbox2)
+            match_block_iou = _get_projection_iou(
+                bbox2,
+                bbox1,
+                is_horizontal_1,
+            )
+            def distance_(is_horizontal, is_left_up):
+                if is_horizontal:
+                    if is_left_up:
+                        return (y1 - y2_prime + 2) // 5 + x1_prime / 5000
+                    else:
+                        return (y1_prime - y2 + 2) // 5 + x1_prime / 5000
+                else:
+                    if is_left_up:
+                        return (x1 - x2_prime + 2) // 5 + y1_prime / 5000
+                    else:
+                        return (x1_prime - x2 + 2) // 5 + y1_prime / 5000
+            block_iou_threshold = 0.1
+            if block1["block_label"] in sub_title_labels:
+                block_iou_threshold = 0.5
+            if is_horizontal_1:
+                if match_block_iou >= block_iou_threshold:
+                    left_up_distance = distance_(True, True)
+                    right_down_distance = distance_(True, False)
+                    if (
+                        y2_prime <= y1
+                        and left_up_distance <= left_up_title_text_distance
+                    ):
+                        left_up_title_text_distance = left_up_distance
+                        left_up_title_text_index = j
+                        left_up_title_text_direction = is_horizontal_2
+                    elif (
+                        y1_prime > y2
+                        and right_down_distance < right_down_title_text_distance
+                    ):
+                        right_down_title_text_distance = right_down_distance
+                        right_down_title_text_index = j
+                        right_down_title_text_direction = is_horizontal_2
+            else:
+                if match_block_iou >= block_iou_threshold:
+                    left_up_distance = distance_(False, True)
+                    right_down_distance = distance_(False, False)
+                    if (
+                        x2_prime <= x1
+                        and left_up_distance <= left_up_title_text_distance
+                    ):
+                        left_up_title_text_distance = left_up_distance
+                        left_up_title_text_index = j
+                        left_up_title_text_direction = is_horizontal_2
+                    elif (
+                        x1_prime > x2
+                        and right_down_distance < right_down_title_text_distance
+                    ):
+                        right_down_title_text_distance = right_down_distance
+                        right_down_title_text_index = j
+                        right_down_title_text_direction = is_horizontal_2
+        height = bbox1[3] - bbox1[1]
+        width = bbox1[2] - bbox1[0]
+        title_text_weight = [0.8, 0.8]
+        title_text, sub_title, vision_footnote = [], [], []
+        def get_sub_category_(
+            title_text_direction,
+            title_text_index,
+            label,
+            is_left_up=True,
+        ):
+            direction_ = [1, 3] if is_left_up else [2, 4]
+            if (
+                title_text_direction == is_horizontal_1
+                and title_text_index != -1
+                and (label == "text" or label == "paragraph_title")
+            ):
+                bbox2 = blocks[title_text_index]["block_bbox"]
+                if is_horizontal_1:
+                    height1 = bbox2[3] - bbox2[1]
+                    width1 = bbox2[2] - bbox2[0]
+                    if label == "text":
+                        if (
+                            _nearest_edge_distance(bbox1, bbox2)[0] <= 15
+                            and block1["block_label"] in vision_labels
+                            and width1 < width
+                            and height1 < 0.5 * height
+                        ):
+                            blocks[title_text_index]["sub_label"] = "vision_footnote"
+                            vision_footnote.append(bbox2)
+                        elif (
+                            height1 < height * title_text_weight[0]
+                            and (width1 < width or width1 > 1.5 * width)
+                            and block1["block_label"] in title_labels
+                        ):
+                            blocks[title_text_index]["sub_label"] = "title_text"
+                            title_text.append((direction_[0], bbox2))
+                    elif (
+                        label == "paragraph_title"
+                        and block1["block_label"] in sub_title_labels
+                    ):
+                        sub_title.append(bbox2)
+                else:
+                    height1 = bbox2[3] - bbox2[1]
+                    width1 = bbox2[2] - bbox2[0]
+                    if label == "text":
+                        if (
+                            _nearest_edge_distance(bbox1, bbox2)[0] <= 15
+                            and block1["block_label"] in vision_labels
+                            and height1 < height
+                            and width1 < 0.5 * width
+                        ):
+                            blocks[title_text_index]["sub_label"] = "vision_footnote"
+                            vision_footnote.append(bbox2)
+                        elif (
+                            width1 < width * title_text_weight[1]
+                            and block1["block_label"] in title_labels
+                        ):
+                            blocks[title_text_index]["sub_label"] = "title_text"
+                            title_text.append((direction_[1], bbox2))
+                    elif (
+                        label == "paragraph_title"
+                        and block1["block_label"] in sub_title_labels
+                    ):
+                        sub_title.append(bbox2)
+        if (
+            is_horizontal_1
+            and abs(left_up_title_text_distance - right_down_title_text_distance) * 5
+            > height
+        ) or (
+            not is_horizontal_1
+            and abs(left_up_title_text_distance - right_down_title_text_distance) * 5
+            > width
+        ):
+            if left_up_title_text_distance < right_down_title_text_distance:
+                get_sub_category_(
+                    left_up_title_text_direction,
+                    left_up_title_text_index,
+                    blocks[left_up_title_text_index]["block_label"],
+                    True,
+                )
+            else:
+                get_sub_category_(
+                    right_down_title_text_direction,
+                    right_down_title_text_index,
+                    blocks[right_down_title_text_index]["block_label"],
+                    False,
+                )
+        else:
+            get_sub_category_(
+                left_up_title_text_direction,
+                left_up_title_text_index,
+                blocks[left_up_title_text_index]["block_label"],
+                True,
+            )
+            get_sub_category_(
+                right_down_title_text_direction,
+                right_down_title_text_index,
+                blocks[right_down_title_text_index]["block_label"],
+                False,
+            )
+        if block1["block_label"] in title_labels:
+            if blocks[i].get("title_text") == []:
+                blocks[i]["title_text"] = title_text
+        if block1["block_label"] in sub_title_labels:
+            if blocks[i].get("sub_title") == []:
+                blocks[i]["sub_title"] = sub_title
+        if block1["block_label"] in vision_labels:
+            if blocks[i].get("vision_footnote") == []:
+                blocks[i]["vision_footnote"] = vision_footnote
+    return blocks, pre_cuts
+def get_layout_ordering(
+    parsing_res_list: List[Dict[str, Any]],
+    no_mask_labels: List[str] = [],
+) -> List[Dict[str, Any]]:
+    """
+    Compute a reading order for layout blocks and return the ordered blocks.
+    The blocks are split into segments using the pre-cuts reported by
+    `_get_sub_category`. Inside each segment, blocks are bucketed by their
+    'sub_label'; the blocks left over are ordered with `sort_by_xycut`, and
+    every bucket (cross-column text, titles, title text, vision blocks,
+    vision titles, vision footnotes, everything else) is then attached to its
+    nearest already-ordered block and the segment is renumbered.
+    Modifies:
+        The block dictionaries handled here: 'block_bbox' is cast to a list of
+        ints and 'index' / 'sub_index' are written on them.
+    Args:
+        parsing_res_list (List[Dict[str, Any]]): List of block dictionaries. This function reads
+            'block_bbox', 'block_label', 'block_content', 'sub_label', 'layout', 'title_text',
+            'sub_title' and 'vision_footnote' (the last five are presumably filled in by
+            `_get_sub_category` / `_get_layout_property` -- confirm against those helpers).
+        no_mask_labels (List[str]): Labels for which overlapping removal is not performed.
+            Blocks with these sub-labels and a "double" layout are ordered separately.
+    Returns:
+        List[Dict[str, Any]]: A new list with one dictionary per ordered block, in the order the
+            blocks were accumulated segment by segment. Each entry carries 'sub_index' and
+            'index' ('index' is None for blocks that never received one).
+    """
+    title_text_labels = ["doc_title"]
+    title_labels = ["doc_title", "paragraph_title"]
+    vision_labels = ["image", "table", "seal", "chart", "figure"]
+    vision_title_labels = ["table_title", "chart_title", "figure_title"]
+    parsing_res_list, pre_cuts = _get_sub_category(parsing_res_list, title_text_labels)
+    parsing_res_by_pre_cuts_list = []
+    if len(pre_cuts) > 0:
+        # Split the page into segments along every axis that has pre-cuts.
+        # NOTE(review): a block is selected by its start coordinate only, the
+        # first interval starts at 0, and each axis produces its own set of
+        # segments -- confirm negative coordinates / cuts on both axes cannot occur.
+        block_bboxes = [block["block_bbox"] for block in parsing_res_list]
+        for axis, cuts in pre_cuts.items():
+            axis_index = 1 if axis == "y" else 0
+            max_val = max(bbox[axis_index + 2] for bbox in block_bboxes)
+            intervals = []
+            prev = 0
+            for cut in sorted(cuts):
+                intervals.append((prev, cut))
+                prev = cut
+            intervals.append((prev, max_val))
+            for start, end in intervals:
+                mask = [
+                    (bbox[axis_index] >= start) and (bbox[axis_index] < end)
+                    for bbox in block_bboxes
+                ]
+                parsing_res_by_pre_cuts_list.append(
+                    [parsing_res_list[i] for i, m in enumerate(mask) if m]
+                )
+    else:
+        parsing_res_by_pre_cuts_list = [parsing_res_list]
+    final_parsing_res_list = []
+    # Running offsets so that numbering continues across segments.
+    num_index = 0
+    num_sub_index = 0
+    for parsing_res_by_pre_cuts in parsing_res_by_pre_cuts_list:
+        doc_flag = False
+        median_width = _get_text_median_width(parsing_res_by_pre_cuts)
+        parsing_res_by_pre_cuts, projection_direction = _get_layout_property(
+            parsing_res_by_pre_cuts,
+            median_width,
+            no_mask_labels=no_mask_labels,
+            threshold=0.3,
+        )
+        # Cast bounding boxes to int and move every block into the bucket
+        # that matches its sub-label.
+        (
+            double_text_blocks,
+            title_text_blocks,
+            title_blocks,
+            vision_blocks,
+            vision_title_blocks,
+            vision_footnote_blocks,
+            other_blocks,
+        ) = ([], [], [], [], [], [], [])
+        drop_indexes = []
+        for index, block in enumerate(parsing_res_by_pre_cuts):
+            label = block["sub_label"]
+            block["block_bbox"] = list(map(int, block["block_bbox"]))
+            if label == "doc_title":
+                doc_flag = True
+            if label in no_mask_labels:
+                # Only "double" layout blocks leave the main list here; the
+                # other no-mask blocks stay and are ordered by XY-cut below.
+                if block["layout"] == "double":
+                    double_text_blocks.append(block)
+                    drop_indexes.append(index)
+            elif label == "title_text":
+                title_text_blocks.append(block)
+                drop_indexes.append(index)
+            elif label == "vision_footnote":
+                vision_footnote_blocks.append(block)
+                drop_indexes.append(index)
+            elif label in vision_title_labels:
+                vision_title_blocks.append(block)
+                drop_indexes.append(index)
+            elif label in title_labels:
+                title_blocks.append(block)
+                drop_indexes.append(index)
+            elif label in vision_labels:
+                vision_blocks.append(block)
+                drop_indexes.append(index)
+            else:
+                other_blocks.append(block)
+                drop_indexes.append(index)
+        # Delete from the back so the remaining indexes stay valid.
+        for index in sorted(drop_indexes, reverse=True):
+            del parsing_res_by_pre_cuts[index]
+        if len(parsing_res_by_pre_cuts) > 0:
+            # When "double" blocks outnumber the remaining blocks, or a
+            # projection direction was reported, titles and "double" blocks are
+            # merged back and everything is ordered in a single XY-cut pass.
+            if (
+                len(double_text_blocks) > len(parsing_res_by_pre_cuts)
+                or projection_direction
+            ):
+                parsing_res_by_pre_cuts.extend(title_blocks + double_text_blocks)
+                title_blocks = []
+                double_text_blocks = []
+                block_bboxes = [
+                    block["block_bbox"] for block in parsing_res_by_pre_cuts
+                ]
+                block_bboxes.sort(
+                    key=lambda x: (
+                        x[0] // max(20, median_width),
+                        x[1],
+                    ),
+                )
+                block_bboxes = np.array(block_bboxes)
+                sorted_indices = sort_by_xycut(block_bboxes, direction=1, min_gap=1)
+            else:
+                block_bboxes = [
+                    block["block_bbox"] for block in parsing_res_by_pre_cuts
+                ]
+                block_bboxes.sort(key=lambda x: (x[0] // 20, x[1]))
+                block_bboxes = np.array(block_bboxes)
+                sorted_indices = sort_by_xycut(block_bboxes, direction=0, min_gap=20)
+            sorted_boxes = block_bboxes[sorted_indices].tolist()
+            # A block's order is the position of its bbox in the XY-cut result
+            # (blocks with identical bboxes receive the same number).
+            for block in parsing_res_by_pre_cuts:
+                block["index"] = num_index + sorted_boxes.index(block["block_bbox"]) + 1
+                block["sub_index"] = (
+                    num_sub_index + sorted_boxes.index(block["block_bbox"]) + 1
+                )
+        def nearest_match_(input_blocks, distance_type="manhattan", is_add_index=True):
+            # Give every block of `input_blocks` the 'index' (or 'sub_index'
+            # when `is_add_index` is False) of the closest block already in
+            # `parsing_res_by_pre_cuts`, then append it to that list.
+            for block in input_blocks:
+                bbox = block["block_bbox"]
+                min_distance = float("inf")
+                min_distance_config = [
+                    [float("inf"), float("inf")],
+                    float("inf"),
+                    float("inf"),
+                ]  # for double text
+                # Stays 0 when no candidate has a finite distance.
+                nearest_gt_index = 0
+                for match_block in parsing_res_by_pre_cuts:
+                    match_bbox = match_block["block_bbox"]
+                    if distance_type == "nearest_iou_edge_distance":
+                        distance, min_distance_config = _nearest_iou_edge_distance(
+                            bbox,
+                            match_bbox,
+                            block["sub_label"],
+                            vision_labels=vision_labels,
+                            no_mask_labels=no_mask_labels,
+                            median_width=median_width,
+                            title_labels=title_labels,
+                            title_text=block["title_text"],
+                            sub_title=block["sub_title"],
+                            min_distance_config=min_distance_config,
+                            tolerance_len=10,
+                        )
+                    elif distance_type == "title_text":
+                        # Only titles/abstracts that recorded title text are
+                        # candidates; overlap with that text shrinks the distance.
+                        if (
+                            match_block["block_label"] in title_labels + ["abstract"]
+                            and match_block["title_text"] != []
+                        ):
+                            iou_left_up = _calculate_overlap_area_div_minbox_area_ratio(
+                                bbox,
+                                match_block["title_text"][0][1],
+                            )
+                            iou_right_down = (
+                                _calculate_overlap_area_div_minbox_area_ratio(
+                                    bbox,
+                                    match_block["title_text"][-1][1],
+                                )
+                            )
+                            iou = 1 - max(iou_left_up, iou_right_down)
+                            distance = _manhattan_distance(bbox, match_bbox) * iou
+                        else:
+                            distance = float("inf")
+                    elif distance_type == "manhattan":
+                        distance = _manhattan_distance(bbox, match_bbox)
+                    elif distance_type == "vision_footnote":
+                        # Only vision blocks that recorded a footnote are candidates.
+                        if (
+                            match_block["block_label"] in vision_labels
+                            and match_block["vision_footnote"] != []
+                        ):
+                            iou_left_up = _calculate_overlap_area_div_minbox_area_ratio(
+                                bbox,
+                                match_block["vision_footnote"][0],
+                            )
+                            iou_right_down = (
+                                _calculate_overlap_area_div_minbox_area_ratio(
+                                    bbox,
+                                    match_block["vision_footnote"][-1],
+                                )
+                            )
+                            iou = 1 - max(iou_left_up, iou_right_down)
+                            distance = _manhattan_distance(bbox, match_bbox) * iou
+                        else:
+                            distance = float("inf")
+                    elif distance_type == "vision_body":
+                        if (
+                            match_block["block_label"] in vision_title_labels
+                            and block["vision_footnote"] != []
+                        ):
+                            iou_left_up = _calculate_overlap_area_div_minbox_area_ratio(
+                                match_bbox,
+                                block["vision_footnote"][0],
+                            )
+                            iou_right_down = (
+                                _calculate_overlap_area_div_minbox_area_ratio(
+                                    match_bbox,
+                                    block["vision_footnote"][-1],
+                                )
+                            )
+                            iou = 1 - max(iou_left_up, iou_right_down)
+                            distance = _manhattan_distance(bbox, match_bbox) * iou
+                        else:
+                            distance = float("inf")
+                    # When a reference block crosses multiple columns, its order should be after the blocks above it.
+                    elif distance_type == "append":
+                        if match_bbox[3] <= bbox[1]:
+                            distance = -(match_bbox[2] * 10 + match_bbox[3])
+                        else:
+                            distance = float("inf")
+                    else:
+                        raise NotImplementedError
+                    if distance < min_distance:
+                        min_distance = distance
+                        if is_add_index:
+                            nearest_gt_index = match_block.get("index", 999)
+                        else:
+                            nearest_gt_index = match_block.get("sub_index", 999)
+                if is_add_index:
+                    block["index"] = nearest_gt_index
+                else:
+                    block["sub_index"] = nearest_gt_index
+                parsing_res_by_pre_cuts.append(block)
+        # Cross-column ("double") text blocks.
+        double_text_blocks.sort(
+            key=lambda x: (
+                x["block_bbox"][1] // 10,
+                x["block_bbox"][0] // median_width,
+                x["block_bbox"][1] ** 2 + x["block_bbox"][0] ** 2,
+            ),
+        )
+        # Filter the reference blocks from all blocks that cross multiple columns.
+        # They should be ordered using "append".
+        double_text_reference_blocks = []
+        i = 0
+        while i < len(double_text_blocks):
+            if double_text_blocks[i]["block_label"] == "reference":
+                double_text_reference_blocks.append(double_text_blocks.pop(i))
+            else:
+                i += 1
+        nearest_match_(
+            double_text_blocks,
+            distance_type="nearest_iou_edge_distance",
+        )
+        nearest_match_(
+            double_text_reference_blocks,
+            distance_type="append",
+        )
+        parsing_res_by_pre_cuts.sort(
+            key=lambda x: (x["index"], x["block_bbox"][1], x["block_bbox"][0]),
+        )
+        # Renumber so that indexes are consecutive again after the insertions.
+        for idx, block in enumerate(parsing_res_by_pre_cuts):
+            block["index"] = num_index + idx + 1
+            block["sub_index"] = num_sub_index + idx + 1
+        # Title blocks.
+        title_blocks.sort(
+            key=lambda x: (
+                x["block_bbox"][1] // 10,
+                x["block_bbox"][0] // median_width,
+                x["block_bbox"][1] ** 2 + x["block_bbox"][0] ** 2,
+            ),
+        )
+        nearest_match_(title_blocks, distance_type="nearest_iou_edge_distance")
+        if doc_flag:
+            text_sort_labels = ["doc_title"]
+            text_label_priority = {
+                label: priority for priority, label in enumerate(text_sort_labels)
+            }
+            doc_titles = []
+            for i, block in enumerate(parsing_res_by_pre_cuts):
+                if block["block_label"] == "doc_title":
+                    doc_titles.append(
+                        (i, block["block_bbox"][1], block["block_bbox"][0]),
+                    )
+            doc_titles.sort(key=lambda x: (x[1], x[2]))
+            # `doc_flag` is derived from 'sub_label' while this scan uses
+            # 'block_label', so the list may be empty; guard the lookup instead
+            # of raising IndexError.
+            if doc_titles:
+                # Force the top-most document title to the front of the segment.
+                first_doc_title_index = doc_titles[0][0]
+                parsing_res_by_pre_cuts[first_doc_title_index]["index"] = 1
+            parsing_res_by_pre_cuts.sort(
+                key=lambda x: (
+                    x["index"],
+                    text_label_priority.get(x["block_label"], 9999),
+                    x["block_bbox"][1],
+                    x["block_bbox"][0],
+                ),
+            )
+        else:
+            parsing_res_by_pre_cuts.sort(
+                key=lambda x: (
+                    x["index"],
+                    x["block_bbox"][1],
+                    x["block_bbox"][0],
+                ),
+            )
+        for idx, block in enumerate(parsing_res_by_pre_cuts):
+            block["index"] = num_index + idx + 1
+            block["sub_index"] = num_sub_index + idx + 1
+        # Text blocks that belong to a title ("title_text").
+        nearest_match_(title_text_blocks, distance_type="title_text")
+        def hor_tb_and_ver_lr(x):
+            # Tie-break key: top coordinate for horizontal boxes, left
+            # coordinate for the others.
+            input_bbox = x["block_bbox"]
+            is_horizontal = _get_bbox_direction(input_bbox)
+            if is_horizontal:
+                return input_bbox[1]
+            else:
+                return input_bbox[0]
+        parsing_res_by_pre_cuts.sort(
+            key=lambda x: (x["index"], hor_tb_and_ver_lr(x)),
+        )
+        for idx, block in enumerate(parsing_res_by_pre_cuts):
+            block["index"] = num_index + idx + 1
+            block["sub_index"] = num_sub_index + idx + 1
+        # Vision blocks (image, table, seal, chart, figure): from here on only
+        # 'sub_index' is assigned, 'index' is left untouched.
+        nearest_match_(
+            vision_blocks,
+            distance_type="nearest_iou_edge_distance",
+            is_add_index=False,
+        )
+        parsing_res_by_pre_cuts.sort(
+            key=lambda x: (
+                x["sub_index"],
+                x["block_bbox"][1],
+                x["block_bbox"][0],
+            ),
+        )
+        for idx, block in enumerate(parsing_res_by_pre_cuts):
+            block["sub_index"] = num_sub_index + idx + 1
+        # Titles of vision blocks (table_title, chart_title, figure_title).
+        nearest_match_(
+            vision_title_blocks,
+            distance_type="nearest_iou_edge_distance",
+            is_add_index=False,
+        )
+        parsing_res_by_pre_cuts.sort(
+            key=lambda x: (
+                x["sub_index"],
+                x["block_bbox"][1],
+                x["block_bbox"][0],
+            ),
+        )
+        for idx, block in enumerate(parsing_res_by_pre_cuts):
+            block["sub_index"] = num_sub_index + idx + 1
+        # Vision footnotes: on equal 'sub_index' they sort after other blocks.
+        nearest_match_(
+            vision_footnote_blocks,
+            distance_type="vision_footnote",
+            is_add_index=False,
+        )
+        text_label_priority = {"vision_footnote": 9999}
+        parsing_res_by_pre_cuts.sort(
+            key=lambda x: (
+                x["sub_index"],
+                text_label_priority.get(x["sub_label"], 0),
+                x["block_bbox"][1],
+                x["block_bbox"][0],
+            ),
+        )
+        for idx, block in enumerate(parsing_res_by_pre_cuts):
+            block["sub_index"] = num_sub_index + idx + 1
+        # Every remaining label (header, footnote, header_image, ...); these
+        # are appended without a further sort or renumbering.
+        nearest_match_(other_blocks, distance_type="manhattan", is_add_index=False)
+        # Collect the blocks of this segment.
+        final_parsing_res_list.extend(parsing_res_by_pre_cuts)
+        # Advance the running offsets; only blocks holding a truthy 'index'
+        # count towards `num_index`.
+        num_sub_index += len(parsing_res_by_pre_cuts)
+        for parsing_res in parsing_res_by_pre_cuts:
+            if parsing_res.get("index"):
+                num_index += 1
+    # Build fresh dictionaries restricted to the fields exposed to callers.
+    parsing_res_list = [
+        {
+            "block_label": parsing_res["block_label"],
+            "block_content": parsing_res["block_content"],
+            "block_bbox": parsing_res["block_bbox"],
+            "block_image": parsing_res.get("block_image", None),
+            "sub_label": parsing_res["sub_label"],
+            "sub_index": parsing_res["sub_index"],
+            "index": parsing_res.get("index", None),
+            "seg_start_coordinate": parsing_res.get(
+                "seg_start_coordinate", float("inf")
+            ),
+            "seg_end_coordinate": parsing_res.get("seg_end_coordinate", float("-inf")),
+            "num_of_lines": parsing_res.get("num_of_lines", 1),
+        }
+        for parsing_res in final_parsing_res_list
+    ]
+    return parsing_res_list
+def _manhattan_distance(
+    point1: Tuple[float, float],
+    point2: Tuple[float, float],
+    weight_x: float = 1.0,
+    weight_y: float = 1.0,
+) -> float:
+    """
+    Return the weighted L1 (Manhattan) distance between two points.
+    Only the first two entries of each argument are read, so longer sequences
+    are accepted and compared on their leading (x, y) pair.
+    Args:
+        point1 (Tuple[float, float]): First point, read as (x, y).
+        point2 (Tuple[float, float]): Second point, read as (x, y).
+        weight_x (float): Multiplier applied to the absolute x difference. Default is 1.0.
+        weight_y (float): Multiplier applied to the absolute y difference. Default is 1.0.
+    Returns:
+        float: weight_x * |x1 - x2| + weight_y * |y1 - y2|.
+    """
+    delta_x = abs(point1[0] - point2[0])
+    delta_y = abs(point1[1] - point2[1])
+    return weight_x * delta_x + weight_y * delta_y
+def _calculate_horizontal_distance(
+    input_bbox: List[int],
+    match_bbox: List[int],
+    height: int,
+    disperse: int,
+    title_text: List[Tuple[int, List[int]]],
+) -> float:
+    """
+    Score how far a candidate box is from an input box for horizontally laid out content.
+    The score adds the x offset between the candidate's right edge and the
+    input's left edge (in whole `disperse` steps) to the vertical gap between
+    the boxes (in whole `height` steps, plus the raw gap divided by 5000).
+    Args:
+        input_bbox (List[int]): Input box as [x1, y1, x2, y2].
+        match_bbox (List[int]): Candidate box as [x1', y1', x2', y2'].
+        height (int): Divisor applied to the vertical gap.
+        disperse (int): Divisor applied to the x offset.
+        title_text (List[Tuple[int, List[int]]]): Entries of the form (position_indicator, [x1, y1, x2, y2]).
+            The height of the last entry extends the input downwards when its indicator is 2;
+            the height of the first entry extends it upwards when its indicator is 1.
+    Returns:
+        float: The combined distance score.
+    """
+    left, top, _, bottom = input_bbox
+    _, match_top, match_right, match_bottom = match_bbox
+    if bottom < match_top:
+        # Input lies above the candidate: a title text recorded with
+        # indicator 2 pushes the input's bottom edge down by its own height.
+        if title_text:
+            trailing = title_text[-1]
+            if trailing[0] == 2:
+                bottom += trailing[1][3] - trailing[1][1]
+        # Gaps towards a candidate below count only half.
+        gap = (match_top - bottom) * 0.5
+    else:
+        # Otherwise a title text recorded with indicator 1 pulls the
+        # input's top edge up by its own height.
+        if title_text:
+            leading = title_text[0]
+            if leading[0] == 1:
+                top -= leading[1][3] - leading[1][1]
+        gap = top - match_bottom
+    column_steps = abs(match_right - left) // disperse
+    # gap / 5000 keeps a small continuous term to separate equal step counts.
+    return column_steps + gap // height + gap / 5000
+def _calculate_vertical_distance(
+    input_bbox: List[int],
+    match_bbox: List[int],
+    width: int,
+    disperse: int,
+    title_text: List[Tuple[int, List[int]]],
+) -> float:
+    """
+    Score how far a candidate box is from an input box for vertically laid out content.
+    The score adds the y offset between the candidate's bottom edge and the
+    input's top edge (in whole `disperse` steps) to the horizontal gap between
+    the boxes (in whole `width` steps, plus the raw gap divided by 5000).
+    Args:
+        input_bbox (List[int]): Input box as [x1, y1, x2, y2].
+        match_bbox (List[int]): Candidate box as [x1', y1', x2', y2'].
+        width (int): Divisor applied to the horizontal gap.
+        disperse (int): Divisor applied to the y offset.
+        title_text (List[Tuple[int, List[int]]]): Entries of the form (position_indicator, [x1, y1, x2, y2]).
+            The width of the first entry extends the input to the left when its indicator is 3;
+            the width of the last entry extends it to the right when its indicator is 4.
+    Returns:
+        float: The combined distance score.
+    """
+    left, top, right, _ = input_bbox
+    match_left, _, match_right, match_bottom = match_bbox
+    if left > match_right:
+        # Input lies to the right of the candidate: a title text recorded
+        # with indicator 3 moves the input's left edge further left.
+        if title_text:
+            leading = title_text[0]
+            if leading[0] == 3:
+                left -= leading[1][2] - leading[1][0]
+        # Gaps towards a candidate on the left count only half.
+        gap = (left - match_right) * 0.5
+    else:
+        # Otherwise a title text recorded with indicator 4 moves the
+        # input's right edge further right.
+        if title_text:
+            trailing = title_text[-1]
+            if trailing[0] == 4:
+                right += trailing[1][2] - trailing[1][0]
+        gap = match_left - right
+    row_steps = abs(match_bottom - top) // disperse
+    # gap / 5000 keeps a small continuous term to separate equal step counts.
+    return row_steps + gap // width + gap / 5000
+def _nearest_edge_distance(
+    input_bbox: List[int],
+    match_bbox: List[int],
+    weight: List[float] = [1.0, 1.0, 1.0, 1.0],
+    label: str = "text",
+    no_mask_labels: List[str] = [],
+    min_edge_distance_config: List[float] = [],
+    tolerance_len: float = 10.0,
+) -> Tuple[float, List[float]]:
+    """
+    Measure the weighted gap between the facing edges of two bounding boxes.
+    Overlapping boxes score 0 unless `label` is listed in `no_mask_labels`.
+    Otherwise the gap on each axis is multiplied by the weight of the side the
+    candidate lies on; a gap within `tolerance_len` of the reference gap from
+    `min_edge_distance_config` is replaced by that reference before weighting.
+    Args:
+        input_bbox (list): Input box as [x1, y1, x2, y2].
+        match_bbox (list): Candidate box as [x1', y1', x2', y2'].
+        weight (list, optional): Multipliers used when the input is, in order, left of, right of,
+            above, or below the candidate. Defaults to [1, 1, 1, 1].
+        label (str, optional): Label of the input box. Defaults to 'text'.
+        no_mask_labels (list, optional): Labels that skip the overlap shortcut; for them a gap
+            towards a candidate below is additionally floored at 0.1 and multiplied by 10.
+            Defaults to an empty list.
+        min_edge_distance_config (list, optional): Reference gaps [x, y]. An empty value is treated
+            as [float('inf'), float('inf')].
+        tolerance_len (float, optional): Maximum difference to a reference gap for it to be reused.
+            Defaults to 10.
+    Returns:
+        Tuple[float, List[float]]: A tuple containing:
+            - The sum of both axis distances when the boxes are separated on both axes,
+              otherwise the smaller of the two.
+            - The unweighted gaps [x, y] (float('inf') where no gap was measured).
+    """
+    overlap_ratio = _calculate_overlap_area_div_minbox_area_ratio(
+        input_bbox,
+        match_bbox,
+    )
+    if overlap_ratio > 0 and label not in no_mask_labels:
+        return 0, [0, 0]
+    infinity = float("inf")
+    reference_x, reference_y = min_edge_distance_config or [infinity, infinity]
+    x1, y1, x2, y2 = input_bbox
+    x1_prime, y1_prime, x2_prime, y2_prime = match_bbox
+    def weighted_gap(raw_gap, reference_gap, factor):
+        # Reuse the reference gap when the measured one is close enough to it.
+        if abs(raw_gap - reference_gap) <= tolerance_len:
+            return reference_gap * factor
+        return raw_gap * factor
+    # Raw gaps in the order left, right, up, down.
+    gaps = [infinity, infinity, infinity, infinity]
+    separated_axes = 0
+    distance_x = infinity
+    distance_y = infinity
+    if x2 < x1_prime:
+        # Input is to the left of the candidate.
+        separated_axes += 1
+        gaps[0] = x1_prime - x2
+        distance_x = weighted_gap(gaps[0], reference_x, weight[0])
+    elif x1 > x2_prime:
+        # Input is to the right of the candidate.
+        separated_axes += 1
+        gaps[1] = x1 - x2_prime
+        distance_x = weighted_gap(gaps[1], reference_x, weight[1])
+    elif overlap_ratio > 0:
+        gaps[0] = 0
+        distance_x = 0
+    if y2 < y1_prime:
+        # Input is above the candidate.
+        separated_axes += 1
+        gaps[2] = y1_prime - y2
+        distance_y = weighted_gap(gaps[2], reference_y, weight[2])
+        if label in no_mask_labels:
+            distance_y = max(0.1, distance_y) * 10  # for abstract
+    elif y1 > y2_prime:
+        # Input is below the candidate.
+        separated_axes += 1
+        gaps[3] = y1 - y2_prime
+        distance_y = weighted_gap(gaps[3], reference_y, weight[3])
+    elif overlap_ratio > 0:
+        gaps[2] = 0
+        distance_y = 0
+    nearest_gaps = [min(gaps[0], gaps[1]), min(gaps[2], gaps[3])]
+    if separated_axes == 2:
+        return (distance_x + distance_y), nearest_gaps
+    return min(distance_x, distance_y), nearest_gaps
+def _get_weights(label, horizontal):
+    """
+    Return the four directional weights used for edge-distance matching.
+    `_nearest_edge_distance` multiplies the gap by entry 0, 1, 2 or 3 when the
+    input box lies left of, right of, above, or below the candidate, so a
+    small entry makes candidates on that side cheaper to match.
+    Args:
+        label: Label of the input block.
+        horizontal: Truthy when the input block is treated as horizontal; only
+            consulted for "doc_title".
+    Returns:
+        list: A new four-element weight list.
+    """
+    if label == "doc_title":
+        if horizontal:
+            return [1, 0.1, 0.1, 1]
+        return [0.2, 0.1, 1, 1]
+    # Labels that favour a candidate located below the input block.
+    favour_below = (
+        "paragraph_title",
+        "table_title",
+        "abstract",
+        "image",
+        "seal",
+        "chart",
+        "figure",
+    )
+    if label in favour_below:
+        return [1, 1, 0.1, 1]
+    # Everything else favours a candidate located above the input block.
+    return [1, 1, 1, 0.1]
+def _nearest_iou_edge_distance(
+    input_bbox: List[int],
+    match_bbox: List[int],
+    label: str,
+    vision_labels: List[str],
+    no_mask_labels: List[str],
+    median_width: int = -1,
+    title_labels: List[str] = [],
+    title_text: List[Tuple[int, List[int]]] = [],
+    sub_title: List[List[int]] = [],
+    min_distance_config: List[float] = [],
+    tolerance_len: float = 10.0,
+) -> Tuple[float, List[float]]:
+    """
+    Calculate the nearest IOU edge distance between two bounding boxes, considering label types, title adjustments, and minimum distance configurations.
+    This function computes the edge distance between two bounding boxes while considering their overlap (IOU) and various adjustments based on label types,
+    title text, and subtitle information. It also applies minimum distance configurations and tolerance adjustments.
+    Args:
+        input_bbox (List[int]): The bounding box coordinates [x1, y1, x2, y2] of the input object.
+        match_bbox (List[int]): The bounding box coordinates [x1', y1', x2', y2'] of the object to match against.
+        label (str): The label/type of the object in the bounding box (e.g., 'image', 'text', etc.).
+        vision_labels (List[str]): List of labels for vision-related objects (e.g., images, icons).
+        no_mask_labels (List[str]): Labels for which no masking is applied when calculating edge distances.
+        median_width (int, optional): The median width for title dispersion calculation. Defaults to -1.
+        title_labels (List[str], optional): Labels that indicate the object is a title. Defaults to an empty list.
+        title_text (List[Tuple[int, List[int]]], optional): Text content associated with title labels, in the format [(position_indicator, [x1, y1, x2, y2]), ...].
+        sub_title (List[List[int]], optional): List of subtitle bounding boxes to adjust the input_bbox. Defaults to an empty list.
+        min_distance_config (List[float], optional): Configuration for minimum distances [min_edge_distance_config, up_edge_distances_config, total_distance].
+        tolerance_len (float, optional): The tolerance length for adjusting edge distances. Defaults to 10.0.
+    Returns:
+        Tuple[float, List[float]]: A tuple containing:
+            - The calculated distance considering IOU and adjustments.
+            - The updated minimum distance configuration.
+    """
+    x1, y1, x2, y2 = input_bbox
+    x1_prime, y1_prime, x2_prime, y2_prime = match_bbox
+    min_edge_distance_config, up_edge_distances_config, total_distance = (
+        min_distance_config
+    )
+    iou_distance = 0
+    if label in vision_labels:
+        horizontal1 = horizontal2 = True
+    else:
+        horizontal1 = _get_bbox_direction(input_bbox)
+        horizontal2 = _get_bbox_direction(match_bbox, 3)
+    if (
+        horizontal1 != horizontal2
+        or _get_projection_iou(input_bbox, match_bbox, horizontal1) < 0.01
+    ):
+        iou_distance = 1
+    if label == "doc_title":
+        # Calculate distance for titles
+        disperse = max(1, median_width)
+        tolerance_len = max(tolerance_len, disperse)
+    # Adjust input_bbox based on sub_title
+    if sub_title:
+        for sub in sub_title:
+            x1_, y1_, x2_, y2_ = sub
+            x1, y1, x2, y2 = (
+                min(x1, x1_),
+                min(y1, y1_),
+                min(x2, x2_),
+                max(y2, y2_),
+            )
+        input_bbox = [x1, y1, x2, y2]
+    if title_text:
+        for sub in title_text:
+            x1_, y1_, x2_, y2_ = sub[1]
+            if horizontal1:
+                x1, y1, x2, y2 = (
+                    min(x1, x1_),
+                    min(y1, y1_),
+                    min(x2, x2_),
+                    max(y2, y2_),
+                )
+            else:
+                x1, y1, x2, y2 = (
+                    min(x1, x1_),
+                    min(y1, y1_),
+                    max(x2, x2_),
+                    min(y2, y2_),
+                )
+        input_bbox = [x1, y1, x2, y2]
+    # Calculate edge distance
+    weight = _get_weights(label, horizontal1)
+    if label == "abstract":
+        tolerance_len *= 2
+    edge_distance, edge_distance_config = _nearest_edge_distance(
+        input_bbox,
+        match_bbox,
+        weight,
+        label=label,
+        no_mask_labels=no_mask_labels,
+        min_edge_distance_config=min_edge_distance_config,
+        tolerance_len=tolerance_len,
+    )
+    # Weights for combining distances
+    iou_edge_weight = [10**8, 10**4, 1, 0.0001]
+    # Calculate up and left edge distances
+    up_edge_distance = y1_prime
+    left_edge_distance = x1_prime
+    if (
+        label in no_mask_labels or label in title_labels or label in vision_labels
+    ) and y1 > y2_prime:
+        up_edge_distance = -y2_prime
+        left_edge_distance = -x2_prime
+    min_up_edge_distance = up_edge_distances_config
+    if abs(min_up_edge_distance - up_edge_distance) <= tolerance_len:
+        up_edge_distance = min_up_edge_distance
+    # Calculate total distance
+    distance = (
+        iou_distance * iou_edge_weight[0]
+        + edge_distance * iou_edge_weight[1]
+        + up_edge_distance * iou_edge_weight[2]
+        + left_edge_distance * iou_edge_weight[3]
+    )
+    # Update minimum distance configuration if a smaller distance is found
+    if total_distance > distance:
+        edge_distance_config = [
+            edge_distance_config[0],
+            edge_distance_config[1],
+        ]
+        min_distance_config = [
+            edge_distance_config,
+            up_edge_distance,
+            distance,
+        ]
+    return distance, min_distance_config
+def get_show_color(label: str) -> Tuple:
+    label_colors = {
+        # Medium Blue (from 'titles_list')
+        "paragraph_title": (102, 102, 255, 100),
+        "doc_title": (255, 248, 220, 100),  # Cornsilk
+        # Light Yellow (from 'tables_caption_list')
+        "table_title": (255, 255, 102, 100),
+        # Sky Blue (from 'imgs_caption_list')
+        "figure_title": (102, 178, 255, 100),
+        "chart_title": (221, 160, 221, 100),  # Plum
+        "vision_footnote": (144, 238, 144, 100),  # Light Green
+        # Deep Purple (from 'texts_list')
+        "text": (153, 0, 76, 100),
+        # Bright Green (from 'interequations_list')
+        "formula": (0, 255, 0, 100),
+        "abstract": (255, 239, 213, 100),  # Papaya Whip
+        # Medium Green (from 'lists_list' and 'indexs_list')
+        "content": (40, 169, 92, 100),
+        # Neutral Gray (from 'dropped_bbox_list')
+        "seal": (158, 158, 158, 100),
+        # Olive Yellow (from 'tables_body_list')
+        "table": (204, 204, 0, 100),
+        # Bright Green (from 'imgs_body_list')
+        "image": (153, 255, 51, 100),
+        # Bright Green (from 'imgs_body_list')
+        "figure": (153, 255, 51, 100),
+        "chart": (216, 191, 216, 100),  # Thistle
+        # Pale Yellow-Green (from 'tables_footnote_list')
+        "reference": (229, 255, 204, 100),
+        "algorithm": (255, 250, 240, 100),  # Floral White
+    }
+    default_color = (158, 158, 158, 100)
+    return label_colors.get(label, default_color)

paddlex 2.1.0__py3-none-any.whl → 3.0.0rc0__py3-none-any.whl

paddlex 2.1.0__py3-none-any.whl → 3.0.0rc0__py3-none-any.whl