paddlex 2.1.0__py3-none-any.whl → 3.0.0rc0__py3-none-any.whl

This diff represents the content of publicly available package versions released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (1708)
  1. paddlex/.version +1 -0
  2. paddlex/__init__.py +52 -19
  3. paddlex/__main__.py +39 -0
  4. paddlex/configs/modules/3d_bev_detection/BEVFusion.yaml +38 -0
  5. paddlex/configs/modules/doc_text_orientation/PP-LCNet_x1_0_doc_ori.yaml +41 -0
  6. paddlex/configs/modules/face_detection/BlazeFace-FPN-SSH.yaml +40 -0
  7. paddlex/configs/modules/face_detection/BlazeFace.yaml +40 -0
  8. paddlex/configs/modules/face_detection/PP-YOLOE_plus-S_face.yaml +40 -0
  9. paddlex/configs/modules/face_detection/PicoDet_LCNet_x2_5_face.yaml +40 -0
  10. paddlex/configs/modules/face_feature/MobileFaceNet.yaml +41 -0
  11. paddlex/configs/modules/face_feature/ResNet50_face.yaml +41 -0
  12. paddlex/configs/modules/formula_recognition/LaTeX_OCR_rec.yaml +40 -0
  13. paddlex/configs/modules/formula_recognition/PP-FormulaNet-L.yaml +40 -0
  14. paddlex/configs/modules/formula_recognition/PP-FormulaNet-S.yaml +40 -0
  15. paddlex/configs/modules/formula_recognition/UniMERNet.yaml +40 -0
  16. paddlex/configs/modules/human_detection/PP-YOLOE-L_human.yaml +42 -0
  17. paddlex/configs/modules/human_detection/PP-YOLOE-S_human.yaml +42 -0
  18. paddlex/configs/modules/image_anomaly_detection/STFPM.yaml +41 -0
  19. paddlex/configs/modules/image_classification/CLIP_vit_base_patch16_224.yaml +41 -0
  20. paddlex/configs/modules/image_classification/CLIP_vit_large_patch14_224.yaml +41 -0
  21. paddlex/configs/modules/image_classification/ConvNeXt_base_224.yaml +41 -0
  22. paddlex/configs/modules/image_classification/ConvNeXt_base_384.yaml +41 -0
  23. paddlex/configs/modules/image_classification/ConvNeXt_large_224.yaml +41 -0
  24. paddlex/configs/modules/image_classification/ConvNeXt_large_384.yaml +41 -0
  25. paddlex/configs/modules/image_classification/ConvNeXt_small.yaml +41 -0
  26. paddlex/configs/modules/image_classification/ConvNeXt_tiny.yaml +41 -0
  27. paddlex/configs/modules/image_classification/FasterNet-L.yaml +40 -0
  28. paddlex/configs/modules/image_classification/FasterNet-M.yaml +40 -0
  29. paddlex/configs/modules/image_classification/FasterNet-S.yaml +40 -0
  30. paddlex/configs/modules/image_classification/FasterNet-T0.yaml +40 -0
  31. paddlex/configs/modules/image_classification/FasterNet-T1.yaml +40 -0
  32. paddlex/configs/modules/image_classification/FasterNet-T2.yaml +40 -0
  33. paddlex/configs/modules/image_classification/MobileNetV1_x0_25.yaml +41 -0
  34. paddlex/configs/modules/image_classification/MobileNetV1_x0_5.yaml +41 -0
  35. paddlex/configs/modules/image_classification/MobileNetV1_x0_75.yaml +41 -0
  36. paddlex/configs/modules/image_classification/MobileNetV1_x1_0.yaml +41 -0
  37. paddlex/configs/modules/image_classification/MobileNetV2_x0_25.yaml +41 -0
  38. paddlex/configs/modules/image_classification/MobileNetV2_x0_5.yaml +41 -0
  39. paddlex/configs/modules/image_classification/MobileNetV2_x1_0.yaml +41 -0
  40. paddlex/configs/modules/image_classification/MobileNetV2_x1_5.yaml +41 -0
  41. paddlex/configs/modules/image_classification/MobileNetV2_x2_0.yaml +41 -0
  42. paddlex/configs/modules/image_classification/MobileNetV3_large_x0_35.yaml +41 -0
  43. paddlex/configs/modules/image_classification/MobileNetV3_large_x0_5.yaml +41 -0
  44. paddlex/configs/modules/image_classification/MobileNetV3_large_x0_75.yaml +41 -0
  45. paddlex/configs/modules/image_classification/MobileNetV3_large_x1_0.yaml +41 -0
  46. paddlex/configs/modules/image_classification/MobileNetV3_large_x1_25.yaml +41 -0
  47. paddlex/configs/modules/image_classification/MobileNetV3_small_x0_35.yaml +41 -0
  48. paddlex/configs/modules/image_classification/MobileNetV3_small_x0_5.yaml +41 -0
  49. paddlex/configs/modules/image_classification/MobileNetV3_small_x0_75.yaml +41 -0
  50. paddlex/configs/modules/image_classification/MobileNetV3_small_x1_0.yaml +41 -0
  51. paddlex/configs/modules/image_classification/MobileNetV3_small_x1_25.yaml +41 -0
  52. paddlex/configs/modules/image_classification/MobileNetV4_conv_large.yaml +41 -0
  53. paddlex/configs/modules/image_classification/MobileNetV4_conv_medium.yaml +41 -0
  54. paddlex/configs/modules/image_classification/MobileNetV4_conv_small.yaml +41 -0
  55. paddlex/configs/modules/image_classification/MobileNetV4_hybrid_large.yaml +41 -0
  56. paddlex/configs/modules/image_classification/MobileNetV4_hybrid_medium.yaml +41 -0
  57. paddlex/configs/modules/image_classification/PP-HGNetV2-B0.yaml +41 -0
  58. paddlex/configs/modules/image_classification/PP-HGNetV2-B1.yaml +41 -0
  59. paddlex/configs/modules/image_classification/PP-HGNetV2-B2.yaml +41 -0
  60. paddlex/configs/modules/image_classification/PP-HGNetV2-B3.yaml +41 -0
  61. paddlex/configs/modules/image_classification/PP-HGNetV2-B4.yaml +41 -0
  62. paddlex/configs/modules/image_classification/PP-HGNetV2-B5.yaml +41 -0
  63. paddlex/configs/modules/image_classification/PP-HGNetV2-B6.yaml +41 -0
  64. paddlex/configs/modules/image_classification/PP-HGNet_base.yaml +41 -0
  65. paddlex/configs/modules/image_classification/PP-HGNet_small.yaml +41 -0
  66. paddlex/configs/modules/image_classification/PP-HGNet_tiny.yaml +41 -0
  67. paddlex/configs/modules/image_classification/PP-LCNetV2_base.yaml +41 -0
  68. paddlex/configs/modules/image_classification/PP-LCNetV2_large.yaml +41 -0
  69. paddlex/configs/modules/image_classification/PP-LCNetV2_small.yaml +41 -0
  70. paddlex/configs/modules/image_classification/PP-LCNet_x0_25.yaml +41 -0
  71. paddlex/configs/modules/image_classification/PP-LCNet_x0_35.yaml +41 -0
  72. paddlex/configs/modules/image_classification/PP-LCNet_x0_5.yaml +41 -0
  73. paddlex/configs/modules/image_classification/PP-LCNet_x0_75.yaml +41 -0
  74. paddlex/configs/modules/image_classification/PP-LCNet_x1_0.yaml +41 -0
  75. paddlex/configs/modules/image_classification/PP-LCNet_x1_5.yaml +41 -0
  76. paddlex/configs/modules/image_classification/PP-LCNet_x2_0.yaml +41 -0
  77. paddlex/configs/modules/image_classification/PP-LCNet_x2_5.yaml +41 -0
  78. paddlex/configs/modules/image_classification/ResNet101.yaml +41 -0
  79. paddlex/configs/modules/image_classification/ResNet101_vd.yaml +41 -0
  80. paddlex/configs/modules/image_classification/ResNet152.yaml +41 -0
  81. paddlex/configs/modules/image_classification/ResNet152_vd.yaml +41 -0
  82. paddlex/configs/modules/image_classification/ResNet18.yaml +41 -0
  83. paddlex/configs/modules/image_classification/ResNet18_vd.yaml +41 -0
  84. paddlex/configs/modules/image_classification/ResNet200_vd.yaml +41 -0
  85. paddlex/configs/modules/image_classification/ResNet34.yaml +41 -0
  86. paddlex/configs/modules/image_classification/ResNet34_vd.yaml +41 -0
  87. paddlex/configs/modules/image_classification/ResNet50.yaml +41 -0
  88. paddlex/configs/modules/image_classification/ResNet50_vd.yaml +41 -0
  89. paddlex/configs/modules/image_classification/StarNet-S1.yaml +41 -0
  90. paddlex/configs/modules/image_classification/StarNet-S2.yaml +41 -0
  91. paddlex/configs/modules/image_classification/StarNet-S3.yaml +41 -0
  92. paddlex/configs/modules/image_classification/StarNet-S4.yaml +41 -0
  93. paddlex/configs/modules/image_classification/SwinTransformer_base_patch4_window12_384.yaml +41 -0
  94. paddlex/configs/modules/image_classification/SwinTransformer_base_patch4_window7_224.yaml +41 -0
  95. paddlex/configs/modules/image_classification/SwinTransformer_large_patch4_window12_384.yaml +41 -0
  96. paddlex/configs/modules/image_classification/SwinTransformer_large_patch4_window7_224.yaml +41 -0
  97. paddlex/configs/modules/image_classification/SwinTransformer_small_patch4_window7_224.yaml +41 -0
  98. paddlex/configs/modules/image_classification/SwinTransformer_tiny_patch4_window7_224.yaml +41 -0
  99. paddlex/configs/modules/image_feature/PP-ShiTuV2_rec.yaml +42 -0
  100. paddlex/configs/modules/image_feature/PP-ShiTuV2_rec_CLIP_vit_base.yaml +42 -0
  101. paddlex/configs/modules/image_feature/PP-ShiTuV2_rec_CLIP_vit_large.yaml +41 -0
  102. paddlex/configs/modules/image_multilabel_classification/CLIP_vit_base_patch16_448_ML.yaml +41 -0
  103. paddlex/configs/modules/image_multilabel_classification/PP-HGNetV2-B0_ML.yaml +41 -0
  104. paddlex/configs/modules/image_multilabel_classification/PP-HGNetV2-B4_ML.yaml +41 -0
  105. paddlex/configs/modules/image_multilabel_classification/PP-HGNetV2-B6_ML.yaml +41 -0
  106. paddlex/configs/modules/image_multilabel_classification/PP-LCNet_x1_0_ML.yaml +41 -0
  107. paddlex/configs/modules/image_multilabel_classification/ResNet50_ML.yaml +41 -0
  108. paddlex/configs/modules/image_unwarping/UVDoc.yaml +12 -0
  109. paddlex/configs/modules/instance_segmentation/Cascade-MaskRCNN-ResNet50-FPN.yaml +40 -0
  110. paddlex/configs/modules/instance_segmentation/Cascade-MaskRCNN-ResNet50-vd-SSLDv2-FPN.yaml +40 -0
  111. paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-H.yaml +40 -0
  112. paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-L.yaml +40 -0
  113. paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-M.yaml +40 -0
  114. paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-S.yaml +40 -0
  115. paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-X.yaml +40 -0
  116. paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNeXt101-vd-FPN.yaml +39 -0
  117. paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet101-FPN.yaml +40 -0
  118. paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet101-vd-FPN.yaml +40 -0
  119. paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet50-FPN.yaml +40 -0
  120. paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet50-vd-FPN.yaml +40 -0
  121. paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet50.yaml +40 -0
  122. paddlex/configs/modules/instance_segmentation/PP-YOLOE_seg-S.yaml +40 -0
  123. paddlex/configs/modules/instance_segmentation/SOLOv2.yaml +40 -0
  124. paddlex/configs/modules/keypoint_detection/PP-TinyPose_128x96.yaml +40 -0
  125. paddlex/configs/modules/keypoint_detection/PP-TinyPose_256x192.yaml +40 -0
  126. paddlex/configs/modules/layout_detection/PP-DocLayout-L.yaml +40 -0
  127. paddlex/configs/modules/layout_detection/PP-DocLayout-M.yaml +40 -0
  128. paddlex/configs/modules/layout_detection/PP-DocLayout-S.yaml +40 -0
  129. paddlex/configs/modules/layout_detection/PicoDet-L_layout_17cls.yaml +40 -0
  130. paddlex/configs/modules/layout_detection/PicoDet-L_layout_3cls.yaml +40 -0
  131. paddlex/configs/modules/layout_detection/PicoDet-S_layout_17cls.yaml +40 -0
  132. paddlex/configs/modules/layout_detection/PicoDet-S_layout_3cls.yaml +40 -0
  133. paddlex/configs/modules/layout_detection/PicoDet_layout_1x.yaml +40 -0
  134. paddlex/configs/modules/layout_detection/PicoDet_layout_1x_table.yaml +40 -0
  135. paddlex/configs/modules/layout_detection/RT-DETR-H_layout_17cls.yaml +40 -0
  136. paddlex/configs/modules/layout_detection/RT-DETR-H_layout_3cls.yaml +40 -0
  137. paddlex/configs/modules/mainbody_detection/PP-ShiTuV2_det.yaml +41 -0
  138. paddlex/configs/modules/multilingual_speech_recognition/whisper_base.yaml +12 -0
  139. paddlex/configs/modules/multilingual_speech_recognition/whisper_large.yaml +12 -0
  140. paddlex/configs/modules/multilingual_speech_recognition/whisper_medium.yaml +12 -0
  141. paddlex/configs/modules/multilingual_speech_recognition/whisper_small.yaml +12 -0
  142. paddlex/configs/modules/multilingual_speech_recognition/whisper_tiny.yaml +12 -0
  143. paddlex/configs/modules/object_detection/Cascade-FasterRCNN-ResNet50-FPN.yaml +41 -0
  144. paddlex/configs/modules/object_detection/Cascade-FasterRCNN-ResNet50-vd-SSLDv2-FPN.yaml +42 -0
  145. paddlex/configs/modules/object_detection/CenterNet-DLA-34.yaml +41 -0
  146. paddlex/configs/modules/object_detection/CenterNet-ResNet50.yaml +41 -0
  147. paddlex/configs/modules/object_detection/Co-DINO-R50.yaml +40 -0
  148. paddlex/configs/modules/object_detection/Co-DINO-Swin-L.yaml +40 -0
  149. paddlex/configs/modules/object_detection/Co-Deformable-DETR-R50.yaml +40 -0
  150. paddlex/configs/modules/object_detection/Co-Deformable-DETR-Swin-T.yaml +40 -0
  151. paddlex/configs/modules/object_detection/DETR-R50.yaml +42 -0
  152. paddlex/configs/modules/object_detection/FCOS-ResNet50.yaml +41 -0
  153. paddlex/configs/modules/object_detection/FasterRCNN-ResNeXt101-vd-FPN.yaml +42 -0
  154. paddlex/configs/modules/object_detection/FasterRCNN-ResNet101-FPN.yaml +42 -0
  155. paddlex/configs/modules/object_detection/FasterRCNN-ResNet101.yaml +42 -0
  156. paddlex/configs/modules/object_detection/FasterRCNN-ResNet34-FPN.yaml +42 -0
  157. paddlex/configs/modules/object_detection/FasterRCNN-ResNet50-FPN.yaml +42 -0
  158. paddlex/configs/modules/object_detection/FasterRCNN-ResNet50-vd-FPN.yaml +42 -0
  159. paddlex/configs/modules/object_detection/FasterRCNN-ResNet50-vd-SSLDv2-FPN.yaml +42 -0
  160. paddlex/configs/modules/object_detection/FasterRCNN-ResNet50.yaml +42 -0
  161. paddlex/configs/modules/object_detection/FasterRCNN-Swin-Tiny-FPN.yaml +42 -0
  162. paddlex/configs/modules/object_detection/PP-YOLOE_plus-L.yaml +40 -0
  163. paddlex/configs/modules/object_detection/PP-YOLOE_plus-M.yaml +40 -0
  164. paddlex/configs/modules/object_detection/PP-YOLOE_plus-S.yaml +40 -0
  165. paddlex/configs/modules/object_detection/PP-YOLOE_plus-X.yaml +40 -0
  166. paddlex/configs/modules/object_detection/PicoDet-L.yaml +40 -0
  167. paddlex/configs/modules/object_detection/PicoDet-M.yaml +42 -0
  168. paddlex/configs/modules/object_detection/PicoDet-S.yaml +40 -0
  169. paddlex/configs/modules/object_detection/PicoDet-XS.yaml +42 -0
  170. paddlex/configs/modules/object_detection/RT-DETR-H.yaml +40 -0
  171. paddlex/configs/modules/object_detection/RT-DETR-L.yaml +40 -0
  172. paddlex/configs/modules/object_detection/RT-DETR-R18.yaml +40 -0
  173. paddlex/configs/modules/object_detection/RT-DETR-R50.yaml +40 -0
  174. paddlex/configs/modules/object_detection/RT-DETR-X.yaml +40 -0
  175. paddlex/configs/modules/object_detection/YOLOX-L.yaml +40 -0
  176. paddlex/configs/modules/object_detection/YOLOX-M.yaml +40 -0
  177. paddlex/configs/modules/object_detection/YOLOX-N.yaml +40 -0
  178. paddlex/configs/modules/object_detection/YOLOX-S.yaml +40 -0
  179. paddlex/configs/modules/object_detection/YOLOX-T.yaml +40 -0
  180. paddlex/configs/modules/object_detection/YOLOX-X.yaml +40 -0
  181. paddlex/configs/modules/object_detection/YOLOv3-DarkNet53.yaml +40 -0
  182. paddlex/configs/modules/object_detection/YOLOv3-MobileNetV3.yaml +40 -0
  183. paddlex/configs/modules/object_detection/YOLOv3-ResNet50_vd_DCN.yaml +40 -0
  184. paddlex/configs/modules/open_vocabulary_detection/GroundingDINO-T.yaml +13 -0
  185. paddlex/configs/modules/open_vocabulary_segmentation/SAM-H_box.yaml +17 -0
  186. paddlex/configs/modules/open_vocabulary_segmentation/SAM-H_point.yaml +15 -0
  187. paddlex/configs/modules/pedestrian_attribute_recognition/PP-LCNet_x1_0_pedestrian_attribute.yaml +41 -0
  188. paddlex/configs/modules/rotated_object_detection/PP-YOLOE-R-L.yaml +40 -0
  189. paddlex/configs/modules/seal_text_detection/PP-OCRv4_mobile_seal_det.yaml +40 -0
  190. paddlex/configs/modules/seal_text_detection/PP-OCRv4_server_seal_det.yaml +40 -0
  191. paddlex/configs/modules/semantic_segmentation/Deeplabv3-R101.yaml +40 -0
  192. paddlex/configs/modules/semantic_segmentation/Deeplabv3-R50.yaml +40 -0
  193. paddlex/configs/modules/semantic_segmentation/Deeplabv3_Plus-R101.yaml +40 -0
  194. paddlex/configs/modules/semantic_segmentation/Deeplabv3_Plus-R50.yaml +40 -0
  195. paddlex/configs/modules/semantic_segmentation/MaskFormer_small.yaml +42 -0
  196. paddlex/configs/modules/semantic_segmentation/MaskFormer_tiny.yaml +42 -0
  197. paddlex/configs/modules/semantic_segmentation/OCRNet_HRNet-W18.yaml +40 -0
  198. paddlex/configs/modules/semantic_segmentation/OCRNet_HRNet-W48.yaml +40 -0
  199. paddlex/configs/modules/semantic_segmentation/PP-LiteSeg-B.yaml +41 -0
  200. paddlex/configs/modules/semantic_segmentation/PP-LiteSeg-T.yaml +40 -0
  201. paddlex/configs/modules/semantic_segmentation/SeaFormer_base.yaml +40 -0
  202. paddlex/configs/modules/semantic_segmentation/SeaFormer_large.yaml +40 -0
  203. paddlex/configs/modules/semantic_segmentation/SeaFormer_small.yaml +40 -0
  204. paddlex/configs/modules/semantic_segmentation/SeaFormer_tiny.yaml +40 -0
  205. paddlex/configs/modules/semantic_segmentation/SegFormer-B0.yaml +40 -0
  206. paddlex/configs/modules/semantic_segmentation/SegFormer-B1.yaml +40 -0
  207. paddlex/configs/modules/semantic_segmentation/SegFormer-B2.yaml +40 -0
  208. paddlex/configs/modules/semantic_segmentation/SegFormer-B3.yaml +40 -0
  209. paddlex/configs/modules/semantic_segmentation/SegFormer-B4.yaml +40 -0
  210. paddlex/configs/modules/semantic_segmentation/SegFormer-B5.yaml +40 -0
  211. paddlex/configs/modules/small_object_detection/PP-YOLOE_plus_SOD-L.yaml +42 -0
  212. paddlex/configs/modules/small_object_detection/PP-YOLOE_plus_SOD-S.yaml +42 -0
  213. paddlex/configs/modules/small_object_detection/PP-YOLOE_plus_SOD-largesize-L.yaml +42 -0
  214. paddlex/configs/modules/table_cells_detection/RT-DETR-L_wired_table_cell_det.yaml +40 -0
  215. paddlex/configs/modules/table_cells_detection/RT-DETR-L_wireless_table_cell_det.yaml +40 -0
  216. paddlex/configs/modules/table_classification/PP-LCNet_x1_0_table_cls.yaml +41 -0
  217. paddlex/configs/modules/table_structure_recognition/SLANeXt_wired.yaml +39 -0
  218. paddlex/configs/modules/table_structure_recognition/SLANeXt_wireless.yaml +39 -0
  219. paddlex/configs/modules/table_structure_recognition/SLANet.yaml +39 -0
  220. paddlex/configs/modules/table_structure_recognition/SLANet_plus.yaml +39 -0
  221. paddlex/configs/modules/text_detection/PP-OCRv3_mobile_det.yaml +40 -0
  222. paddlex/configs/modules/text_detection/PP-OCRv3_server_det.yaml +40 -0
  223. paddlex/configs/modules/text_detection/PP-OCRv4_mobile_det.yaml +40 -0
  224. paddlex/configs/modules/text_detection/PP-OCRv4_server_det.yaml +40 -0
  225. paddlex/configs/modules/text_recognition/PP-OCRv3_mobile_rec.yaml +39 -0
  226. paddlex/configs/modules/text_recognition/PP-OCRv4_mobile_rec.yaml +39 -0
  227. paddlex/configs/modules/text_recognition/PP-OCRv4_server_rec.yaml +39 -0
  228. paddlex/configs/modules/text_recognition/PP-OCRv4_server_rec_doc.yaml +39 -0
  229. paddlex/configs/modules/text_recognition/arabic_PP-OCRv3_mobile_rec.yaml +39 -0
  230. paddlex/configs/modules/text_recognition/ch_RepSVTR_rec.yaml +39 -0
  231. paddlex/configs/modules/text_recognition/ch_SVTRv2_rec.yaml +39 -0
  232. paddlex/configs/modules/text_recognition/chinese_cht_PP-OCRv3_mobile_rec.yaml +39 -0
  233. paddlex/configs/modules/text_recognition/cyrillic_PP-OCRv3_mobile_rec.yaml +39 -0
  234. paddlex/configs/modules/text_recognition/devanagari_PP-OCRv3_mobile_rec.yaml +39 -0
  235. paddlex/configs/modules/text_recognition/en_PP-OCRv3_mobile_rec.yaml +39 -0
  236. paddlex/configs/modules/text_recognition/en_PP-OCRv4_mobile_rec.yaml +39 -0
  237. paddlex/configs/modules/text_recognition/japan_PP-OCRv3_mobile_rec.yaml +39 -0
  238. paddlex/configs/modules/text_recognition/ka_PP-OCRv3_mobile_rec.yaml +39 -0
  239. paddlex/configs/modules/text_recognition/korean_PP-OCRv3_mobile_rec.yaml +39 -0
  240. paddlex/configs/modules/text_recognition/latin_PP-OCRv3_mobile_rec.yaml +39 -0
  241. paddlex/configs/modules/text_recognition/ta_PP-OCRv3_mobile_rec.yaml +39 -0
  242. paddlex/configs/modules/text_recognition/te_PP-OCRv3_mobile_rec.yaml +39 -0
  243. paddlex/configs/modules/textline_orientation/PP-LCNet_x0_25_textline_ori.yaml +41 -0
  244. paddlex/configs/modules/ts_anomaly_detection/AutoEncoder_ad.yaml +37 -0
  245. paddlex/configs/modules/ts_anomaly_detection/DLinear_ad.yaml +37 -0
  246. paddlex/configs/modules/ts_anomaly_detection/Nonstationary_ad.yaml +37 -0
  247. paddlex/configs/modules/ts_anomaly_detection/PatchTST_ad.yaml +37 -0
  248. paddlex/configs/modules/ts_anomaly_detection/TimesNet_ad.yaml +37 -0
  249. paddlex/configs/modules/ts_classification/TimesNet_cls.yaml +37 -0
  250. paddlex/configs/modules/ts_forecast/DLinear.yaml +38 -0
  251. paddlex/configs/modules/ts_forecast/NLinear.yaml +38 -0
  252. paddlex/configs/modules/ts_forecast/Nonstationary.yaml +38 -0
  253. paddlex/configs/modules/ts_forecast/PatchTST.yaml +38 -0
  254. paddlex/configs/modules/ts_forecast/RLinear.yaml +38 -0
  255. paddlex/configs/modules/ts_forecast/TiDE.yaml +38 -0
  256. paddlex/configs/modules/ts_forecast/TimesNet.yaml +38 -0
  257. paddlex/configs/modules/vehicle_attribute_recognition/PP-LCNet_x1_0_vehicle_attribute.yaml +41 -0
  258. paddlex/configs/modules/vehicle_detection/PP-YOLOE-L_vehicle.yaml +41 -0
  259. paddlex/configs/modules/vehicle_detection/PP-YOLOE-S_vehicle.yaml +42 -0
  260. paddlex/configs/modules/video_classification/PP-TSM-R50_8frames_uniform.yaml +42 -0
  261. paddlex/configs/modules/video_classification/PP-TSMv2-LCNetV2_16frames_uniform.yaml +42 -0
  262. paddlex/configs/modules/video_classification/PP-TSMv2-LCNetV2_8frames_uniform.yaml +42 -0
  263. paddlex/configs/modules/video_detection/YOWO.yaml +40 -0
  264. paddlex/configs/pipelines/3d_bev_detection.yaml +9 -0
  265. paddlex/configs/pipelines/OCR.yaml +44 -0
  266. paddlex/configs/pipelines/PP-ChatOCRv3-doc.yaml +149 -0
  267. paddlex/configs/pipelines/PP-ChatOCRv4-doc.yaml +184 -0
  268. paddlex/configs/pipelines/PP-ShiTuV2.yaml +18 -0
  269. paddlex/configs/pipelines/PP-StructureV3.yaml +226 -0
  270. paddlex/configs/pipelines/anomaly_detection.yaml +8 -0
  271. paddlex/configs/pipelines/doc_preprocessor.yaml +15 -0
  272. paddlex/configs/pipelines/face_recognition.yaml +18 -0
  273. paddlex/configs/pipelines/formula_recognition.yaml +39 -0
  274. paddlex/configs/pipelines/human_keypoint_detection.yaml +17 -0
  275. paddlex/configs/pipelines/image_classification.yaml +10 -0
  276. paddlex/configs/pipelines/image_multilabel_classification.yaml +9 -0
  277. paddlex/configs/pipelines/instance_segmentation.yaml +10 -0
  278. paddlex/configs/pipelines/layout_parsing.yaml +101 -0
  279. paddlex/configs/pipelines/multilingual_speech_recognition.yaml +9 -0
  280. paddlex/configs/pipelines/object_detection.yaml +10 -0
  281. paddlex/configs/pipelines/open_vocabulary_detection.yaml +12 -0
  282. paddlex/configs/pipelines/open_vocabulary_segmentation.yaml +13 -0
  283. paddlex/configs/pipelines/pedestrian_attribute_recognition.yaml +15 -0
  284. paddlex/configs/pipelines/rotated_object_detection.yaml +10 -0
  285. paddlex/configs/pipelines/seal_recognition.yaml +51 -0
  286. paddlex/configs/pipelines/semantic_segmentation.yaml +10 -0
  287. paddlex/configs/pipelines/small_object_detection.yaml +10 -0
  288. paddlex/configs/pipelines/table_recognition.yaml +56 -0
  289. paddlex/configs/pipelines/table_recognition_v2.yaml +76 -0
  290. paddlex/configs/pipelines/ts_anomaly_detection.yaml +8 -0
  291. paddlex/configs/pipelines/ts_classification.yaml +8 -0
  292. paddlex/configs/pipelines/ts_forecast.yaml +8 -0
  293. paddlex/configs/pipelines/vehicle_attribute_recognition.yaml +15 -0
  294. paddlex/configs/pipelines/video_classification.yaml +9 -0
  295. paddlex/configs/pipelines/video_detection.yaml +10 -0
  296. paddlex/engine.py +54 -0
  297. paddlex/hpip_links.html +19 -0
  298. paddlex/inference/__init__.py +19 -0
  299. paddlex/inference/common/__init__.py +13 -0
  300. paddlex/inference/common/batch_sampler/__init__.py +20 -0
  301. paddlex/inference/common/batch_sampler/audio_batch_sampler.py +84 -0
  302. paddlex/inference/common/batch_sampler/base_batch_sampler.py +90 -0
  303. paddlex/inference/common/batch_sampler/det_3d_batch_sampler.py +147 -0
  304. paddlex/inference/common/batch_sampler/image_batch_sampler.py +136 -0
  305. paddlex/inference/common/batch_sampler/ts_batch_sampler.py +110 -0
  306. paddlex/inference/common/batch_sampler/video_batch_sampler.py +94 -0
  307. paddlex/inference/common/reader/__init__.py +19 -0
  308. paddlex/inference/common/reader/audio_reader.py +46 -0
  309. paddlex/inference/common/reader/det_3d_reader.py +239 -0
  310. paddlex/inference/common/reader/image_reader.py +69 -0
  311. paddlex/inference/common/reader/ts_reader.py +45 -0
  312. paddlex/inference/common/reader/video_reader.py +42 -0
  313. paddlex/inference/common/result/__init__.py +29 -0
  314. paddlex/inference/common/result/base_cv_result.py +31 -0
  315. paddlex/inference/common/result/base_result.py +70 -0
  316. paddlex/inference/common/result/base_ts_result.py +42 -0
  317. paddlex/inference/common/result/base_video_result.py +36 -0
  318. paddlex/inference/common/result/mixin.py +703 -0
  319. paddlex/inference/models/3d_bev_detection/__init__.py +15 -0
  320. paddlex/inference/models/3d_bev_detection/predictor.py +314 -0
  321. paddlex/inference/models/3d_bev_detection/processors.py +978 -0
  322. paddlex/inference/models/3d_bev_detection/result.py +65 -0
  323. paddlex/inference/models/3d_bev_detection/visualizer_3d.py +131 -0
  324. paddlex/inference/models/__init__.py +130 -0
  325. paddlex/inference/models/anomaly_detection/__init__.py +15 -0
  326. paddlex/inference/models/anomaly_detection/predictor.py +145 -0
  327. paddlex/inference/models/anomaly_detection/processors.py +46 -0
  328. paddlex/inference/models/anomaly_detection/result.py +70 -0
  329. paddlex/inference/models/base/__init__.py +15 -0
  330. paddlex/inference/models/base/predictor/__init__.py +16 -0
  331. paddlex/inference/models/base/predictor/base_predictor.py +175 -0
  332. paddlex/inference/models/base/predictor/basic_predictor.py +139 -0
  333. paddlex/inference/models/common/__init__.py +35 -0
  334. paddlex/inference/models/common/static_infer.py +329 -0
  335. paddlex/inference/models/common/tokenizer/__init__.py +17 -0
  336. paddlex/inference/models/common/tokenizer/bert_tokenizer.py +655 -0
  337. paddlex/inference/models/common/tokenizer/gpt_tokenizer.py +451 -0
  338. paddlex/inference/models/common/tokenizer/tokenizer_utils.py +2141 -0
  339. paddlex/inference/models/common/tokenizer/tokenizer_utils_base.py +3504 -0
  340. paddlex/inference/models/common/tokenizer/utils.py +66 -0
  341. paddlex/inference/models/common/tokenizer/vocab.py +647 -0
  342. paddlex/inference/models/common/ts/__init__.py +15 -0
  343. paddlex/inference/models/common/ts/funcs.py +533 -0
  344. paddlex/inference/models/common/ts/processors.py +313 -0
  345. paddlex/inference/models/common/vision/__init__.py +23 -0
  346. paddlex/inference/models/common/vision/funcs.py +93 -0
  347. paddlex/inference/models/common/vision/processors.py +270 -0
  348. paddlex/inference/models/face_feature/__init__.py +15 -0
  349. paddlex/inference/models/face_feature/predictor.py +65 -0
  350. paddlex/inference/models/formula_recognition/__init__.py +15 -0
  351. paddlex/inference/models/formula_recognition/predictor.py +203 -0
  352. paddlex/inference/models/formula_recognition/processors.py +986 -0
  353. paddlex/inference/models/formula_recognition/result.py +403 -0
  354. paddlex/inference/models/image_classification/__init__.py +15 -0
  355. paddlex/inference/models/image_classification/predictor.py +182 -0
  356. paddlex/inference/models/image_classification/processors.py +87 -0
  357. paddlex/inference/models/image_classification/result.py +92 -0
  358. paddlex/inference/models/image_feature/__init__.py +15 -0
  359. paddlex/inference/models/image_feature/predictor.py +156 -0
  360. paddlex/inference/models/image_feature/processors.py +29 -0
  361. paddlex/inference/models/image_feature/result.py +33 -0
  362. paddlex/inference/models/image_multilabel_classification/__init__.py +15 -0
  363. paddlex/inference/models/image_multilabel_classification/predictor.py +94 -0
  364. paddlex/inference/models/image_multilabel_classification/processors.py +85 -0
  365. paddlex/inference/models/image_multilabel_classification/result.py +95 -0
  366. paddlex/inference/models/image_unwarping/__init__.py +15 -0
  367. paddlex/inference/models/image_unwarping/predictor.py +105 -0
  368. paddlex/inference/models/image_unwarping/processors.py +88 -0
  369. paddlex/inference/models/image_unwarping/result.py +45 -0
  370. paddlex/inference/models/instance_segmentation/__init__.py +15 -0
  371. paddlex/inference/models/instance_segmentation/predictor.py +210 -0
  372. paddlex/inference/models/instance_segmentation/processors.py +105 -0
  373. paddlex/inference/models/instance_segmentation/result.py +161 -0
  374. paddlex/inference/models/keypoint_detection/__init__.py +15 -0
  375. paddlex/inference/models/keypoint_detection/predictor.py +188 -0
  376. paddlex/inference/models/keypoint_detection/processors.py +359 -0
  377. paddlex/inference/models/keypoint_detection/result.py +192 -0
  378. paddlex/inference/models/multilingual_speech_recognition/__init__.py +15 -0
  379. paddlex/inference/models/multilingual_speech_recognition/predictor.py +141 -0
  380. paddlex/inference/models/multilingual_speech_recognition/processors.py +1941 -0
  381. paddlex/inference/models/multilingual_speech_recognition/result.py +21 -0
  382. paddlex/inference/models/object_detection/__init__.py +15 -0
  383. paddlex/inference/models/object_detection/predictor.py +348 -0
  384. paddlex/inference/models/object_detection/processors.py +855 -0
  385. paddlex/inference/models/object_detection/result.py +113 -0
  386. paddlex/inference/models/object_detection/utils.py +68 -0
  387. paddlex/inference/models/open_vocabulary_detection/__init__.py +15 -0
  388. paddlex/inference/models/open_vocabulary_detection/predictor.py +155 -0
  389. paddlex/inference/models/open_vocabulary_detection/processors/__init__.py +15 -0
  390. paddlex/inference/models/open_vocabulary_detection/processors/groundingdino_processors.py +485 -0
  391. paddlex/inference/models/open_vocabulary_segmentation/__init__.py +15 -0
  392. paddlex/inference/models/open_vocabulary_segmentation/predictor.py +120 -0
  393. paddlex/inference/models/open_vocabulary_segmentation/processors/__init__.py +15 -0
  394. paddlex/inference/models/open_vocabulary_segmentation/processors/sam_processer.py +249 -0
  395. paddlex/inference/models/open_vocabulary_segmentation/results/__init__.py +15 -0
  396. paddlex/inference/models/open_vocabulary_segmentation/results/sam_result.py +147 -0
  397. paddlex/inference/models/semantic_segmentation/__init__.py +15 -0
  398. paddlex/inference/models/semantic_segmentation/predictor.py +167 -0
  399. paddlex/inference/models/semantic_segmentation/processors.py +114 -0
  400. paddlex/inference/models/semantic_segmentation/result.py +72 -0
  401. paddlex/inference/models/table_structure_recognition/__init__.py +15 -0
  402. paddlex/inference/models/table_structure_recognition/predictor.py +171 -0
  403. paddlex/inference/models/table_structure_recognition/processors.py +235 -0
  404. paddlex/inference/models/table_structure_recognition/result.py +70 -0
  405. paddlex/inference/models/text_detection/__init__.py +15 -0
  406. paddlex/inference/models/text_detection/predictor.py +191 -0
  407. paddlex/inference/models/text_detection/processors.py +466 -0
  408. paddlex/inference/models/text_detection/result.py +51 -0
  409. paddlex/inference/models/text_recognition/__init__.py +15 -0
  410. paddlex/inference/models/text_recognition/predictor.py +106 -0
  411. paddlex/inference/models/text_recognition/processors.py +231 -0
  412. paddlex/inference/models/text_recognition/result.py +75 -0
  413. paddlex/inference/models/ts_anomaly_detection/__init__.py +15 -0
  414. paddlex/inference/models/ts_anomaly_detection/predictor.py +146 -0
  415. paddlex/inference/models/ts_anomaly_detection/processors.py +94 -0
  416. paddlex/inference/models/ts_anomaly_detection/result.py +72 -0
  417. paddlex/inference/models/ts_classification/__init__.py +15 -0
  418. paddlex/inference/models/ts_classification/predictor.py +135 -0
  419. paddlex/inference/models/ts_classification/processors.py +117 -0
  420. paddlex/inference/models/ts_classification/result.py +78 -0
  421. paddlex/inference/models/ts_forecasting/__init__.py +15 -0
  422. paddlex/inference/models/ts_forecasting/predictor.py +159 -0
  423. paddlex/inference/models/ts_forecasting/processors.py +149 -0
  424. paddlex/inference/models/ts_forecasting/result.py +83 -0
  425. paddlex/inference/models/video_classification/__init__.py +15 -0
  426. paddlex/inference/models/video_classification/predictor.py +147 -0
  427. paddlex/inference/models/video_classification/processors.py +409 -0
  428. paddlex/inference/models/video_classification/result.py +92 -0
  429. paddlex/inference/models/video_detection/__init__.py +15 -0
  430. paddlex/inference/models/video_detection/predictor.py +136 -0
  431. paddlex/inference/models/video_detection/processors.py +450 -0
  432. paddlex/inference/models/video_detection/result.py +104 -0
  433. paddlex/inference/pipelines/3d_bev_detection/__init__.py +15 -0
  434. paddlex/inference/pipelines/3d_bev_detection/pipeline.py +67 -0
  435. paddlex/inference/pipelines/__init__.py +228 -0
  436. paddlex/inference/pipelines/anomaly_detection/__init__.py +15 -0
  437. paddlex/inference/pipelines/anomaly_detection/pipeline.py +62 -0
  438. paddlex/inference/pipelines/attribute_recognition/__init__.py +15 -0
  439. paddlex/inference/pipelines/attribute_recognition/pipeline.py +105 -0
  440. paddlex/inference/pipelines/attribute_recognition/result.py +100 -0
  441. paddlex/inference/pipelines/base.py +132 -0
  442. paddlex/inference/pipelines/components/__init__.py +23 -0
  443. paddlex/inference/pipelines/components/chat_server/__init__.py +16 -0
  444. paddlex/inference/pipelines/components/chat_server/base.py +39 -0
  445. paddlex/inference/pipelines/components/chat_server/openai_bot_chat.py +236 -0
  446. paddlex/inference/pipelines/components/common/__init__.py +18 -0
  447. paddlex/inference/pipelines/components/common/base_operator.py +36 -0
  448. paddlex/inference/pipelines/components/common/base_result.py +65 -0
  449. paddlex/inference/pipelines/components/common/convert_points_and_boxes.py +46 -0
  450. paddlex/inference/pipelines/components/common/crop_image_regions.py +550 -0
  451. paddlex/inference/pipelines/components/common/seal_det_warp.py +941 -0
  452. paddlex/inference/pipelines/components/common/sort_boxes.py +83 -0
  453. paddlex/inference/pipelines/components/faisser.py +352 -0
  454. paddlex/inference/pipelines/components/prompt_engineering/__init__.py +16 -0
  455. paddlex/inference/pipelines/components/prompt_engineering/base.py +35 -0
  456. paddlex/inference/pipelines/components/prompt_engineering/generate_ensemble_prompt.py +127 -0
  457. paddlex/inference/pipelines/components/prompt_engineering/generate_kie_prompt.py +148 -0
  458. paddlex/inference/pipelines/components/retriever/__init__.py +16 -0
  459. paddlex/inference/pipelines/components/retriever/base.py +226 -0
  460. paddlex/inference/pipelines/components/retriever/openai_bot_retriever.py +70 -0
  461. paddlex/inference/pipelines/components/retriever/qianfan_bot_retriever.py +163 -0
  462. paddlex/inference/pipelines/components/utils/__init__.py +13 -0
  463. paddlex/inference/pipelines/components/utils/mixin.py +206 -0
  464. paddlex/inference/pipelines/doc_preprocessor/__init__.py +15 -0
  465. paddlex/inference/pipelines/doc_preprocessor/pipeline.py +190 -0
  466. paddlex/inference/pipelines/doc_preprocessor/result.py +103 -0
  467. paddlex/inference/pipelines/face_recognition/__init__.py +15 -0
  468. paddlex/inference/pipelines/face_recognition/pipeline.py +61 -0
  469. paddlex/inference/pipelines/face_recognition/result.py +43 -0
  470. paddlex/inference/pipelines/formula_recognition/__init__.py +15 -0
  471. paddlex/inference/pipelines/formula_recognition/pipeline.py +303 -0
  472. paddlex/inference/pipelines/formula_recognition/result.py +291 -0
  473. paddlex/inference/pipelines/image_classification/__init__.py +15 -0
  474. paddlex/inference/pipelines/image_classification/pipeline.py +71 -0
  475. paddlex/inference/pipelines/image_multilabel_classification/__init__.py +15 -0
  476. paddlex/inference/pipelines/image_multilabel_classification/pipeline.py +78 -0
  477. paddlex/inference/pipelines/instance_segmentation/__init__.py +15 -0
  478. paddlex/inference/pipelines/instance_segmentation/pipeline.py +70 -0
  479. paddlex/inference/pipelines/keypoint_detection/__init__.py +15 -0
  480. paddlex/inference/pipelines/keypoint_detection/pipeline.py +137 -0
  481. paddlex/inference/pipelines/layout_parsing/__init__.py +16 -0
  482. paddlex/inference/pipelines/layout_parsing/pipeline.py +570 -0
  483. paddlex/inference/pipelines/layout_parsing/pipeline_v2.py +739 -0
  484. paddlex/inference/pipelines/layout_parsing/result.py +203 -0
  485. paddlex/inference/pipelines/layout_parsing/result_v2.py +470 -0
  486. paddlex/inference/pipelines/layout_parsing/utils.py +2385 -0
  487. paddlex/inference/pipelines/multilingual_speech_recognition/__init__.py +15 -0
  488. paddlex/inference/pipelines/multilingual_speech_recognition/pipeline.py +67 -0
  489. paddlex/inference/pipelines/object_detection/__init__.py +15 -0
  490. paddlex/inference/pipelines/object_detection/pipeline.py +95 -0
  491. paddlex/inference/pipelines/ocr/__init__.py +15 -0
  492. paddlex/inference/pipelines/ocr/pipeline.py +389 -0
  493. paddlex/inference/pipelines/ocr/result.py +248 -0
  494. paddlex/inference/pipelines/open_vocabulary_detection/__init__.py +15 -0
  495. paddlex/inference/pipelines/open_vocabulary_detection/pipeline.py +75 -0
  496. paddlex/inference/pipelines/open_vocabulary_segmentation/__init__.py +15 -0
  497. paddlex/inference/pipelines/open_vocabulary_segmentation/pipeline.py +89 -0
  498. paddlex/inference/pipelines/pp_chatocr/__init__.py +16 -0
  499. paddlex/inference/pipelines/pp_chatocr/pipeline_base.py +102 -0
  500. paddlex/inference/pipelines/pp_chatocr/pipeline_v3.py +773 -0
  501. paddlex/inference/pipelines/pp_chatocr/pipeline_v4.py +977 -0
  502. paddlex/inference/pipelines/pp_shitu_v2/__init__.py +15 -0
  503. paddlex/inference/pipelines/pp_shitu_v2/pipeline.py +152 -0
  504. paddlex/inference/pipelines/pp_shitu_v2/result.py +126 -0
  505. paddlex/inference/pipelines/rotated_object_detection/__init__.py +15 -0
  506. paddlex/inference/pipelines/rotated_object_detection/pipeline.py +74 -0
  507. paddlex/inference/pipelines/seal_recognition/__init__.py +15 -0
  508. paddlex/inference/pipelines/seal_recognition/pipeline.py +271 -0
  509. paddlex/inference/pipelines/seal_recognition/result.py +87 -0
  510. paddlex/inference/pipelines/semantic_segmentation/__init__.py +15 -0
  511. paddlex/inference/pipelines/semantic_segmentation/pipeline.py +74 -0
  512. paddlex/inference/pipelines/small_object_detection/__init__.py +15 -0
  513. paddlex/inference/pipelines/small_object_detection/pipeline.py +74 -0
  514. paddlex/inference/pipelines/table_recognition/__init__.py +16 -0
  515. paddlex/inference/pipelines/table_recognition/pipeline.py +462 -0
  516. paddlex/inference/pipelines/table_recognition/pipeline_v2.py +792 -0
  517. paddlex/inference/pipelines/table_recognition/result.py +216 -0
  518. paddlex/inference/pipelines/table_recognition/table_recognition_post_processing.py +362 -0
  519. paddlex/inference/pipelines/table_recognition/table_recognition_post_processing_v2.py +470 -0
  520. paddlex/inference/pipelines/table_recognition/utils.py +44 -0
  521. paddlex/inference/pipelines/ts_anomaly_detection/__init__.py +15 -0
  522. paddlex/inference/pipelines/ts_anomaly_detection/pipeline.py +62 -0
  523. paddlex/inference/pipelines/ts_classification/__init__.py +15 -0
  524. paddlex/inference/pipelines/ts_classification/pipeline.py +62 -0
  525. paddlex/inference/pipelines/ts_forecasting/__init__.py +15 -0
  526. paddlex/inference/pipelines/ts_forecasting/pipeline.py +62 -0
  527. paddlex/inference/pipelines/video_classification/__init__.py +15 -0
  528. paddlex/inference/pipelines/video_classification/pipeline.py +68 -0
  529. paddlex/inference/pipelines/video_detection/__init__.py +15 -0
  530. paddlex/inference/pipelines/video_detection/pipeline.py +73 -0
  531. paddlex/inference/serving/__init__.py +13 -0
  532. paddlex/inference/serving/basic_serving/__init__.py +18 -0
  533. paddlex/inference/serving/basic_serving/_app.py +209 -0
  534. paddlex/inference/serving/basic_serving/_pipeline_apps/__init__.py +41 -0
  535. paddlex/inference/serving/basic_serving/_pipeline_apps/_common/__init__.py +13 -0
  536. paddlex/inference/serving/basic_serving/_pipeline_apps/_common/common.py +96 -0
  537. paddlex/inference/serving/basic_serving/_pipeline_apps/_common/image_recognition.py +36 -0
  538. paddlex/inference/serving/basic_serving/_pipeline_apps/_common/ocr.py +90 -0
  539. paddlex/inference/serving/basic_serving/_pipeline_apps/anomaly_detection.py +64 -0
  540. paddlex/inference/serving/basic_serving/_pipeline_apps/doc_preprocessor.py +97 -0
  541. paddlex/inference/serving/basic_serving/_pipeline_apps/face_recognition.py +223 -0
  542. paddlex/inference/serving/basic_serving/_pipeline_apps/formula_recognition.py +97 -0
  543. paddlex/inference/serving/basic_serving/_pipeline_apps/human_keypoint_detection.py +78 -0
  544. paddlex/inference/serving/basic_serving/_pipeline_apps/image_classification.py +66 -0
  545. paddlex/inference/serving/basic_serving/_pipeline_apps/image_multilabel_classification.py +70 -0
  546. paddlex/inference/serving/basic_serving/_pipeline_apps/instance_segmentation.py +81 -0
  547. paddlex/inference/serving/basic_serving/_pipeline_apps/layout_parsing.py +115 -0
  548. paddlex/inference/serving/basic_serving/_pipeline_apps/m_3d_bev_detection.py +76 -0
  549. paddlex/inference/serving/basic_serving/_pipeline_apps/multilingual_speech_recognition.py +89 -0
  550. paddlex/inference/serving/basic_serving/_pipeline_apps/object_detection.py +74 -0
  551. paddlex/inference/serving/basic_serving/_pipeline_apps/ocr.py +99 -0
  552. paddlex/inference/serving/basic_serving/_pipeline_apps/open_vocabulary_detection.py +78 -0
  553. paddlex/inference/serving/basic_serving/_pipeline_apps/open_vocabulary_segmentation.py +85 -0
  554. paddlex/inference/serving/basic_serving/_pipeline_apps/pedestrian_attribute_recognition.py +81 -0
  555. paddlex/inference/serving/basic_serving/_pipeline_apps/pp_chatocrv3_doc.py +191 -0
  556. paddlex/inference/serving/basic_serving/_pipeline_apps/pp_chatocrv4_doc.py +221 -0
  557. paddlex/inference/serving/basic_serving/_pipeline_apps/pp_shituv2.py +218 -0
  558. paddlex/inference/serving/basic_serving/_pipeline_apps/pp_structurev3.py +136 -0
  559. paddlex/inference/serving/basic_serving/_pipeline_apps/rotated_object_detection.py +78 -0
  560. paddlex/inference/serving/basic_serving/_pipeline_apps/seal_recognition.py +103 -0
  561. paddlex/inference/serving/basic_serving/_pipeline_apps/semantic_segmentation.py +64 -0
  562. paddlex/inference/serving/basic_serving/_pipeline_apps/small_object_detection.py +69 -0
  563. paddlex/inference/serving/basic_serving/_pipeline_apps/table_recognition.py +105 -0
  564. paddlex/inference/serving/basic_serving/_pipeline_apps/table_recognition_v2.py +107 -0
  565. paddlex/inference/serving/basic_serving/_pipeline_apps/ts_anomaly_detection.py +62 -0
  566. paddlex/inference/serving/basic_serving/_pipeline_apps/ts_classification.py +61 -0
  567. paddlex/inference/serving/basic_serving/_pipeline_apps/ts_forecast.py +62 -0
  568. paddlex/inference/serving/basic_serving/_pipeline_apps/vehicle_attribute_recognition.py +81 -0
  569. paddlex/inference/serving/basic_serving/_pipeline_apps/video_classification.py +73 -0
  570. paddlex/inference/serving/basic_serving/_pipeline_apps/video_detection.py +89 -0
  571. paddlex/inference/serving/basic_serving/_server.py +35 -0
  572. paddlex/inference/serving/infra/__init__.py +13 -0
  573. paddlex/inference/serving/infra/config.py +36 -0
  574. paddlex/inference/serving/infra/models.py +72 -0
  575. paddlex/inference/serving/infra/storage.py +175 -0
  576. paddlex/inference/serving/infra/utils.py +259 -0
  577. paddlex/inference/serving/schemas/__init__.py +13 -0
  578. paddlex/inference/serving/schemas/anomaly_detection.py +39 -0
  579. paddlex/inference/serving/schemas/doc_preprocessor.py +54 -0
  580. paddlex/inference/serving/schemas/face_recognition.py +124 -0
  581. paddlex/inference/serving/schemas/formula_recognition.py +56 -0
  582. paddlex/inference/serving/schemas/human_keypoint_detection.py +55 -0
  583. paddlex/inference/serving/schemas/image_classification.py +45 -0
  584. paddlex/inference/serving/schemas/image_multilabel_classification.py +47 -0
  585. paddlex/inference/serving/schemas/instance_segmentation.py +53 -0
  586. paddlex/inference/serving/schemas/layout_parsing.py +72 -0
  587. paddlex/inference/serving/schemas/m_3d_bev_detection.py +48 -0
  588. paddlex/inference/serving/schemas/multilingual_speech_recognition.py +57 -0
  589. paddlex/inference/serving/schemas/object_detection.py +52 -0
  590. paddlex/inference/serving/schemas/ocr.py +60 -0
  591. paddlex/inference/serving/schemas/open_vocabulary_detection.py +52 -0
  592. paddlex/inference/serving/schemas/open_vocabulary_segmentation.py +52 -0
  593. paddlex/inference/serving/schemas/pedestrian_attribute_recognition.py +61 -0
  594. paddlex/inference/serving/schemas/pp_chatocrv3_doc.py +134 -0
  595. paddlex/inference/serving/schemas/pp_chatocrv4_doc.py +151 -0
  596. paddlex/inference/serving/schemas/pp_shituv2.py +124 -0
  597. paddlex/inference/serving/schemas/pp_structurev3.py +84 -0
  598. paddlex/inference/serving/schemas/rotated_object_detection.py +52 -0
  599. paddlex/inference/serving/schemas/seal_recognition.py +62 -0
  600. paddlex/inference/serving/schemas/semantic_segmentation.py +45 -0
  601. paddlex/inference/serving/schemas/shared/__init__.py +13 -0
  602. paddlex/inference/serving/schemas/shared/classification.py +23 -0
  603. paddlex/inference/serving/schemas/shared/image_segmentation.py +28 -0
  604. paddlex/inference/serving/schemas/shared/object_detection.py +24 -0
  605. paddlex/inference/serving/schemas/shared/ocr.py +25 -0
  606. paddlex/inference/serving/schemas/small_object_detection.py +52 -0
  607. paddlex/inference/serving/schemas/table_recognition.py +64 -0
  608. paddlex/inference/serving/schemas/table_recognition_v2.py +66 -0
  609. paddlex/inference/serving/schemas/ts_anomaly_detection.py +37 -0
  610. paddlex/inference/serving/schemas/ts_classification.py +38 -0
  611. paddlex/inference/serving/schemas/ts_forecast.py +37 -0
  612. paddlex/inference/serving/schemas/vehicle_attribute_recognition.py +61 -0
  613. paddlex/inference/serving/schemas/video_classification.py +44 -0
  614. paddlex/inference/serving/schemas/video_detection.py +56 -0
  615. paddlex/inference/utils/__init__.py +13 -0
  616. paddlex/inference/utils/benchmark.py +226 -0
  617. paddlex/inference/utils/color_map.py +123 -0
  618. paddlex/inference/utils/get_pipeline_path.py +27 -0
  619. paddlex/inference/utils/io/__init__.py +36 -0
  620. paddlex/inference/utils/io/readers.py +500 -0
  621. paddlex/inference/utils/io/style.py +374 -0
  622. paddlex/inference/utils/io/tablepyxl.py +149 -0
  623. paddlex/inference/utils/io/writers.py +459 -0
  624. paddlex/inference/utils/new_ir_blacklist.py +28 -0
  625. paddlex/inference/utils/official_models.py +352 -0
  626. paddlex/inference/utils/pp_option.py +256 -0
  627. paddlex/model.py +113 -0
  628. paddlex/modules/3d_bev_detection/__init__.py +18 -0
  629. paddlex/modules/3d_bev_detection/dataset_checker/__init__.py +95 -0
  630. paddlex/modules/3d_bev_detection/dataset_checker/dataset_src/__init__.py +17 -0
  631. paddlex/modules/3d_bev_detection/dataset_checker/dataset_src/analyse_dataset.py +106 -0
  632. paddlex/modules/3d_bev_detection/dataset_checker/dataset_src/check_dataset.py +102 -0
  633. paddlex/modules/3d_bev_detection/evaluator.py +46 -0
  634. paddlex/modules/3d_bev_detection/exportor.py +22 -0
  635. paddlex/modules/3d_bev_detection/model_list.py +18 -0
  636. paddlex/modules/3d_bev_detection/trainer.py +70 -0
  637. paddlex/modules/__init__.py +138 -0
  638. paddlex/modules/anomaly_detection/__init__.py +18 -0
  639. paddlex/modules/anomaly_detection/dataset_checker/__init__.py +95 -0
  640. paddlex/modules/anomaly_detection/dataset_checker/dataset_src/__init__.py +19 -0
  641. paddlex/modules/anomaly_detection/dataset_checker/dataset_src/analyse_dataset.py +79 -0
  642. paddlex/modules/anomaly_detection/dataset_checker/dataset_src/check_dataset.py +87 -0
  643. paddlex/modules/anomaly_detection/dataset_checker/dataset_src/convert_dataset.py +230 -0
  644. paddlex/modules/anomaly_detection/dataset_checker/dataset_src/split_dataset.py +87 -0
  645. paddlex/modules/anomaly_detection/dataset_checker/dataset_src/utils/__init__.py +13 -0
  646. paddlex/modules/anomaly_detection/dataset_checker/dataset_src/utils/visualizer.py +71 -0
  647. paddlex/modules/anomaly_detection/evaluator.py +58 -0
  648. paddlex/modules/anomaly_detection/exportor.py +22 -0
  649. paddlex/modules/anomaly_detection/model_list.py +16 -0
  650. paddlex/modules/anomaly_detection/trainer.py +71 -0
  651. paddlex/modules/base/__init__.py +18 -0
  652. paddlex/modules/base/build_model.py +34 -0
  653. paddlex/modules/base/dataset_checker/__init__.py +16 -0
  654. paddlex/modules/base/dataset_checker/dataset_checker.py +169 -0
  655. paddlex/modules/base/dataset_checker/utils.py +110 -0
  656. paddlex/modules/base/evaluator.py +170 -0
  657. paddlex/modules/base/exportor.py +146 -0
  658. paddlex/modules/base/trainer.py +134 -0
  659. paddlex/modules/face_recognition/__init__.py +18 -0
  660. paddlex/modules/face_recognition/dataset_checker/__init__.py +71 -0
  661. paddlex/modules/face_recognition/dataset_checker/dataset_src/__init__.py +16 -0
  662. paddlex/modules/face_recognition/dataset_checker/dataset_src/check_dataset.py +174 -0
  663. paddlex/modules/face_recognition/dataset_checker/dataset_src/utils/__init__.py +13 -0
  664. paddlex/modules/face_recognition/dataset_checker/dataset_src/utils/visualizer.py +156 -0
  665. paddlex/modules/face_recognition/evaluator.py +52 -0
  666. paddlex/modules/face_recognition/exportor.py +22 -0
  667. paddlex/modules/face_recognition/model_list.py +15 -0
  668. paddlex/modules/face_recognition/trainer.py +75 -0
  669. paddlex/modules/formula_recognition/__init__.py +18 -0
  670. paddlex/modules/formula_recognition/dataset_checker/__init__.py +113 -0
  671. paddlex/modules/formula_recognition/dataset_checker/dataset_src/__init__.py +19 -0
  672. paddlex/modules/formula_recognition/dataset_checker/dataset_src/analyse_dataset.py +157 -0
  673. paddlex/modules/formula_recognition/dataset_checker/dataset_src/check_dataset.py +80 -0
  674. paddlex/modules/formula_recognition/dataset_checker/dataset_src/convert_dataset.py +94 -0
  675. paddlex/modules/formula_recognition/dataset_checker/dataset_src/split_dataset.py +81 -0
  676. paddlex/modules/formula_recognition/evaluator.py +77 -0
  677. paddlex/modules/formula_recognition/exportor.py +22 -0
  678. paddlex/modules/formula_recognition/model_list.py +20 -0
  679. paddlex/modules/formula_recognition/trainer.py +121 -0
  680. paddlex/modules/general_recognition/__init__.py +18 -0
  681. paddlex/modules/general_recognition/dataset_checker/__init__.py +107 -0
  682. paddlex/modules/general_recognition/dataset_checker/dataset_src/__init__.py +19 -0
  683. paddlex/modules/general_recognition/dataset_checker/dataset_src/analyse_dataset.py +98 -0
  684. paddlex/modules/general_recognition/dataset_checker/dataset_src/check_dataset.py +100 -0
  685. paddlex/modules/general_recognition/dataset_checker/dataset_src/convert_dataset.py +99 -0
  686. paddlex/modules/general_recognition/dataset_checker/dataset_src/split_dataset.py +82 -0
  687. paddlex/modules/general_recognition/dataset_checker/dataset_src/utils/__init__.py +13 -0
  688. paddlex/modules/general_recognition/dataset_checker/dataset_src/utils/visualizer.py +150 -0
  689. paddlex/modules/general_recognition/evaluator.py +31 -0
  690. paddlex/modules/general_recognition/exportor.py +22 -0
  691. paddlex/modules/general_recognition/model_list.py +19 -0
  692. paddlex/modules/general_recognition/trainer.py +52 -0
  693. paddlex/modules/image_classification/__init__.py +18 -0
  694. paddlex/modules/image_classification/dataset_checker/__init__.py +104 -0
  695. paddlex/modules/image_classification/dataset_checker/dataset_src/__init__.py +19 -0
  696. paddlex/modules/image_classification/dataset_checker/dataset_src/analyse_dataset.py +93 -0
  697. paddlex/modules/image_classification/dataset_checker/dataset_src/check_dataset.py +131 -0
  698. paddlex/modules/image_classification/dataset_checker/dataset_src/convert_dataset.py +51 -0
  699. paddlex/modules/image_classification/dataset_checker/dataset_src/split_dataset.py +81 -0
  700. paddlex/modules/image_classification/dataset_checker/dataset_src/utils/__init__.py +13 -0
  701. paddlex/modules/image_classification/dataset_checker/dataset_src/utils/visualizer.py +156 -0
  702. paddlex/modules/image_classification/evaluator.py +43 -0
  703. paddlex/modules/image_classification/exportor.py +22 -0
  704. paddlex/modules/image_classification/model_list.py +99 -0
  705. paddlex/modules/image_classification/trainer.py +82 -0
  706. paddlex/modules/image_unwarping/__init__.py +13 -0
  707. paddlex/modules/image_unwarping/model_list.py +17 -0
  708. paddlex/modules/instance_segmentation/__init__.py +18 -0
  709. paddlex/modules/instance_segmentation/dataset_checker/__init__.py +108 -0
  710. paddlex/modules/instance_segmentation/dataset_checker/dataset_src/__init__.py +19 -0
  711. paddlex/modules/instance_segmentation/dataset_checker/dataset_src/analyse_dataset.py +78 -0
  712. paddlex/modules/instance_segmentation/dataset_checker/dataset_src/check_dataset.py +92 -0
  713. paddlex/modules/instance_segmentation/dataset_checker/dataset_src/convert_dataset.py +241 -0
  714. paddlex/modules/instance_segmentation/dataset_checker/dataset_src/split_dataset.py +119 -0
  715. paddlex/modules/instance_segmentation/dataset_checker/dataset_src/utils/__init__.py +13 -0
  716. paddlex/modules/instance_segmentation/dataset_checker/dataset_src/utils/visualizer.py +221 -0
  717. paddlex/modules/instance_segmentation/evaluator.py +32 -0
  718. paddlex/modules/instance_segmentation/exportor.py +22 -0
  719. paddlex/modules/instance_segmentation/model_list.py +33 -0
  720. paddlex/modules/instance_segmentation/trainer.py +31 -0
  721. paddlex/modules/keypoint_detection/__init__.py +18 -0
  722. paddlex/modules/keypoint_detection/dataset_checker/__init__.py +56 -0
  723. paddlex/modules/keypoint_detection/dataset_checker/dataset_src/__init__.py +15 -0
  724. paddlex/modules/keypoint_detection/dataset_checker/dataset_src/check_dataset.py +86 -0
  725. paddlex/modules/keypoint_detection/dataset_checker/dataset_src/utils/__init__.py +13 -0
  726. paddlex/modules/keypoint_detection/dataset_checker/dataset_src/utils/visualizer.py +119 -0
  727. paddlex/modules/keypoint_detection/evaluator.py +41 -0
  728. paddlex/modules/keypoint_detection/exportor.py +22 -0
  729. paddlex/modules/keypoint_detection/model_list.py +16 -0
  730. paddlex/modules/keypoint_detection/trainer.py +39 -0
  731. paddlex/modules/multilabel_classification/__init__.py +18 -0
  732. paddlex/modules/multilabel_classification/dataset_checker/__init__.py +106 -0
  733. paddlex/modules/multilabel_classification/dataset_checker/dataset_src/__init__.py +19 -0
  734. paddlex/modules/multilabel_classification/dataset_checker/dataset_src/analyse_dataset.py +95 -0
  735. paddlex/modules/multilabel_classification/dataset_checker/dataset_src/check_dataset.py +131 -0
  736. paddlex/modules/multilabel_classification/dataset_checker/dataset_src/convert_dataset.py +117 -0
  737. paddlex/modules/multilabel_classification/dataset_checker/dataset_src/split_dataset.py +81 -0
  738. paddlex/modules/multilabel_classification/dataset_checker/dataset_src/utils/__init__.py +13 -0
  739. paddlex/modules/multilabel_classification/dataset_checker/dataset_src/utils/visualizer.py +153 -0
  740. paddlex/modules/multilabel_classification/evaluator.py +43 -0
  741. paddlex/modules/multilabel_classification/exportor.py +22 -0
  742. paddlex/modules/multilabel_classification/model_list.py +24 -0
  743. paddlex/modules/multilabel_classification/trainer.py +85 -0
  744. paddlex/modules/multilingual_speech_recognition/__init__.py +18 -0
  745. paddlex/modules/multilingual_speech_recognition/dataset_checker.py +27 -0
  746. paddlex/modules/multilingual_speech_recognition/evaluator.py +27 -0
  747. paddlex/modules/multilingual_speech_recognition/exportor.py +27 -0
  748. paddlex/modules/multilingual_speech_recognition/model_list.py +22 -0
  749. paddlex/modules/multilingual_speech_recognition/trainer.py +40 -0
  750. paddlex/modules/object_detection/__init__.py +18 -0
  751. paddlex/modules/object_detection/dataset_checker/__init__.py +115 -0
  752. paddlex/modules/object_detection/dataset_checker/dataset_src/__init__.py +19 -0
  753. paddlex/modules/object_detection/dataset_checker/dataset_src/analyse_dataset.py +80 -0
  754. paddlex/modules/object_detection/dataset_checker/dataset_src/check_dataset.py +86 -0
  755. paddlex/modules/object_detection/dataset_checker/dataset_src/convert_dataset.py +433 -0
  756. paddlex/modules/object_detection/dataset_checker/dataset_src/split_dataset.py +119 -0
  757. paddlex/modules/object_detection/dataset_checker/dataset_src/utils/__init__.py +13 -0
  758. paddlex/modules/object_detection/dataset_checker/dataset_src/utils/visualizer.py +192 -0
  759. paddlex/modules/object_detection/evaluator.py +52 -0
  760. paddlex/modules/object_detection/exportor.py +22 -0
  761. paddlex/modules/object_detection/model_list.py +84 -0
  762. paddlex/modules/object_detection/trainer.py +99 -0
  763. paddlex/modules/open_vocabulary_detection/__init__.py +18 -0
  764. paddlex/modules/open_vocabulary_detection/dataset_checker.py +29 -0
  765. paddlex/modules/open_vocabulary_detection/evaluator.py +29 -0
  766. paddlex/modules/open_vocabulary_detection/exportor.py +29 -0
  767. paddlex/modules/open_vocabulary_detection/model_list.py +18 -0
  768. paddlex/modules/open_vocabulary_detection/trainer.py +42 -0
  769. paddlex/modules/open_vocabulary_segmentation/__init__.py +18 -0
  770. paddlex/modules/open_vocabulary_segmentation/dataset_checker.py +29 -0
  771. paddlex/modules/open_vocabulary_segmentation/evaluator.py +29 -0
  772. paddlex/modules/open_vocabulary_segmentation/exportor.py +29 -0
  773. paddlex/modules/open_vocabulary_segmentation/model_list.py +19 -0
  774. paddlex/modules/open_vocabulary_segmentation/trainer.py +42 -0
  775. paddlex/modules/semantic_segmentation/__init__.py +18 -0
  776. paddlex/modules/semantic_segmentation/dataset_checker/__init__.py +110 -0
  777. paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/__init__.py +19 -0
  778. paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/analyse_dataset.py +73 -0
  779. paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/check_dataset.py +80 -0
  780. paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/convert_dataset.py +162 -0
  781. paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/split_dataset.py +87 -0
  782. paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/utils/__init__.py +13 -0
  783. paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/utils/visualizer.py +71 -0
  784. paddlex/modules/semantic_segmentation/evaluator.py +58 -0
  785. paddlex/modules/semantic_segmentation/exportor.py +31 -0
  786. paddlex/modules/semantic_segmentation/model_list.py +37 -0
  787. paddlex/modules/semantic_segmentation/trainer.py +73 -0
  788. paddlex/modules/table_recognition/__init__.py +18 -0
  789. paddlex/modules/table_recognition/dataset_checker/__init__.py +98 -0
  790. paddlex/modules/table_recognition/dataset_checker/dataset_src/__init__.py +18 -0
  791. paddlex/modules/table_recognition/dataset_checker/dataset_src/analyse_dataset.py +58 -0
  792. paddlex/modules/table_recognition/dataset_checker/dataset_src/check_dataset.py +86 -0
  793. paddlex/modules/table_recognition/dataset_checker/dataset_src/split_dataset.py +79 -0
  794. paddlex/modules/table_recognition/evaluator.py +43 -0
  795. paddlex/modules/table_recognition/exportor.py +22 -0
  796. paddlex/modules/table_recognition/model_list.py +21 -0
  797. paddlex/modules/table_recognition/trainer.py +70 -0
  798. paddlex/modules/text_detection/__init__.py +18 -0
  799. paddlex/modules/text_detection/dataset_checker/__init__.py +109 -0
  800. paddlex/modules/text_detection/dataset_checker/dataset_src/__init__.py +18 -0
  801. paddlex/modules/text_detection/dataset_checker/dataset_src/analyse_dataset.py +217 -0
  802. paddlex/modules/text_detection/dataset_checker/dataset_src/check_dataset.py +106 -0
  803. paddlex/modules/text_detection/dataset_checker/dataset_src/split_dataset.py +140 -0
  804. paddlex/modules/text_detection/evaluator.py +41 -0
  805. paddlex/modules/text_detection/exportor.py +22 -0
  806. paddlex/modules/text_detection/model_list.py +24 -0
  807. paddlex/modules/text_detection/trainer.py +68 -0
  808. paddlex/modules/text_recognition/__init__.py +18 -0
  809. paddlex/modules/text_recognition/dataset_checker/__init__.py +126 -0
  810. paddlex/modules/text_recognition/dataset_checker/dataset_src/__init__.py +19 -0
  811. paddlex/modules/text_recognition/dataset_checker/dataset_src/analyse_dataset.py +161 -0
  812. paddlex/modules/text_recognition/dataset_checker/dataset_src/check_dataset.py +107 -0
  813. paddlex/modules/text_recognition/dataset_checker/dataset_src/convert_dataset.py +94 -0
  814. paddlex/modules/text_recognition/dataset_checker/dataset_src/split_dataset.py +81 -0
  815. paddlex/modules/text_recognition/evaluator.py +64 -0
  816. paddlex/modules/text_recognition/exportor.py +22 -0
  817. paddlex/modules/text_recognition/model_list.py +34 -0
  818. paddlex/modules/text_recognition/trainer.py +106 -0
  819. paddlex/modules/ts_anomaly_detection/__init__.py +19 -0
  820. paddlex/modules/ts_anomaly_detection/dataset_checker/__init__.py +112 -0
  821. paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/__init__.py +19 -0
  822. paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/analyse_dataset.py +27 -0
  823. paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/check_dataset.py +64 -0
  824. paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/convert_dataset.py +78 -0
  825. paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/split_dataset.py +63 -0
  826. paddlex/modules/ts_anomaly_detection/evaluator.py +67 -0
  827. paddlex/modules/ts_anomaly_detection/exportor.py +45 -0
  828. paddlex/modules/ts_anomaly_detection/model_list.py +22 -0
  829. paddlex/modules/ts_anomaly_detection/trainer.py +113 -0
  830. paddlex/modules/ts_classification/__init__.py +19 -0
  831. paddlex/modules/ts_classification/dataset_checker/__init__.py +112 -0
  832. paddlex/modules/ts_classification/dataset_checker/dataset_src/__init__.py +19 -0
  833. paddlex/modules/ts_classification/dataset_checker/dataset_src/analyse_dataset.py +74 -0
  834. paddlex/modules/ts_classification/dataset_checker/dataset_src/check_dataset.py +64 -0
  835. paddlex/modules/ts_classification/dataset_checker/dataset_src/convert_dataset.py +78 -0
  836. paddlex/modules/ts_classification/dataset_checker/dataset_src/split_dataset.py +88 -0
  837. paddlex/modules/ts_classification/evaluator.py +66 -0
  838. paddlex/modules/ts_classification/exportor.py +45 -0
  839. paddlex/modules/ts_classification/model_list.py +18 -0
  840. paddlex/modules/ts_classification/trainer.py +108 -0
  841. paddlex/modules/ts_forecast/__init__.py +19 -0
  842. paddlex/modules/ts_forecast/dataset_checker/__init__.py +112 -0
  843. paddlex/modules/ts_forecast/dataset_checker/dataset_src/__init__.py +19 -0
  844. paddlex/modules/ts_forecast/dataset_checker/dataset_src/analyse_dataset.py +27 -0
  845. paddlex/modules/ts_forecast/dataset_checker/dataset_src/check_dataset.py +64 -0
  846. paddlex/modules/ts_forecast/dataset_checker/dataset_src/convert_dataset.py +77 -0
  847. paddlex/modules/ts_forecast/dataset_checker/dataset_src/split_dataset.py +63 -0
  848. paddlex/modules/ts_forecast/evaluator.py +66 -0
  849. paddlex/modules/ts_forecast/exportor.py +45 -0
  850. paddlex/modules/ts_forecast/model_list.py +24 -0
  851. paddlex/modules/ts_forecast/trainer.py +108 -0
  852. paddlex/modules/video_classification/__init__.py +18 -0
  853. paddlex/modules/video_classification/dataset_checker/__init__.py +93 -0
  854. paddlex/modules/video_classification/dataset_checker/dataset_src/__init__.py +18 -0
  855. paddlex/modules/video_classification/dataset_checker/dataset_src/analyse_dataset.py +93 -0
  856. paddlex/modules/video_classification/dataset_checker/dataset_src/check_dataset.py +121 -0
  857. paddlex/modules/video_classification/dataset_checker/dataset_src/split_dataset.py +82 -0
  858. paddlex/modules/video_classification/evaluator.py +44 -0
  859. paddlex/modules/video_classification/exportor.py +22 -0
  860. paddlex/modules/video_classification/model_list.py +19 -0
  861. paddlex/modules/video_classification/trainer.py +88 -0
  862. paddlex/modules/video_detection/__init__.py +18 -0
  863. paddlex/modules/video_detection/dataset_checker/__init__.py +86 -0
  864. paddlex/modules/video_detection/dataset_checker/dataset_src/__init__.py +17 -0
  865. paddlex/modules/video_detection/dataset_checker/dataset_src/analyse_dataset.py +101 -0
  866. paddlex/modules/video_detection/dataset_checker/dataset_src/check_dataset.py +134 -0
  867. paddlex/modules/video_detection/evaluator.py +42 -0
  868. paddlex/modules/video_detection/exportor.py +22 -0
  869. paddlex/modules/video_detection/model_list.py +15 -0
  870. paddlex/modules/video_detection/trainer.py +82 -0
  871. paddlex/ops/__init__.py +149 -0
  872. paddlex/ops/iou3d_nms/iou3d_cpu.cpp +264 -0
  873. paddlex/ops/iou3d_nms/iou3d_cpu.h +27 -0
  874. paddlex/ops/iou3d_nms/iou3d_nms.cpp +204 -0
  875. paddlex/ops/iou3d_nms/iou3d_nms.h +33 -0
  876. paddlex/ops/iou3d_nms/iou3d_nms_api.cpp +108 -0
  877. paddlex/ops/iou3d_nms/iou3d_nms_kernel.cu +482 -0
  878. paddlex/ops/setup.py +37 -0
  879. paddlex/ops/voxel/voxelize_op.cc +191 -0
  880. paddlex/ops/voxel/voxelize_op.cu +346 -0
  881. paddlex/paddle2onnx_requirements.txt +1 -0
  882. paddlex/paddlex_cli.py +464 -0
  883. paddlex/repo_apis/Paddle3D_api/__init__.py +17 -0
  884. paddlex/repo_apis/Paddle3D_api/bev_fusion/__init__.py +18 -0
  885. paddlex/repo_apis/Paddle3D_api/bev_fusion/config.py +118 -0
  886. paddlex/repo_apis/Paddle3D_api/bev_fusion/model.py +238 -0
  887. paddlex/repo_apis/Paddle3D_api/bev_fusion/register.py +55 -0
  888. paddlex/repo_apis/Paddle3D_api/bev_fusion/runner.py +104 -0
  889. paddlex/repo_apis/Paddle3D_api/pp3d_config.py +144 -0
  890. paddlex/repo_apis/PaddleClas_api/__init__.py +17 -0
  891. paddlex/repo_apis/PaddleClas_api/cls/__init__.py +19 -0
  892. paddlex/repo_apis/PaddleClas_api/cls/config.py +594 -0
  893. paddlex/repo_apis/PaddleClas_api/cls/model.py +355 -0
  894. paddlex/repo_apis/PaddleClas_api/cls/register.py +908 -0
  895. paddlex/repo_apis/PaddleClas_api/cls/runner.py +219 -0
  896. paddlex/repo_apis/PaddleClas_api/shitu_rec/__init__.py +18 -0
  897. paddlex/repo_apis/PaddleClas_api/shitu_rec/config.py +141 -0
  898. paddlex/repo_apis/PaddleClas_api/shitu_rec/model.py +23 -0
  899. paddlex/repo_apis/PaddleClas_api/shitu_rec/register.py +68 -0
  900. paddlex/repo_apis/PaddleClas_api/shitu_rec/runner.py +55 -0
  901. paddlex/repo_apis/PaddleDetection_api/__init__.py +17 -0
  902. paddlex/repo_apis/PaddleDetection_api/config_helper.py +280 -0
  903. paddlex/repo_apis/PaddleDetection_api/instance_seg/__init__.py +18 -0
  904. paddlex/repo_apis/PaddleDetection_api/instance_seg/config.py +458 -0
  905. paddlex/repo_apis/PaddleDetection_api/instance_seg/model.py +403 -0
  906. paddlex/repo_apis/PaddleDetection_api/instance_seg/register.py +263 -0
  907. paddlex/repo_apis/PaddleDetection_api/instance_seg/runner.py +226 -0
  908. paddlex/repo_apis/PaddleDetection_api/object_det/__init__.py +19 -0
  909. paddlex/repo_apis/PaddleDetection_api/object_det/config.py +539 -0
  910. paddlex/repo_apis/PaddleDetection_api/object_det/model.py +430 -0
  911. paddlex/repo_apis/PaddleDetection_api/object_det/official_categories.py +220 -0
  912. paddlex/repo_apis/PaddleDetection_api/object_det/register.py +1106 -0
  913. paddlex/repo_apis/PaddleDetection_api/object_det/runner.py +226 -0
  914. paddlex/repo_apis/PaddleNLP_api/__init__.py +13 -0
  915. paddlex/repo_apis/PaddleOCR_api/__init__.py +21 -0
  916. paddlex/repo_apis/PaddleOCR_api/config_utils.py +53 -0
  917. paddlex/repo_apis/PaddleOCR_api/formula_rec/__init__.py +16 -0
  918. paddlex/repo_apis/PaddleOCR_api/formula_rec/config.py +570 -0
  919. paddlex/repo_apis/PaddleOCR_api/formula_rec/model.py +402 -0
  920. paddlex/repo_apis/PaddleOCR_api/formula_rec/register.py +73 -0
  921. paddlex/repo_apis/PaddleOCR_api/formula_rec/runner.py +240 -0
  922. paddlex/repo_apis/PaddleOCR_api/table_rec/__init__.py +16 -0
  923. paddlex/repo_apis/PaddleOCR_api/table_rec/config.py +64 -0
  924. paddlex/repo_apis/PaddleOCR_api/table_rec/model.py +126 -0
  925. paddlex/repo_apis/PaddleOCR_api/table_rec/register.py +71 -0
  926. paddlex/repo_apis/PaddleOCR_api/table_rec/runner.py +51 -0
  927. paddlex/repo_apis/PaddleOCR_api/text_det/__init__.py +16 -0
  928. paddlex/repo_apis/PaddleOCR_api/text_det/config.py +62 -0
  929. paddlex/repo_apis/PaddleOCR_api/text_det/model.py +72 -0
  930. paddlex/repo_apis/PaddleOCR_api/text_det/register.py +90 -0
  931. paddlex/repo_apis/PaddleOCR_api/text_det/runner.py +53 -0
  932. paddlex/repo_apis/PaddleOCR_api/text_rec/__init__.py +16 -0
  933. paddlex/repo_apis/PaddleOCR_api/text_rec/config.py +563 -0
  934. paddlex/repo_apis/PaddleOCR_api/text_rec/model.py +402 -0
  935. paddlex/repo_apis/PaddleOCR_api/text_rec/register.py +199 -0
  936. paddlex/repo_apis/PaddleOCR_api/text_rec/runner.py +240 -0
  937. paddlex/repo_apis/PaddleSeg_api/__init__.py +16 -0
  938. paddlex/repo_apis/PaddleSeg_api/base_seg_config.py +134 -0
  939. paddlex/repo_apis/PaddleSeg_api/seg/__init__.py +16 -0
  940. paddlex/repo_apis/PaddleSeg_api/seg/config.py +186 -0
  941. paddlex/repo_apis/PaddleSeg_api/seg/model.py +491 -0
  942. paddlex/repo_apis/PaddleSeg_api/seg/register.py +273 -0
  943. paddlex/repo_apis/PaddleSeg_api/seg/runner.py +262 -0
  944. paddlex/repo_apis/PaddleTS_api/__init__.py +19 -0
  945. paddlex/repo_apis/PaddleTS_api/ts_ad/__init__.py +16 -0
  946. paddlex/repo_apis/PaddleTS_api/ts_ad/config.py +89 -0
  947. paddlex/repo_apis/PaddleTS_api/ts_ad/register.py +146 -0
  948. paddlex/repo_apis/PaddleTS_api/ts_ad/runner.py +158 -0
  949. paddlex/repo_apis/PaddleTS_api/ts_base/__init__.py +13 -0
  950. paddlex/repo_apis/PaddleTS_api/ts_base/config.py +246 -0
  951. paddlex/repo_apis/PaddleTS_api/ts_base/model.py +276 -0
  952. paddlex/repo_apis/PaddleTS_api/ts_base/runner.py +158 -0
  953. paddlex/repo_apis/PaddleTS_api/ts_cls/__init__.py +16 -0
  954. paddlex/repo_apis/PaddleTS_api/ts_cls/config.py +73 -0
  955. paddlex/repo_apis/PaddleTS_api/ts_cls/register.py +59 -0
  956. paddlex/repo_apis/PaddleTS_api/ts_cls/runner.py +158 -0
  957. paddlex/repo_apis/PaddleTS_api/ts_fc/__init__.py +16 -0
  958. paddlex/repo_apis/PaddleTS_api/ts_fc/config.py +137 -0
  959. paddlex/repo_apis/PaddleTS_api/ts_fc/register.py +186 -0
  960. paddlex/repo_apis/PaddleVideo_api/__init__.py +17 -0
  961. paddlex/repo_apis/PaddleVideo_api/config_utils.py +51 -0
  962. paddlex/repo_apis/PaddleVideo_api/video_cls/__init__.py +19 -0
  963. paddlex/repo_apis/PaddleVideo_api/video_cls/config.py +547 -0
  964. paddlex/repo_apis/PaddleVideo_api/video_cls/model.py +346 -0
  965. paddlex/repo_apis/PaddleVideo_api/video_cls/register.py +71 -0
  966. paddlex/repo_apis/PaddleVideo_api/video_cls/runner.py +205 -0
  967. paddlex/repo_apis/PaddleVideo_api/video_det/__init__.py +19 -0
  968. paddlex/repo_apis/PaddleVideo_api/video_det/config.py +548 -0
  969. paddlex/repo_apis/PaddleVideo_api/video_det/model.py +298 -0
  970. paddlex/repo_apis/PaddleVideo_api/video_det/register.py +45 -0
  971. paddlex/repo_apis/PaddleVideo_api/video_det/runner.py +200 -0
  972. paddlex/repo_apis/__init__.py +13 -0
  973. paddlex/repo_apis/base/__init__.py +23 -0
  974. paddlex/repo_apis/base/config.py +238 -0
  975. paddlex/repo_apis/base/model.py +571 -0
  976. paddlex/repo_apis/base/register.py +135 -0
  977. paddlex/repo_apis/base/runner.py +391 -0
  978. paddlex/repo_apis/base/utils/__init__.py +13 -0
  979. paddlex/repo_apis/base/utils/arg.py +64 -0
  980. paddlex/repo_apis/base/utils/subprocess.py +107 -0
  981. paddlex/repo_manager/__init__.py +24 -0
  982. paddlex/repo_manager/core.py +271 -0
  983. paddlex/repo_manager/meta.py +170 -0
  984. paddlex/repo_manager/repo.py +415 -0
  985. paddlex/repo_manager/requirements.txt +21 -0
  986. paddlex/repo_manager/utils.py +359 -0
  987. paddlex/serving_requirements.txt +9 -0
  988. paddlex/utils/__init__.py +1 -12
  989. paddlex/utils/cache.py +148 -0
  990. paddlex/utils/config.py +215 -0
  991. paddlex/utils/custom_device_whitelist.py +457 -0
  992. paddlex/utils/device.py +151 -0
  993. paddlex/utils/download.py +168 -182
  994. paddlex/utils/env.py +11 -50
  995. paddlex/utils/errors/__init__.py +17 -0
  996. paddlex/utils/errors/dataset_checker.py +78 -0
  997. paddlex/utils/errors/others.py +152 -0
  998. paddlex/utils/file_interface.py +212 -0
  999. paddlex/utils/flags.py +65 -0
  1000. paddlex/utils/fonts/__init__.py +67 -0
  1001. paddlex/utils/func_register.py +41 -0
  1002. paddlex/utils/interactive_get_pipeline.py +55 -0
  1003. paddlex/utils/lazy_loader.py +68 -0
  1004. paddlex/utils/logging.py +131 -33
  1005. paddlex/utils/misc.py +201 -0
  1006. paddlex/utils/pipeline_arguments.py +711 -0
  1007. paddlex/utils/result_saver.py +59 -0
  1008. paddlex/utils/subclass_register.py +101 -0
  1009. paddlex/version.py +54 -0
  1010. paddlex-3.0.0rc0.dist-info/LICENSE +169 -0
  1011. paddlex-3.0.0rc0.dist-info/METADATA +1035 -0
  1012. paddlex-3.0.0rc0.dist-info/RECORD +1015 -0
  1013. paddlex-3.0.0rc0.dist-info/WHEEL +5 -0
  1014. paddlex-3.0.0rc0.dist-info/entry_points.txt +2 -0
  1015. paddlex-3.0.0rc0.dist-info/top_level.txt +1 -0
  1016. PaddleClas/__init__.py +0 -16
  1017. PaddleClas/deploy/__init__.py +0 -1
  1018. PaddleClas/deploy/paddleserving/__init__.py +0 -0
  1019. PaddleClas/deploy/paddleserving/classification_web_service.py +0 -74
  1020. PaddleClas/deploy/paddleserving/cpu_utilization.py +0 -4
  1021. PaddleClas/deploy/paddleserving/pipeline_http_client.py +0 -20
  1022. PaddleClas/deploy/paddleserving/pipeline_rpc_client.py +0 -33
  1023. PaddleClas/deploy/paddleserving/recognition/__init__.py +0 -0
  1024. PaddleClas/deploy/paddleserving/recognition/pipeline_http_client.py +0 -21
  1025. PaddleClas/deploy/paddleserving/recognition/pipeline_rpc_client.py +0 -34
  1026. PaddleClas/deploy/paddleserving/recognition/recognition_web_service.py +0 -209
  1027. PaddleClas/deploy/python/__init__.py +0 -0
  1028. PaddleClas/deploy/python/build_gallery.py +0 -214
  1029. PaddleClas/deploy/python/det_preprocess.py +0 -205
  1030. PaddleClas/deploy/python/postprocess.py +0 -161
  1031. PaddleClas/deploy/python/predict_cls.py +0 -142
  1032. PaddleClas/deploy/python/predict_det.py +0 -158
  1033. PaddleClas/deploy/python/predict_rec.py +0 -138
  1034. PaddleClas/deploy/python/predict_system.py +0 -144
  1035. PaddleClas/deploy/python/preprocess.py +0 -337
  1036. PaddleClas/deploy/utils/__init__.py +0 -5
  1037. PaddleClas/deploy/utils/config.py +0 -197
  1038. PaddleClas/deploy/utils/draw_bbox.py +0 -61
  1039. PaddleClas/deploy/utils/encode_decode.py +0 -31
  1040. PaddleClas/deploy/utils/get_image_list.py +0 -49
  1041. PaddleClas/deploy/utils/logger.py +0 -120
  1042. PaddleClas/deploy/utils/predictor.py +0 -71
  1043. PaddleClas/deploy/vector_search/__init__.py +0 -1
  1044. PaddleClas/deploy/vector_search/interface.py +0 -272
  1045. PaddleClas/deploy/vector_search/test.py +0 -34
  1046. PaddleClas/hubconf.py +0 -788
  1047. PaddleClas/paddleclas.py +0 -552
  1048. PaddleClas/ppcls/__init__.py +0 -20
  1049. PaddleClas/ppcls/arch/__init__.py +0 -127
  1050. PaddleClas/ppcls/arch/backbone/__init__.py +0 -80
  1051. PaddleClas/ppcls/arch/backbone/base/__init__.py +0 -0
  1052. PaddleClas/ppcls/arch/backbone/base/theseus_layer.py +0 -126
  1053. PaddleClas/ppcls/arch/backbone/legendary_models/__init__.py +0 -6
  1054. PaddleClas/ppcls/arch/backbone/legendary_models/esnet.py +0 -355
  1055. PaddleClas/ppcls/arch/backbone/legendary_models/hrnet.py +0 -744
  1056. PaddleClas/ppcls/arch/backbone/legendary_models/inception_v3.py +0 -539
  1057. PaddleClas/ppcls/arch/backbone/legendary_models/mobilenet_v1.py +0 -234
  1058. PaddleClas/ppcls/arch/backbone/legendary_models/mobilenet_v3.py +0 -561
  1059. PaddleClas/ppcls/arch/backbone/legendary_models/pp_lcnet.py +0 -399
  1060. PaddleClas/ppcls/arch/backbone/legendary_models/resnet.py +0 -534
  1061. PaddleClas/ppcls/arch/backbone/legendary_models/vgg.py +0 -231
  1062. PaddleClas/ppcls/arch/backbone/model_zoo/__init__.py +0 -0
  1063. PaddleClas/ppcls/arch/backbone/model_zoo/alexnet.py +0 -168
  1064. PaddleClas/ppcls/arch/backbone/model_zoo/cspnet.py +0 -376
  1065. PaddleClas/ppcls/arch/backbone/model_zoo/darknet.py +0 -197
  1066. PaddleClas/ppcls/arch/backbone/model_zoo/densenet.py +0 -344
  1067. PaddleClas/ppcls/arch/backbone/model_zoo/distilled_vision_transformer.py +0 -272
  1068. PaddleClas/ppcls/arch/backbone/model_zoo/dla.py +0 -528
  1069. PaddleClas/ppcls/arch/backbone/model_zoo/dpn.py +0 -451
  1070. PaddleClas/ppcls/arch/backbone/model_zoo/efficientnet.py +0 -976
  1071. PaddleClas/ppcls/arch/backbone/model_zoo/ghostnet.py +0 -363
  1072. PaddleClas/ppcls/arch/backbone/model_zoo/googlenet.py +0 -229
  1073. PaddleClas/ppcls/arch/backbone/model_zoo/gvt.py +0 -693
  1074. PaddleClas/ppcls/arch/backbone/model_zoo/hardnet.py +0 -293
  1075. PaddleClas/ppcls/arch/backbone/model_zoo/inception_v4.py +0 -477
  1076. PaddleClas/ppcls/arch/backbone/model_zoo/levit.py +0 -589
  1077. PaddleClas/ppcls/arch/backbone/model_zoo/mixnet.py +0 -815
  1078. PaddleClas/ppcls/arch/backbone/model_zoo/mobilenet_v2.py +0 -287
  1079. PaddleClas/ppcls/arch/backbone/model_zoo/rednet.py +0 -203
  1080. PaddleClas/ppcls/arch/backbone/model_zoo/regnet.py +0 -431
  1081. PaddleClas/ppcls/arch/backbone/model_zoo/repvgg.py +0 -422
  1082. PaddleClas/ppcls/arch/backbone/model_zoo/res2net.py +0 -264
  1083. PaddleClas/ppcls/arch/backbone/model_zoo/res2net_vd.py +0 -305
  1084. PaddleClas/ppcls/arch/backbone/model_zoo/resnest.py +0 -740
  1085. PaddleClas/ppcls/arch/backbone/model_zoo/resnet_vc.py +0 -309
  1086. PaddleClas/ppcls/arch/backbone/model_zoo/resnext.py +0 -298
  1087. PaddleClas/ppcls/arch/backbone/model_zoo/resnext101_wsl.py +0 -490
  1088. PaddleClas/ppcls/arch/backbone/model_zoo/resnext_vd.py +0 -317
  1089. PaddleClas/ppcls/arch/backbone/model_zoo/rexnet.py +0 -281
  1090. PaddleClas/ppcls/arch/backbone/model_zoo/se_resnet_vd.py +0 -390
  1091. PaddleClas/ppcls/arch/backbone/model_zoo/se_resnext.py +0 -364
  1092. PaddleClas/ppcls/arch/backbone/model_zoo/se_resnext_vd.py +0 -309
  1093. PaddleClas/ppcls/arch/backbone/model_zoo/shufflenet_v2.py +0 -362
  1094. PaddleClas/ppcls/arch/backbone/model_zoo/squeezenet.py +0 -194
  1095. PaddleClas/ppcls/arch/backbone/model_zoo/swin_transformer.py +0 -857
  1096. PaddleClas/ppcls/arch/backbone/model_zoo/tnt.py +0 -385
  1097. PaddleClas/ppcls/arch/backbone/model_zoo/vision_transformer.py +0 -495
  1098. PaddleClas/ppcls/arch/backbone/model_zoo/xception.py +0 -377
  1099. PaddleClas/ppcls/arch/backbone/model_zoo/xception_deeplab.py +0 -421
  1100. PaddleClas/ppcls/arch/backbone/variant_models/__init__.py +0 -3
  1101. PaddleClas/ppcls/arch/backbone/variant_models/pp_lcnet_variant.py +0 -29
  1102. PaddleClas/ppcls/arch/backbone/variant_models/resnet_variant.py +0 -23
  1103. PaddleClas/ppcls/arch/backbone/variant_models/vgg_variant.py +0 -28
  1104. PaddleClas/ppcls/arch/gears/__init__.py +0 -32
  1105. PaddleClas/ppcls/arch/gears/arcmargin.py +0 -72
  1106. PaddleClas/ppcls/arch/gears/circlemargin.py +0 -59
  1107. PaddleClas/ppcls/arch/gears/cosmargin.py +0 -55
  1108. PaddleClas/ppcls/arch/gears/fc.py +0 -35
  1109. PaddleClas/ppcls/arch/gears/identity_head.py +0 -9
  1110. PaddleClas/ppcls/arch/gears/vehicle_neck.py +0 -52
  1111. PaddleClas/ppcls/arch/utils.py +0 -53
  1112. PaddleClas/ppcls/data/__init__.py +0 -144
  1113. PaddleClas/ppcls/data/dataloader/DistributedRandomIdentitySampler.py +0 -90
  1114. PaddleClas/ppcls/data/dataloader/__init__.py +0 -9
  1115. PaddleClas/ppcls/data/dataloader/common_dataset.py +0 -84
  1116. PaddleClas/ppcls/data/dataloader/dali.py +0 -319
  1117. PaddleClas/ppcls/data/dataloader/icartoon_dataset.py +0 -36
  1118. PaddleClas/ppcls/data/dataloader/imagenet_dataset.py +0 -38
  1119. PaddleClas/ppcls/data/dataloader/logo_dataset.py +0 -46
  1120. PaddleClas/ppcls/data/dataloader/mix_dataset.py +0 -49
  1121. PaddleClas/ppcls/data/dataloader/mix_sampler.py +0 -79
  1122. PaddleClas/ppcls/data/dataloader/multilabel_dataset.py +0 -59
  1123. PaddleClas/ppcls/data/dataloader/pk_sampler.py +0 -105
  1124. PaddleClas/ppcls/data/dataloader/vehicle_dataset.py +0 -138
  1125. PaddleClas/ppcls/data/postprocess/__init__.py +0 -41
  1126. PaddleClas/ppcls/data/postprocess/topk.py +0 -85
  1127. PaddleClas/ppcls/data/preprocess/__init__.py +0 -100
  1128. PaddleClas/ppcls/data/preprocess/batch_ops/__init__.py +0 -1
  1129. PaddleClas/ppcls/data/preprocess/batch_ops/batch_operators.py +0 -231
  1130. PaddleClas/ppcls/data/preprocess/ops/__init__.py +0 -1
  1131. PaddleClas/ppcls/data/preprocess/ops/autoaugment.py +0 -264
  1132. PaddleClas/ppcls/data/preprocess/ops/cutout.py +0 -41
  1133. PaddleClas/ppcls/data/preprocess/ops/fmix.py +0 -217
  1134. PaddleClas/ppcls/data/preprocess/ops/functional.py +0 -138
  1135. PaddleClas/ppcls/data/preprocess/ops/grid.py +0 -89
  1136. PaddleClas/ppcls/data/preprocess/ops/hide_and_seek.py +0 -44
  1137. PaddleClas/ppcls/data/preprocess/ops/operators.py +0 -384
  1138. PaddleClas/ppcls/data/preprocess/ops/randaugment.py +0 -106
  1139. PaddleClas/ppcls/data/preprocess/ops/random_erasing.py +0 -90
  1140. PaddleClas/ppcls/data/preprocess/ops/timm_autoaugment.py +0 -877
  1141. PaddleClas/ppcls/data/utils/__init__.py +0 -13
  1142. PaddleClas/ppcls/data/utils/get_image_list.py +0 -49
  1143. PaddleClas/ppcls/engine/__init__.py +0 -0
  1144. PaddleClas/ppcls/engine/engine.py +0 -436
  1145. PaddleClas/ppcls/engine/evaluation/__init__.py +0 -16
  1146. PaddleClas/ppcls/engine/evaluation/classification.py +0 -143
  1147. PaddleClas/ppcls/engine/evaluation/retrieval.py +0 -169
  1148. PaddleClas/ppcls/engine/slim/__init__.py +0 -16
  1149. PaddleClas/ppcls/engine/slim/prune.py +0 -66
  1150. PaddleClas/ppcls/engine/slim/quant.py +0 -55
  1151. PaddleClas/ppcls/engine/train/__init__.py +0 -14
  1152. PaddleClas/ppcls/engine/train/train.py +0 -79
  1153. PaddleClas/ppcls/engine/train/utils.py +0 -72
  1154. PaddleClas/ppcls/loss/__init__.py +0 -65
  1155. PaddleClas/ppcls/loss/celoss.py +0 -67
  1156. PaddleClas/ppcls/loss/centerloss.py +0 -54
  1157. PaddleClas/ppcls/loss/comfunc.py +0 -45
  1158. PaddleClas/ppcls/loss/deephashloss.py +0 -92
  1159. PaddleClas/ppcls/loss/distanceloss.py +0 -43
  1160. PaddleClas/ppcls/loss/distillationloss.py +0 -141
  1161. PaddleClas/ppcls/loss/dmlloss.py +0 -46
  1162. PaddleClas/ppcls/loss/emlloss.py +0 -97
  1163. PaddleClas/ppcls/loss/googlenetloss.py +0 -41
  1164. PaddleClas/ppcls/loss/msmloss.py +0 -78
  1165. PaddleClas/ppcls/loss/multilabelloss.py +0 -43
  1166. PaddleClas/ppcls/loss/npairsloss.py +0 -38
  1167. PaddleClas/ppcls/loss/pairwisecosface.py +0 -55
  1168. PaddleClas/ppcls/loss/supconloss.py +0 -108
  1169. PaddleClas/ppcls/loss/trihardloss.py +0 -82
  1170. PaddleClas/ppcls/loss/triplet.py +0 -137
  1171. PaddleClas/ppcls/metric/__init__.py +0 -51
  1172. PaddleClas/ppcls/metric/metrics.py +0 -308
  1173. PaddleClas/ppcls/optimizer/__init__.py +0 -72
  1174. PaddleClas/ppcls/optimizer/learning_rate.py +0 -326
  1175. PaddleClas/ppcls/optimizer/optimizer.py +0 -207
  1176. PaddleClas/ppcls/utils/__init__.py +0 -27
  1177. PaddleClas/ppcls/utils/check.py +0 -151
  1178. PaddleClas/ppcls/utils/config.py +0 -210
  1179. PaddleClas/ppcls/utils/download.py +0 -319
  1180. PaddleClas/ppcls/utils/ema.py +0 -63
  1181. PaddleClas/ppcls/utils/logger.py +0 -137
  1182. PaddleClas/ppcls/utils/metrics.py +0 -107
  1183. PaddleClas/ppcls/utils/misc.py +0 -63
  1184. PaddleClas/ppcls/utils/model_zoo.py +0 -213
  1185. PaddleClas/ppcls/utils/profiler.py +0 -111
  1186. PaddleClas/ppcls/utils/save_load.py +0 -136
  1187. PaddleClas/setup.py +0 -58
  1188. PaddleClas/tools/__init__.py +0 -15
  1189. PaddleClas/tools/eval.py +0 -31
  1190. PaddleClas/tools/export_model.py +0 -34
  1191. PaddleClas/tools/infer.py +0 -31
  1192. PaddleClas/tools/train.py +0 -32
  1193. paddlex/cls.py +0 -82
  1194. paddlex/command.py +0 -215
  1195. paddlex/cv/__init__.py +0 -17
  1196. paddlex/cv/datasets/__init__.py +0 -18
  1197. paddlex/cv/datasets/coco.py +0 -208
  1198. paddlex/cv/datasets/imagenet.py +0 -88
  1199. paddlex/cv/datasets/seg_dataset.py +0 -91
  1200. paddlex/cv/datasets/voc.py +0 -445
  1201. paddlex/cv/models/__init__.py +0 -18
  1202. paddlex/cv/models/base.py +0 -631
  1203. paddlex/cv/models/classifier.py +0 -989
  1204. paddlex/cv/models/detector.py +0 -2292
  1205. paddlex/cv/models/load_model.py +0 -148
  1206. paddlex/cv/models/segmenter.py +0 -768
  1207. paddlex/cv/models/slim/__init__.py +0 -13
  1208. paddlex/cv/models/slim/prune.py +0 -55
  1209. paddlex/cv/models/utils/__init__.py +0 -13
  1210. paddlex/cv/models/utils/det_metrics/__init__.py +0 -15
  1211. paddlex/cv/models/utils/det_metrics/coco_utils.py +0 -476
  1212. paddlex/cv/models/utils/det_metrics/metrics.py +0 -220
  1213. paddlex/cv/models/utils/infer_nets.py +0 -45
  1214. paddlex/cv/models/utils/seg_metrics.py +0 -62
  1215. paddlex/cv/models/utils/visualize.py +0 -399
  1216. paddlex/cv/transforms/__init__.py +0 -46
  1217. paddlex/cv/transforms/batch_operators.py +0 -286
  1218. paddlex/cv/transforms/box_utils.py +0 -41
  1219. paddlex/cv/transforms/functions.py +0 -193
  1220. paddlex/cv/transforms/operators.py +0 -1402
  1221. paddlex/deploy.py +0 -268
  1222. paddlex/det.py +0 -49
  1223. paddlex/paddleseg/__init__.py +0 -17
  1224. paddlex/paddleseg/core/__init__.py +0 -20
  1225. paddlex/paddleseg/core/infer.py +0 -289
  1226. paddlex/paddleseg/core/predict.py +0 -145
  1227. paddlex/paddleseg/core/train.py +0 -258
  1228. paddlex/paddleseg/core/val.py +0 -172
  1229. paddlex/paddleseg/cvlibs/__init__.py +0 -17
  1230. paddlex/paddleseg/cvlibs/callbacks.py +0 -279
  1231. paddlex/paddleseg/cvlibs/config.py +0 -359
  1232. paddlex/paddleseg/cvlibs/manager.py +0 -142
  1233. paddlex/paddleseg/cvlibs/param_init.py +0 -91
  1234. paddlex/paddleseg/datasets/__init__.py +0 -21
  1235. paddlex/paddleseg/datasets/ade.py +0 -112
  1236. paddlex/paddleseg/datasets/cityscapes.py +0 -86
  1237. paddlex/paddleseg/datasets/cocostuff.py +0 -79
  1238. paddlex/paddleseg/datasets/dataset.py +0 -164
  1239. paddlex/paddleseg/datasets/mini_deep_globe_road_extraction.py +0 -95
  1240. paddlex/paddleseg/datasets/optic_disc_seg.py +0 -97
  1241. paddlex/paddleseg/datasets/pascal_context.py +0 -80
  1242. paddlex/paddleseg/datasets/voc.py +0 -113
  1243. paddlex/paddleseg/models/__init__.py +0 -39
  1244. paddlex/paddleseg/models/ann.py +0 -436
  1245. paddlex/paddleseg/models/attention_unet.py +0 -189
  1246. paddlex/paddleseg/models/backbones/__init__.py +0 -18
  1247. paddlex/paddleseg/models/backbones/hrnet.py +0 -815
  1248. paddlex/paddleseg/models/backbones/mobilenetv3.py +0 -365
  1249. paddlex/paddleseg/models/backbones/resnet_vd.py +0 -364
  1250. paddlex/paddleseg/models/backbones/xception_deeplab.py +0 -415
  1251. paddlex/paddleseg/models/bisenet.py +0 -311
  1252. paddlex/paddleseg/models/danet.py +0 -220
  1253. paddlex/paddleseg/models/decoupled_segnet.py +0 -233
  1254. paddlex/paddleseg/models/deeplab.py +0 -258
  1255. paddlex/paddleseg/models/dnlnet.py +0 -231
  1256. paddlex/paddleseg/models/emanet.py +0 -219
  1257. paddlex/paddleseg/models/fast_scnn.py +0 -318
  1258. paddlex/paddleseg/models/fcn.py +0 -135
  1259. paddlex/paddleseg/models/gcnet.py +0 -223
  1260. paddlex/paddleseg/models/gscnn.py +0 -357
  1261. paddlex/paddleseg/models/hardnet.py +0 -309
  1262. paddlex/paddleseg/models/isanet.py +0 -202
  1263. paddlex/paddleseg/models/layers/__init__.py +0 -19
  1264. paddlex/paddleseg/models/layers/activation.py +0 -73
  1265. paddlex/paddleseg/models/layers/attention.py +0 -146
  1266. paddlex/paddleseg/models/layers/layer_libs.py +0 -168
  1267. paddlex/paddleseg/models/layers/nonlocal2d.py +0 -155
  1268. paddlex/paddleseg/models/layers/pyramid_pool.py +0 -182
  1269. paddlex/paddleseg/models/losses/__init__.py +0 -27
  1270. paddlex/paddleseg/models/losses/binary_cross_entropy_loss.py +0 -174
  1271. paddlex/paddleseg/models/losses/bootstrapped_cross_entropy.py +0 -73
  1272. paddlex/paddleseg/models/losses/cross_entropy_loss.py +0 -94
  1273. paddlex/paddleseg/models/losses/decoupledsegnet_relax_boundary_loss.py +0 -129
  1274. paddlex/paddleseg/models/losses/dice_loss.py +0 -61
  1275. paddlex/paddleseg/models/losses/edge_attention_loss.py +0 -78
  1276. paddlex/paddleseg/models/losses/gscnn_dual_task_loss.py +0 -141
  1277. paddlex/paddleseg/models/losses/l1_loss.py +0 -76
  1278. paddlex/paddleseg/models/losses/lovasz_loss.py +0 -222
  1279. paddlex/paddleseg/models/losses/mean_square_error_loss.py +0 -65
  1280. paddlex/paddleseg/models/losses/mixed_loss.py +0 -58
  1281. paddlex/paddleseg/models/losses/ohem_cross_entropy_loss.py +0 -99
  1282. paddlex/paddleseg/models/losses/ohem_edge_attention_loss.py +0 -114
  1283. paddlex/paddleseg/models/ocrnet.py +0 -248
  1284. paddlex/paddleseg/models/pspnet.py +0 -147
  1285. paddlex/paddleseg/models/sfnet.py +0 -236
  1286. paddlex/paddleseg/models/shufflenet_slim.py +0 -268
  1287. paddlex/paddleseg/models/u2net.py +0 -574
  1288. paddlex/paddleseg/models/unet.py +0 -155
  1289. paddlex/paddleseg/models/unet_3plus.py +0 -316
  1290. paddlex/paddleseg/models/unet_plusplus.py +0 -237
  1291. paddlex/paddleseg/transforms/__init__.py +0 -16
  1292. paddlex/paddleseg/transforms/functional.py +0 -161
  1293. paddlex/paddleseg/transforms/transforms.py +0 -937
  1294. paddlex/paddleseg/utils/__init__.py +0 -22
  1295. paddlex/paddleseg/utils/config_check.py +0 -60
  1296. paddlex/paddleseg/utils/download.py +0 -163
  1297. paddlex/paddleseg/utils/env/__init__.py +0 -16
  1298. paddlex/paddleseg/utils/env/seg_env.py +0 -56
  1299. paddlex/paddleseg/utils/env/sys_env.py +0 -122
  1300. paddlex/paddleseg/utils/logger.py +0 -48
  1301. paddlex/paddleseg/utils/metrics.py +0 -146
  1302. paddlex/paddleseg/utils/progbar.py +0 -212
  1303. paddlex/paddleseg/utils/timer.py +0 -53
  1304. paddlex/paddleseg/utils/utils.py +0 -120
  1305. paddlex/paddleseg/utils/visualize.py +0 -90
  1306. paddlex/ppcls/__init__.py +0 -20
  1307. paddlex/ppcls/arch/__init__.py +0 -127
  1308. paddlex/ppcls/arch/backbone/__init__.py +0 -80
  1309. paddlex/ppcls/arch/backbone/base/__init__.py +0 -0
  1310. paddlex/ppcls/arch/backbone/base/theseus_layer.py +0 -130
  1311. paddlex/ppcls/arch/backbone/legendary_models/__init__.py +0 -6
  1312. paddlex/ppcls/arch/backbone/legendary_models/esnet.py +0 -355
  1313. paddlex/ppcls/arch/backbone/legendary_models/hrnet.py +0 -748
  1314. paddlex/ppcls/arch/backbone/legendary_models/inception_v3.py +0 -539
  1315. paddlex/ppcls/arch/backbone/legendary_models/mobilenet_v1.py +0 -234
  1316. paddlex/ppcls/arch/backbone/legendary_models/mobilenet_v3.py +0 -561
  1317. paddlex/ppcls/arch/backbone/legendary_models/pp_lcnet.py +0 -399
  1318. paddlex/ppcls/arch/backbone/legendary_models/resnet.py +0 -534
  1319. paddlex/ppcls/arch/backbone/legendary_models/vgg.py +0 -235
  1320. paddlex/ppcls/arch/backbone/model_zoo/__init__.py +0 -0
  1321. paddlex/ppcls/arch/backbone/model_zoo/alexnet.py +0 -168
  1322. paddlex/ppcls/arch/backbone/model_zoo/cspnet.py +0 -376
  1323. paddlex/ppcls/arch/backbone/model_zoo/darknet.py +0 -197
  1324. paddlex/ppcls/arch/backbone/model_zoo/densenet.py +0 -344
  1325. paddlex/ppcls/arch/backbone/model_zoo/distilled_vision_transformer.py +0 -272
  1326. paddlex/ppcls/arch/backbone/model_zoo/dla.py +0 -528
  1327. paddlex/ppcls/arch/backbone/model_zoo/dpn.py +0 -451
  1328. paddlex/ppcls/arch/backbone/model_zoo/efficientnet.py +0 -976
  1329. paddlex/ppcls/arch/backbone/model_zoo/ghostnet.py +0 -363
  1330. paddlex/ppcls/arch/backbone/model_zoo/googlenet.py +0 -229
  1331. paddlex/ppcls/arch/backbone/model_zoo/gvt.py +0 -693
  1332. paddlex/ppcls/arch/backbone/model_zoo/hardnet.py +0 -293
  1333. paddlex/ppcls/arch/backbone/model_zoo/inception_v4.py +0 -477
  1334. paddlex/ppcls/arch/backbone/model_zoo/levit.py +0 -589
  1335. paddlex/ppcls/arch/backbone/model_zoo/mixnet.py +0 -815
  1336. paddlex/ppcls/arch/backbone/model_zoo/mobilenet_v2.py +0 -287
  1337. paddlex/ppcls/arch/backbone/model_zoo/rednet.py +0 -203
  1338. paddlex/ppcls/arch/backbone/model_zoo/regnet.py +0 -431
  1339. paddlex/ppcls/arch/backbone/model_zoo/repvgg.py +0 -422
  1340. paddlex/ppcls/arch/backbone/model_zoo/res2net.py +0 -264
  1341. paddlex/ppcls/arch/backbone/model_zoo/res2net_vd.py +0 -305
  1342. paddlex/ppcls/arch/backbone/model_zoo/resnest.py +0 -740
  1343. paddlex/ppcls/arch/backbone/model_zoo/resnet_vc.py +0 -309
  1344. paddlex/ppcls/arch/backbone/model_zoo/resnext.py +0 -298
  1345. paddlex/ppcls/arch/backbone/model_zoo/resnext101_wsl.py +0 -490
  1346. paddlex/ppcls/arch/backbone/model_zoo/resnext_vd.py +0 -317
  1347. paddlex/ppcls/arch/backbone/model_zoo/rexnet.py +0 -281
  1348. paddlex/ppcls/arch/backbone/model_zoo/se_resnet_vd.py +0 -390
  1349. paddlex/ppcls/arch/backbone/model_zoo/se_resnext.py +0 -364
  1350. paddlex/ppcls/arch/backbone/model_zoo/se_resnext_vd.py +0 -309
  1351. paddlex/ppcls/arch/backbone/model_zoo/shufflenet_v2.py +0 -362
  1352. paddlex/ppcls/arch/backbone/model_zoo/squeezenet.py +0 -194
  1353. paddlex/ppcls/arch/backbone/model_zoo/swin_transformer.py +0 -857
  1354. paddlex/ppcls/arch/backbone/model_zoo/tnt.py +0 -385
  1355. paddlex/ppcls/arch/backbone/model_zoo/vision_transformer.py +0 -495
  1356. paddlex/ppcls/arch/backbone/model_zoo/xception.py +0 -377
  1357. paddlex/ppcls/arch/backbone/model_zoo/xception_deeplab.py +0 -421
  1358. paddlex/ppcls/arch/backbone/variant_models/__init__.py +0 -3
  1359. paddlex/ppcls/arch/backbone/variant_models/pp_lcnet_variant.py +0 -29
  1360. paddlex/ppcls/arch/backbone/variant_models/resnet_variant.py +0 -23
  1361. paddlex/ppcls/arch/backbone/variant_models/vgg_variant.py +0 -28
  1362. paddlex/ppcls/arch/gears/__init__.py +0 -32
  1363. paddlex/ppcls/arch/gears/arcmargin.py +0 -72
  1364. paddlex/ppcls/arch/gears/circlemargin.py +0 -59
  1365. paddlex/ppcls/arch/gears/cosmargin.py +0 -55
  1366. paddlex/ppcls/arch/gears/fc.py +0 -35
  1367. paddlex/ppcls/arch/gears/identity_head.py +0 -9
  1368. paddlex/ppcls/arch/gears/vehicle_neck.py +0 -52
  1369. paddlex/ppcls/arch/utils.py +0 -53
  1370. paddlex/ppcls/data/__init__.py +0 -144
  1371. paddlex/ppcls/data/dataloader/DistributedRandomIdentitySampler.py +0 -90
  1372. paddlex/ppcls/data/dataloader/__init__.py +0 -9
  1373. paddlex/ppcls/data/dataloader/common_dataset.py +0 -84
  1374. paddlex/ppcls/data/dataloader/dali.py +0 -319
  1375. paddlex/ppcls/data/dataloader/icartoon_dataset.py +0 -36
  1376. paddlex/ppcls/data/dataloader/imagenet_dataset.py +0 -38
  1377. paddlex/ppcls/data/dataloader/logo_dataset.py +0 -46
  1378. paddlex/ppcls/data/dataloader/mix_dataset.py +0 -49
  1379. paddlex/ppcls/data/dataloader/mix_sampler.py +0 -79
  1380. paddlex/ppcls/data/dataloader/multilabel_dataset.py +0 -59
  1381. paddlex/ppcls/data/dataloader/pk_sampler.py +0 -105
  1382. paddlex/ppcls/data/dataloader/vehicle_dataset.py +0 -138
  1383. paddlex/ppcls/data/postprocess/__init__.py +0 -41
  1384. paddlex/ppcls/data/postprocess/topk.py +0 -85
  1385. paddlex/ppcls/data/preprocess/__init__.py +0 -100
  1386. paddlex/ppcls/data/preprocess/batch_ops/__init__.py +0 -0
  1387. paddlex/ppcls/data/preprocess/batch_ops/batch_operators.py +0 -231
  1388. paddlex/ppcls/data/preprocess/ops/__init__.py +0 -0
  1389. paddlex/ppcls/data/preprocess/ops/autoaugment.py +0 -264
  1390. paddlex/ppcls/data/preprocess/ops/cutout.py +0 -41
  1391. paddlex/ppcls/data/preprocess/ops/fmix.py +0 -217
  1392. paddlex/ppcls/data/preprocess/ops/functional.py +0 -141
  1393. paddlex/ppcls/data/preprocess/ops/grid.py +0 -89
  1394. paddlex/ppcls/data/preprocess/ops/hide_and_seek.py +0 -44
  1395. paddlex/ppcls/data/preprocess/ops/operators.py +0 -384
  1396. paddlex/ppcls/data/preprocess/ops/randaugment.py +0 -106
  1397. paddlex/ppcls/data/preprocess/ops/random_erasing.py +0 -90
  1398. paddlex/ppcls/data/preprocess/ops/timm_autoaugment.py +0 -877
  1399. paddlex/ppcls/data/utils/__init__.py +0 -13
  1400. paddlex/ppcls/data/utils/get_image_list.py +0 -49
  1401. paddlex/ppcls/engine/__init__.py +0 -0
  1402. paddlex/ppcls/engine/engine.py +0 -436
  1403. paddlex/ppcls/engine/evaluation/__init__.py +0 -16
  1404. paddlex/ppcls/engine/evaluation/classification.py +0 -143
  1405. paddlex/ppcls/engine/evaluation/retrieval.py +0 -169
  1406. paddlex/ppcls/engine/slim/__init__.py +0 -16
  1407. paddlex/ppcls/engine/slim/prune.py +0 -66
  1408. paddlex/ppcls/engine/slim/quant.py +0 -55
  1409. paddlex/ppcls/engine/train/__init__.py +0 -14
  1410. paddlex/ppcls/engine/train/train.py +0 -79
  1411. paddlex/ppcls/engine/train/utils.py +0 -72
  1412. paddlex/ppcls/loss/__init__.py +0 -65
  1413. paddlex/ppcls/loss/celoss.py +0 -67
  1414. paddlex/ppcls/loss/centerloss.py +0 -54
  1415. paddlex/ppcls/loss/comfunc.py +0 -45
  1416. paddlex/ppcls/loss/deephashloss.py +0 -96
  1417. paddlex/ppcls/loss/distanceloss.py +0 -43
  1418. paddlex/ppcls/loss/distillationloss.py +0 -141
  1419. paddlex/ppcls/loss/dmlloss.py +0 -46
  1420. paddlex/ppcls/loss/emlloss.py +0 -97
  1421. paddlex/ppcls/loss/googlenetloss.py +0 -42
  1422. paddlex/ppcls/loss/msmloss.py +0 -78
  1423. paddlex/ppcls/loss/multilabelloss.py +0 -43
  1424. paddlex/ppcls/loss/npairsloss.py +0 -38
  1425. paddlex/ppcls/loss/pairwisecosface.py +0 -59
  1426. paddlex/ppcls/loss/supconloss.py +0 -108
  1427. paddlex/ppcls/loss/trihardloss.py +0 -82
  1428. paddlex/ppcls/loss/triplet.py +0 -137
  1429. paddlex/ppcls/metric/__init__.py +0 -51
  1430. paddlex/ppcls/metric/metrics.py +0 -308
  1431. paddlex/ppcls/optimizer/__init__.py +0 -72
  1432. paddlex/ppcls/optimizer/learning_rate.py +0 -326
  1433. paddlex/ppcls/optimizer/optimizer.py +0 -208
  1434. paddlex/ppcls/utils/__init__.py +0 -27
  1435. paddlex/ppcls/utils/check.py +0 -151
  1436. paddlex/ppcls/utils/config.py +0 -210
  1437. paddlex/ppcls/utils/download.py +0 -319
  1438. paddlex/ppcls/utils/ema.py +0 -63
  1439. paddlex/ppcls/utils/logger.py +0 -137
  1440. paddlex/ppcls/utils/metrics.py +0 -112
  1441. paddlex/ppcls/utils/misc.py +0 -63
  1442. paddlex/ppcls/utils/model_zoo.py +0 -213
  1443. paddlex/ppcls/utils/profiler.py +0 -111
  1444. paddlex/ppcls/utils/save_load.py +0 -136
  1445. paddlex/ppdet/__init__.py +0 -16
  1446. paddlex/ppdet/core/__init__.py +0 -15
  1447. paddlex/ppdet/core/config/__init__.py +0 -13
  1448. paddlex/ppdet/core/config/schema.py +0 -248
  1449. paddlex/ppdet/core/config/yaml_helpers.py +0 -118
  1450. paddlex/ppdet/core/workspace.py +0 -278
  1451. paddlex/ppdet/data/__init__.py +0 -21
  1452. paddlex/ppdet/data/crop_utils/__init__.py +0 -13
  1453. paddlex/ppdet/data/crop_utils/annotation_cropper.py +0 -585
  1454. paddlex/ppdet/data/crop_utils/chip_box_utils.py +0 -170
  1455. paddlex/ppdet/data/reader.py +0 -302
  1456. paddlex/ppdet/data/shm_utils.py +0 -67
  1457. paddlex/ppdet/data/source/__init__.py +0 -29
  1458. paddlex/ppdet/data/source/category.py +0 -904
  1459. paddlex/ppdet/data/source/coco.py +0 -251
  1460. paddlex/ppdet/data/source/dataset.py +0 -197
  1461. paddlex/ppdet/data/source/keypoint_coco.py +0 -669
  1462. paddlex/ppdet/data/source/mot.py +0 -636
  1463. paddlex/ppdet/data/source/sniper_coco.py +0 -191
  1464. paddlex/ppdet/data/source/voc.py +0 -231
  1465. paddlex/ppdet/data/source/widerface.py +0 -180
  1466. paddlex/ppdet/data/transform/__init__.py +0 -28
  1467. paddlex/ppdet/data/transform/atss_assigner.py +0 -270
  1468. paddlex/ppdet/data/transform/autoaugment_utils.py +0 -1591
  1469. paddlex/ppdet/data/transform/batch_operators.py +0 -1080
  1470. paddlex/ppdet/data/transform/gridmask_utils.py +0 -86
  1471. paddlex/ppdet/data/transform/keypoint_operators.py +0 -868
  1472. paddlex/ppdet/data/transform/mot_operators.py +0 -628
  1473. paddlex/ppdet/data/transform/op_helper.py +0 -498
  1474. paddlex/ppdet/data/transform/operators.py +0 -3025
  1475. paddlex/ppdet/engine/__init__.py +0 -30
  1476. paddlex/ppdet/engine/callbacks.py +0 -340
  1477. paddlex/ppdet/engine/env.py +0 -50
  1478. paddlex/ppdet/engine/export_utils.py +0 -177
  1479. paddlex/ppdet/engine/tracker.py +0 -538
  1480. paddlex/ppdet/engine/trainer.py +0 -723
  1481. paddlex/ppdet/metrics/__init__.py +0 -29
  1482. paddlex/ppdet/metrics/coco_utils.py +0 -184
  1483. paddlex/ppdet/metrics/json_results.py +0 -149
  1484. paddlex/ppdet/metrics/keypoint_metrics.py +0 -401
  1485. paddlex/ppdet/metrics/map_utils.py +0 -444
  1486. paddlex/ppdet/metrics/mcmot_metrics.py +0 -470
  1487. paddlex/ppdet/metrics/metrics.py +0 -434
  1488. paddlex/ppdet/metrics/mot_metrics.py +0 -1236
  1489. paddlex/ppdet/metrics/munkres.py +0 -428
  1490. paddlex/ppdet/metrics/widerface_utils.py +0 -393
  1491. paddlex/ppdet/model_zoo/__init__.py +0 -18
  1492. paddlex/ppdet/model_zoo/model_zoo.py +0 -84
  1493. paddlex/ppdet/modeling/__init__.py +0 -45
  1494. paddlex/ppdet/modeling/architectures/__init__.py +0 -51
  1495. paddlex/ppdet/modeling/architectures/blazeface.py +0 -91
  1496. paddlex/ppdet/modeling/architectures/cascade_rcnn.py +0 -144
  1497. paddlex/ppdet/modeling/architectures/centernet.py +0 -108
  1498. paddlex/ppdet/modeling/architectures/deepsort.py +0 -69
  1499. paddlex/ppdet/modeling/architectures/detr.py +0 -93
  1500. paddlex/ppdet/modeling/architectures/fairmot.py +0 -100
  1501. paddlex/ppdet/modeling/architectures/faster_rcnn.py +0 -106
  1502. paddlex/ppdet/modeling/architectures/fcos.py +0 -105
  1503. paddlex/ppdet/modeling/architectures/gfl.py +0 -87
  1504. paddlex/ppdet/modeling/architectures/jde.py +0 -111
  1505. paddlex/ppdet/modeling/architectures/keypoint_hrhrnet.py +0 -287
  1506. paddlex/ppdet/modeling/architectures/keypoint_hrnet.py +0 -267
  1507. paddlex/ppdet/modeling/architectures/mask_rcnn.py +0 -135
  1508. paddlex/ppdet/modeling/architectures/meta_arch.py +0 -128
  1509. paddlex/ppdet/modeling/architectures/picodet.py +0 -91
  1510. paddlex/ppdet/modeling/architectures/s2anet.py +0 -102
  1511. paddlex/ppdet/modeling/architectures/solov2.py +0 -110
  1512. paddlex/ppdet/modeling/architectures/sparse_rcnn.py +0 -99
  1513. paddlex/ppdet/modeling/architectures/ssd.py +0 -93
  1514. paddlex/ppdet/modeling/architectures/tood.py +0 -78
  1515. paddlex/ppdet/modeling/architectures/ttfnet.py +0 -98
  1516. paddlex/ppdet/modeling/architectures/yolo.py +0 -124
  1517. paddlex/ppdet/modeling/assigners/__init__.py +0 -23
  1518. paddlex/ppdet/modeling/assigners/atss_assigner.py +0 -211
  1519. paddlex/ppdet/modeling/assigners/simota_assigner.py +0 -262
  1520. paddlex/ppdet/modeling/assigners/task_aligned_assigner.py +0 -158
  1521. paddlex/ppdet/modeling/assigners/utils.py +0 -195
  1522. paddlex/ppdet/modeling/backbones/__init__.py +0 -49
  1523. paddlex/ppdet/modeling/backbones/blazenet.py +0 -323
  1524. paddlex/ppdet/modeling/backbones/darknet.py +0 -340
  1525. paddlex/ppdet/modeling/backbones/dla.py +0 -244
  1526. paddlex/ppdet/modeling/backbones/esnet.py +0 -290
  1527. paddlex/ppdet/modeling/backbones/ghostnet.py +0 -470
  1528. paddlex/ppdet/modeling/backbones/hardnet.py +0 -224
  1529. paddlex/ppdet/modeling/backbones/hrnet.py +0 -727
  1530. paddlex/ppdet/modeling/backbones/lcnet.py +0 -259
  1531. paddlex/ppdet/modeling/backbones/lite_hrnet.py +0 -886
  1532. paddlex/ppdet/modeling/backbones/mobilenet_v1.py +0 -418
  1533. paddlex/ppdet/modeling/backbones/mobilenet_v3.py +0 -483
  1534. paddlex/ppdet/modeling/backbones/name_adapter.py +0 -69
  1535. paddlex/ppdet/modeling/backbones/res2net.py +0 -358
  1536. paddlex/ppdet/modeling/backbones/resnet.py +0 -613
  1537. paddlex/ppdet/modeling/backbones/senet.py +0 -139
  1538. paddlex/ppdet/modeling/backbones/shufflenet_v2.py +0 -246
  1539. paddlex/ppdet/modeling/backbones/swin_transformer.py +0 -743
  1540. paddlex/ppdet/modeling/backbones/vgg.py +0 -210
  1541. paddlex/ppdet/modeling/bbox_utils.py +0 -778
  1542. paddlex/ppdet/modeling/heads/__init__.py +0 -53
  1543. paddlex/ppdet/modeling/heads/bbox_head.py +0 -377
  1544. paddlex/ppdet/modeling/heads/cascade_head.py +0 -284
  1545. paddlex/ppdet/modeling/heads/centernet_head.py +0 -292
  1546. paddlex/ppdet/modeling/heads/detr_head.py +0 -368
  1547. paddlex/ppdet/modeling/heads/face_head.py +0 -110
  1548. paddlex/ppdet/modeling/heads/fcos_head.py +0 -259
  1549. paddlex/ppdet/modeling/heads/gfl_head.py +0 -487
  1550. paddlex/ppdet/modeling/heads/keypoint_hrhrnet_head.py +0 -108
  1551. paddlex/ppdet/modeling/heads/mask_head.py +0 -250
  1552. paddlex/ppdet/modeling/heads/pico_head.py +0 -278
  1553. paddlex/ppdet/modeling/heads/roi_extractor.py +0 -111
  1554. paddlex/ppdet/modeling/heads/s2anet_head.py +0 -1056
  1555. paddlex/ppdet/modeling/heads/simota_head.py +0 -506
  1556. paddlex/ppdet/modeling/heads/solov2_head.py +0 -560
  1557. paddlex/ppdet/modeling/heads/sparsercnn_head.py +0 -375
  1558. paddlex/ppdet/modeling/heads/ssd_head.py +0 -215
  1559. paddlex/ppdet/modeling/heads/tood_head.py +0 -366
  1560. paddlex/ppdet/modeling/heads/ttf_head.py +0 -316
  1561. paddlex/ppdet/modeling/heads/yolo_head.py +0 -124
  1562. paddlex/ppdet/modeling/initializer.py +0 -317
  1563. paddlex/ppdet/modeling/keypoint_utils.py +0 -342
  1564. paddlex/ppdet/modeling/layers.py +0 -1430
  1565. paddlex/ppdet/modeling/losses/__init__.py +0 -43
  1566. paddlex/ppdet/modeling/losses/ctfocal_loss.py +0 -68
  1567. paddlex/ppdet/modeling/losses/detr_loss.py +0 -233
  1568. paddlex/ppdet/modeling/losses/fairmot_loss.py +0 -41
  1569. paddlex/ppdet/modeling/losses/fcos_loss.py +0 -225
  1570. paddlex/ppdet/modeling/losses/gfocal_loss.py +0 -217
  1571. paddlex/ppdet/modeling/losses/iou_aware_loss.py +0 -47
  1572. paddlex/ppdet/modeling/losses/iou_loss.py +0 -210
  1573. paddlex/ppdet/modeling/losses/jde_loss.py +0 -193
  1574. paddlex/ppdet/modeling/losses/keypoint_loss.py +0 -229
  1575. paddlex/ppdet/modeling/losses/solov2_loss.py +0 -101
  1576. paddlex/ppdet/modeling/losses/sparsercnn_loss.py +0 -425
  1577. paddlex/ppdet/modeling/losses/ssd_loss.py +0 -170
  1578. paddlex/ppdet/modeling/losses/varifocal_loss.py +0 -152
  1579. paddlex/ppdet/modeling/losses/yolo_loss.py +0 -212
  1580. paddlex/ppdet/modeling/mot/__init__.py +0 -25
  1581. paddlex/ppdet/modeling/mot/matching/__init__.py +0 -19
  1582. paddlex/ppdet/modeling/mot/matching/deepsort_matching.py +0 -382
  1583. paddlex/ppdet/modeling/mot/matching/jde_matching.py +0 -144
  1584. paddlex/ppdet/modeling/mot/motion/__init__.py +0 -17
  1585. paddlex/ppdet/modeling/mot/motion/kalman_filter.py +0 -270
  1586. paddlex/ppdet/modeling/mot/tracker/__init__.py +0 -23
  1587. paddlex/ppdet/modeling/mot/tracker/base_jde_tracker.py +0 -297
  1588. paddlex/ppdet/modeling/mot/tracker/base_sde_tracker.py +0 -156
  1589. paddlex/ppdet/modeling/mot/tracker/deepsort_tracker.py +0 -188
  1590. paddlex/ppdet/modeling/mot/tracker/jde_tracker.py +0 -277
  1591. paddlex/ppdet/modeling/mot/utils.py +0 -263
  1592. paddlex/ppdet/modeling/mot/visualization.py +0 -150
  1593. paddlex/ppdet/modeling/necks/__init__.py +0 -30
  1594. paddlex/ppdet/modeling/necks/bifpn.py +0 -302
  1595. paddlex/ppdet/modeling/necks/blazeface_fpn.py +0 -216
  1596. paddlex/ppdet/modeling/necks/centernet_fpn.py +0 -426
  1597. paddlex/ppdet/modeling/necks/csp_pan.py +0 -364
  1598. paddlex/ppdet/modeling/necks/fpn.py +0 -231
  1599. paddlex/ppdet/modeling/necks/hrfpn.py +0 -126
  1600. paddlex/ppdet/modeling/necks/ttf_fpn.py +0 -242
  1601. paddlex/ppdet/modeling/necks/yolo_fpn.py +0 -988
  1602. paddlex/ppdet/modeling/ops.py +0 -1611
  1603. paddlex/ppdet/modeling/post_process.py +0 -731
  1604. paddlex/ppdet/modeling/proposal_generator/__init__.py +0 -2
  1605. paddlex/ppdet/modeling/proposal_generator/anchor_generator.py +0 -135
  1606. paddlex/ppdet/modeling/proposal_generator/proposal_generator.py +0 -77
  1607. paddlex/ppdet/modeling/proposal_generator/rpn_head.py +0 -260
  1608. paddlex/ppdet/modeling/proposal_generator/target.py +0 -681
  1609. paddlex/ppdet/modeling/proposal_generator/target_layer.py +0 -491
  1610. paddlex/ppdet/modeling/reid/__init__.py +0 -25
  1611. paddlex/ppdet/modeling/reid/fairmot_embedding_head.py +0 -225
  1612. paddlex/ppdet/modeling/reid/jde_embedding_head.py +0 -214
  1613. paddlex/ppdet/modeling/reid/pplcnet_embedding.py +0 -282
  1614. paddlex/ppdet/modeling/reid/pyramidal_embedding.py +0 -144
  1615. paddlex/ppdet/modeling/reid/resnet.py +0 -310
  1616. paddlex/ppdet/modeling/shape_spec.py +0 -25
  1617. paddlex/ppdet/modeling/transformers/__init__.py +0 -25
  1618. paddlex/ppdet/modeling/transformers/deformable_transformer.py +0 -517
  1619. paddlex/ppdet/modeling/transformers/detr_transformer.py +0 -353
  1620. paddlex/ppdet/modeling/transformers/matchers.py +0 -127
  1621. paddlex/ppdet/modeling/transformers/position_encoding.py +0 -108
  1622. paddlex/ppdet/modeling/transformers/utils.py +0 -110
  1623. paddlex/ppdet/optimizer.py +0 -335
  1624. paddlex/ppdet/slim/__init__.py +0 -82
  1625. paddlex/ppdet/slim/distill.py +0 -110
  1626. paddlex/ppdet/slim/prune.py +0 -85
  1627. paddlex/ppdet/slim/quant.py +0 -84
  1628. paddlex/ppdet/slim/unstructured_prune.py +0 -66
  1629. paddlex/ppdet/utils/__init__.py +0 -13
  1630. paddlex/ppdet/utils/check.py +0 -112
  1631. paddlex/ppdet/utils/checkpoint.py +0 -226
  1632. paddlex/ppdet/utils/cli.py +0 -151
  1633. paddlex/ppdet/utils/colormap.py +0 -58
  1634. paddlex/ppdet/utils/download.py +0 -558
  1635. paddlex/ppdet/utils/logger.py +0 -70
  1636. paddlex/ppdet/utils/profiler.py +0 -111
  1637. paddlex/ppdet/utils/stats.py +0 -94
  1638. paddlex/ppdet/utils/visualizer.py +0 -321
  1639. paddlex/ppdet/utils/voc_utils.py +0 -86
  1640. paddlex/seg.py +0 -41
  1641. paddlex/tools/__init__.py +0 -17
  1642. paddlex/tools/anchor_clustering/__init__.py +0 -15
  1643. paddlex/tools/anchor_clustering/yolo_cluster.py +0 -178
  1644. paddlex/tools/convert.py +0 -52
  1645. paddlex/tools/dataset_conversion/__init__.py +0 -24
  1646. paddlex/tools/dataset_conversion/x2coco.py +0 -379
  1647. paddlex/tools/dataset_conversion/x2imagenet.py +0 -82
  1648. paddlex/tools/dataset_conversion/x2seg.py +0 -343
  1649. paddlex/tools/dataset_conversion/x2voc.py +0 -230
  1650. paddlex/tools/dataset_split/__init__.py +0 -23
  1651. paddlex/tools/dataset_split/coco_split.py +0 -69
  1652. paddlex/tools/dataset_split/imagenet_split.py +0 -75
  1653. paddlex/tools/dataset_split/seg_split.py +0 -96
  1654. paddlex/tools/dataset_split/utils.py +0 -75
  1655. paddlex/tools/dataset_split/voc_split.py +0 -91
  1656. paddlex/tools/split.py +0 -41
  1657. paddlex/utils/checkpoint.py +0 -492
  1658. paddlex/utils/shm.py +0 -67
  1659. paddlex/utils/stats.py +0 -68
  1660. paddlex/utils/utils.py +0 -229
  1661. paddlex-2.1.0.data/data/paddlex_restful/restful/templates/paddlex_restful_demo.html +0 -5205
  1662. paddlex-2.1.0.dist-info/LICENSE +0 -201
  1663. paddlex-2.1.0.dist-info/METADATA +0 -32
  1664. paddlex-2.1.0.dist-info/RECORD +0 -698
  1665. paddlex-2.1.0.dist-info/WHEEL +0 -5
  1666. paddlex-2.1.0.dist-info/entry_points.txt +0 -4
  1667. paddlex-2.1.0.dist-info/top_level.txt +0 -3
  1668. paddlex_restful/__init__.py +0 -15
  1669. paddlex_restful/command.py +0 -63
  1670. paddlex_restful/restful/__init__.py +0 -15
  1671. paddlex_restful/restful/app.py +0 -969
  1672. paddlex_restful/restful/dataset/__init__.py +0 -13
  1673. paddlex_restful/restful/dataset/cls_dataset.py +0 -159
  1674. paddlex_restful/restful/dataset/dataset.py +0 -266
  1675. paddlex_restful/restful/dataset/datasetbase.py +0 -86
  1676. paddlex_restful/restful/dataset/det_dataset.py +0 -190
  1677. paddlex_restful/restful/dataset/ins_seg_dataset.py +0 -312
  1678. paddlex_restful/restful/dataset/operate.py +0 -155
  1679. paddlex_restful/restful/dataset/seg_dataset.py +0 -222
  1680. paddlex_restful/restful/dataset/utils.py +0 -267
  1681. paddlex_restful/restful/demo.py +0 -202
  1682. paddlex_restful/restful/dir.py +0 -45
  1683. paddlex_restful/restful/model.py +0 -312
  1684. paddlex_restful/restful/project/__init__.py +0 -13
  1685. paddlex_restful/restful/project/evaluate/__init__.py +0 -13
  1686. paddlex_restful/restful/project/evaluate/classification.py +0 -126
  1687. paddlex_restful/restful/project/evaluate/detection.py +0 -789
  1688. paddlex_restful/restful/project/evaluate/draw_pred_result.py +0 -181
  1689. paddlex_restful/restful/project/evaluate/segmentation.py +0 -122
  1690. paddlex_restful/restful/project/operate.py +0 -931
  1691. paddlex_restful/restful/project/project.py +0 -143
  1692. paddlex_restful/restful/project/prune/__init__.py +0 -13
  1693. paddlex_restful/restful/project/prune/classification.py +0 -32
  1694. paddlex_restful/restful/project/prune/detection.py +0 -48
  1695. paddlex_restful/restful/project/prune/segmentation.py +0 -34
  1696. paddlex_restful/restful/project/task.py +0 -884
  1697. paddlex_restful/restful/project/train/__init__.py +0 -13
  1698. paddlex_restful/restful/project/train/classification.py +0 -141
  1699. paddlex_restful/restful/project/train/detection.py +0 -263
  1700. paddlex_restful/restful/project/train/params.py +0 -432
  1701. paddlex_restful/restful/project/train/params_v2.py +0 -326
  1702. paddlex_restful/restful/project/train/segmentation.py +0 -191
  1703. paddlex_restful/restful/project/visualize.py +0 -244
  1704. paddlex_restful/restful/system.py +0 -102
  1705. paddlex_restful/restful/templates/paddlex_restful_demo.html +0 -5205
  1706. paddlex_restful/restful/utils.py +0 -841
  1707. paddlex_restful/restful/workspace.py +0 -343
  1708. paddlex_restful/restful/workspace_pb2.py +0 -1411
@@ -1,3025 +0,0 @@
1
- # Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
2
- #
3
- # Licensed under the Apache License, Version 2.0 (the "License");
4
- # you may not use this file except in compliance with the License.
5
- # You may obtain a copy of the License at
6
- #
7
- # http://www.apache.org/licenses/LICENSE-2.0
8
- #
9
- # Unless required by applicable law or agreed to in writing, software
10
- # distributed under the License is distributed on an "AS IS" BASIS,
11
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
- # See the License for the specific language governing permissions and
13
- # limitations under the License.
14
-
15
- # function:
16
- # operators to process sample,
17
- # eg: decode/resize/crop image
18
-
19
- from __future__ import absolute_import
20
- from __future__ import print_function
21
- from __future__ import division
22
-
23
- try:
24
- from collections.abc import Sequence
25
- except Exception:
26
- from collections import Sequence
27
-
28
- from numbers import Number, Integral
29
-
30
- import uuid
31
- import random
32
- import math
33
- import numpy as np
34
- import os
35
- import copy
36
- import logging
37
- import cv2
38
- from PIL import Image, ImageDraw
39
- import pickle
40
- import threading
41
- MUTEX = threading.Lock()
42
-
43
- from paddlex.ppdet.core.workspace import serializable
44
- from paddlex.ppdet.modeling import bbox_utils
45
- from ..reader import Compose
46
-
47
- from .op_helper import (satisfy_sample_constraint, filter_and_process,
48
- generate_sample_bbox, clip_bbox, data_anchor_sampling,
49
- satisfy_sample_constraint_coverage,
50
- crop_image_sampling, generate_sample_bbox_square,
51
- bbox_area_sampling, is_poly, get_border)
52
-
53
- from paddlex.ppdet.utils.logger import setup_logger
54
- from paddlex.ppdet.modeling.keypoint_utils import get_affine_transform, affine_transform
55
- logger = setup_logger(__name__)
56
-
57
- registered_ops = []
58
-
59
-
60
- def register_op(cls):
61
- registered_ops.append(cls.__name__)
62
- if not hasattr(BaseOperator, cls.__name__):
63
- setattr(BaseOperator, cls.__name__, cls)
64
- else:
65
- raise KeyError("The {} class has been registered.".format(
66
- cls.__name__))
67
- return serializable(cls)
68
-
69
-
70
- class BboxError(ValueError):
71
- pass
72
-
73
-
74
- class ImageError(ValueError):
75
- pass
76
-
77
-
78
- class BaseOperator(object):
79
- def __init__(self, name=None):
80
- if name is None:
81
- name = self.__class__.__name__
82
- self._id = name + '_' + str(uuid.uuid4())[-6:]
83
-
84
- def apply(self, sample, context=None):
85
- """ Process a sample.
86
- Args:
87
- sample (dict): a dict of sample, eg: {'image':xx, 'label': xxx}
88
- context (dict): info about this sample processing
89
- Returns:
90
- result (dict): a processed sample
91
- """
92
- return sample
93
-
94
- def __call__(self, sample, context=None):
95
- """ Process a sample.
96
- Args:
97
- sample (dict): a dict of sample, eg: {'image':xx, 'label': xxx}
98
- context (dict): info about this sample processing
99
- Returns:
100
- result (dict): a processed sample
101
- """
102
- if isinstance(sample, Sequence):
103
- for i in range(len(sample)):
104
- sample[i] = self.apply(sample[i], context)
105
- else:
106
- sample = self.apply(sample, context)
107
- return sample
108
-
109
- def __str__(self):
110
- return str(self._id)
111
-
112
-
113
- @register_op
114
- class Decode(BaseOperator):
115
- def __init__(self):
116
- """ Transform the image data to numpy format following the rgb format
117
- """
118
- super(Decode, self).__init__()
119
-
120
- def apply(self, sample, context=None):
121
- """ load image if 'im_file' field is not empty but 'image' is"""
122
- if 'image' not in sample:
123
- with open(sample['im_file'], 'rb') as f:
124
- sample['image'] = f.read()
125
- sample.pop('im_file')
126
-
127
- im = sample['image']
128
- data = np.frombuffer(im, dtype='uint8')
129
- im = cv2.imdecode(data, 1) # BGR mode, but need RGB mode
130
- if 'keep_ori_im' in sample and sample['keep_ori_im']:
131
- sample['ori_image'] = im
132
- im = cv2.cvtColor(im, cv2.COLOR_BGR2RGB)
133
-
134
- sample['image'] = im
135
- if 'h' not in sample:
136
- sample['h'] = im.shape[0]
137
- elif sample['h'] != im.shape[0]:
138
- logger.warning(
139
- "The actual image height: {} is not equal to the "
140
- "height: {} in annotation, and update sample['h'] by actual "
141
- "image height.".format(im.shape[0], sample['h']))
142
- sample['h'] = im.shape[0]
143
- if 'w' not in sample:
144
- sample['w'] = im.shape[1]
145
- elif sample['w'] != im.shape[1]:
146
- logger.warning(
147
- "The actual image width: {} is not equal to the "
148
- "width: {} in annotation, and update sample['w'] by actual "
149
- "image width.".format(im.shape[1], sample['w']))
150
- sample['w'] = im.shape[1]
151
-
152
- sample['im_shape'] = np.array(im.shape[:2], dtype=np.float32)
153
- sample['scale_factor'] = np.array([1., 1.], dtype=np.float32)
154
- return sample
155
-
156
-
157
- def _make_dirs(dirname):
158
- try:
159
- from pathlib import Path
160
- except ImportError:
161
- from pathlib2 import Path
162
- Path(dirname).mkdir(exist_ok=True)
163
-
164
-
165
- @register_op
166
- class DecodeCache(BaseOperator):
167
- def __init__(self, cache_root=None):
168
- '''Decode the image and cache the decoded result.
169
- '''
170
- super(DecodeCache, self).__init__()
171
-
172
- self.use_cache = False if cache_root is None else True
173
- self.cache_root = cache_root
174
-
175
- if cache_root is not None:
176
- _make_dirs(cache_root)
177
-
178
- def apply(self, sample, context=None):
179
-
180
- if self.use_cache and os.path.exists(
181
- self.cache_path(self.cache_root, sample['im_file'])):
182
- path = self.cache_path(self.cache_root, sample['im_file'])
183
- im = self.load(path)
184
-
185
- else:
186
- if 'image' not in sample:
187
- with open(sample['im_file'], 'rb') as f:
188
- sample['image'] = f.read()
189
-
190
- im = sample['image']
191
- data = np.frombuffer(im, dtype='uint8')
192
- im = cv2.imdecode(data, 1) # BGR mode, but need RGB mode
193
- if 'keep_ori_im' in sample and sample['keep_ori_im']:
194
- sample['ori_image'] = im
195
- im = cv2.cvtColor(im, cv2.COLOR_BGR2RGB)
196
-
197
- if self.use_cache and not os.path.exists(
198
- self.cache_path(self.cache_root, sample['im_file'])):
199
- path = self.cache_path(self.cache_root, sample['im_file'])
200
- self.dump(im, path)
201
-
202
- sample['image'] = im
203
- sample['h'] = im.shape[0]
204
- sample['w'] = im.shape[1]
205
-
206
- sample['im_shape'] = np.array(im.shape[:2], dtype=np.float32)
207
- sample['scale_factor'] = np.array([1., 1.], dtype=np.float32)
208
-
209
- sample.pop('im_file')
210
-
211
- return sample
212
-
213
- @staticmethod
214
- def cache_path(dir_root, im_file):
215
- return os.path.join(dir_root, os.path.basename(im_file) + '.pkl')
216
-
217
- @staticmethod
218
- def load(path):
219
- with open(path, 'rb') as f:
220
- im = pickle.load(f)
221
- return im
222
-
223
- @staticmethod
224
- def dump(obj, path):
225
- MUTEX.acquire()
226
- try:
227
- with open(path, 'wb') as f:
228
- pickle.dump(obj, f)
229
-
230
- except Exception as e:
231
- logger.warning('dump {} occurs exception {}'.format(path, str(e)))
232
-
233
- finally:
234
- MUTEX.release()
235
-
236
-
237
- @register_op
238
- class SniperDecodeCrop(BaseOperator):
239
- def __init__(self):
240
- super(SniperDecodeCrop, self).__init__()
241
-
242
- def __call__(self, sample, context=None):
243
- if 'image' not in sample:
244
- with open(sample['im_file'], 'rb') as f:
245
- sample['image'] = f.read()
246
- sample.pop('im_file')
247
-
248
- im = sample['image']
249
- data = np.frombuffer(im, dtype='uint8')
250
- im = cv2.imdecode(data,
251
- cv2.IMREAD_COLOR) # BGR mode, but need RGB mode
252
- if 'keep_ori_im' in sample and sample['keep_ori_im']:
253
- sample['ori_image'] = im
254
- im = cv2.cvtColor(im, cv2.COLOR_BGR2RGB)
255
-
256
- chip = sample['chip']
257
- x1, y1, x2, y2 = [int(xi) for xi in chip]
258
- im = im[max(y1, 0):min(y2, im.shape[0]), max(x1, 0):min(x2, im.shape[
259
- 1]), :]
260
-
261
- sample['image'] = im
262
- h = im.shape[0]
263
- w = im.shape[1]
264
- # sample['im_info'] = [h, w, 1.0]
265
- sample['h'] = h
266
- sample['w'] = w
267
-
268
- sample['im_shape'] = np.array(im.shape[:2], dtype=np.float32)
269
- sample['scale_factor'] = np.array([1., 1.], dtype=np.float32)
270
- return sample
271
-
272
-
273
- @register_op
274
- class Permute(BaseOperator):
275
- def __init__(self):
276
- """
277
- Change the channel to be (C, H, W)
278
- """
279
- super(Permute, self).__init__()
280
-
281
- def apply(self, sample, context=None):
282
- im = sample['image']
283
- im = im.transpose((2, 0, 1))
284
- sample['image'] = im
285
- return sample
286
-
287
-
288
- @register_op
289
- class Lighting(BaseOperator):
290
- """
291
- Lighting the image by eigenvalues and eigenvectors
292
- Args:
293
- eigval (list): eigenvalues
294
- eigvec (list): eigenvectors
295
- alphastd (float): random weight of lighting, 0.1 by default
296
- """
297
-
298
- def __init__(self, eigval, eigvec, alphastd=0.1):
299
- super(Lighting, self).__init__()
300
- self.alphastd = alphastd
301
- self.eigval = np.array(eigval).astype('float32')
302
- self.eigvec = np.array(eigvec).astype('float32')
303
-
304
- def apply(self, sample, context=None):
305
- alpha = np.random.normal(scale=self.alphastd, size=(3, ))
306
- sample['image'] += np.dot(self.eigvec, self.eigval * alpha)
307
- return sample
308
-
309
-
310
- @register_op
311
- class RandomErasingImage(BaseOperator):
312
- def __init__(self, prob=0.5, lower=0.02, higher=0.4, aspect_ratio=0.3):
313
- """
314
- Random Erasing Data Augmentation, see https://arxiv.org/abs/1708.04896
315
- Args:
316
- prob (float): probability to carry out random erasing
317
- lower (float): lower limit of the erasing area ratio
318
- higher (float): upper limit of the erasing area ratio
319
- aspect_ratio (float): aspect ratio of the erasing region
320
- """
321
- super(RandomErasingImage, self).__init__()
322
- self.prob = prob
323
- self.lower = lower
324
- self.higher = higher
325
- self.aspect_ratio = aspect_ratio
326
-
327
- def apply(self, sample):
328
- gt_bbox = sample['gt_bbox']
329
- im = sample['image']
330
- if not isinstance(im, np.ndarray):
331
- raise TypeError("{}: image is not a numpy array.".format(self))
332
- if len(im.shape) != 3:
333
- raise ImageError("{}: image is not 3-dimensional.".format(self))
334
-
335
- for idx in range(gt_bbox.shape[0]):
336
- if self.prob <= np.random.rand():
337
- continue
338
-
339
- x1, y1, x2, y2 = gt_bbox[idx, :]
340
- w_bbox = x2 - x1
341
- h_bbox = y2 - y1
342
- area = w_bbox * h_bbox
343
-
344
- target_area = random.uniform(self.lower, self.higher) * area
345
- aspect_ratio = random.uniform(self.aspect_ratio,
346
- 1 / self.aspect_ratio)
347
-
348
- h = int(round(math.sqrt(target_area * aspect_ratio)))
349
- w = int(round(math.sqrt(target_area / aspect_ratio)))
350
-
351
- if w < w_bbox and h < h_bbox:
352
- off_y1 = random.randint(0, int(h_bbox - h))
353
- off_x1 = random.randint(0, int(w_bbox - w))
354
- im[int(y1 + off_y1):int(y1 + off_y1 + h), int(x1 + off_x1):int(
355
- x1 + off_x1 + w), :] = 0
356
- sample['image'] = im
357
- return sample
358
-
359
-
360
- @register_op
361
- class NormalizeImage(BaseOperator):
362
- def __init__(self,
363
- mean=[0.485, 0.456, 0.406],
364
- std=[1, 1, 1],
365
- is_scale=True):
366
- """
367
- Args:
368
- mean (list): the pixel mean
369
- std (list): the pixel standard deviation
370
- """
371
- super(NormalizeImage, self).__init__()
372
- self.mean = mean
373
- self.std = std
374
- self.is_scale = is_scale
375
- if not (isinstance(self.mean, list) and isinstance(self.std, list) and
376
- isinstance(self.is_scale, bool)):
377
- raise TypeError("{}: input type is invalid.".format(self))
378
- from functools import reduce
379
- if reduce(lambda x, y: x * y, self.std) == 0:
380
- raise ValueError('{}: std is invalid!'.format(self))
381
-
382
- def apply(self, sample, context=None):
383
- """Normalize the image.
384
- Operators:
385
- 1.(optional) Scale the image to [0,1]
386
- 2. Each pixel minus mean and is divided by std
387
- """
388
- im = sample['image']
389
- im = im.astype(np.float32, copy=False)
390
- mean = np.array(self.mean)[np.newaxis, np.newaxis, :]
391
- std = np.array(self.std)[np.newaxis, np.newaxis, :]
392
-
393
- if self.is_scale:
394
- im = im / 255.0
395
-
396
- im -= mean
397
- im /= std
398
-
399
- sample['image'] = im
400
- return sample
401
-
402
-
403
- @register_op
404
- class GridMask(BaseOperator):
405
- def __init__(self,
406
- use_h=True,
407
- use_w=True,
408
- rotate=1,
409
- offset=False,
410
- ratio=0.5,
411
- mode=1,
412
- prob=0.7,
413
- upper_iter=360000):
414
- """
415
- GridMask Data Augmentation, see https://arxiv.org/abs/2001.04086
416
- Args:
417
- use_h (bool): whether to mask vertically
418
- use_w (bool): whether to mask horizontally
419
- rotate (float): angle for the mask to rotate
420
- offset (bool): whether to offset the mask
421
- ratio (float): mask ratio
422
- mode (int): gridmask mode
423
- prob (float): max probability to carry out gridmask
424
- upper_iter (int): suggested to be equal to global max_iter
425
- """
426
- super(GridMask, self).__init__()
427
- self.use_h = use_h
428
- self.use_w = use_w
429
- self.rotate = rotate
430
- self.offset = offset
431
- self.ratio = ratio
432
- self.mode = mode
433
- self.prob = prob
434
- self.upper_iter = upper_iter
435
-
436
- from .gridmask_utils import Gridmask
437
- self.gridmask_op = Gridmask(
438
- use_h,
439
- use_w,
440
- rotate=rotate,
441
- offset=offset,
442
- ratio=ratio,
443
- mode=mode,
444
- prob=prob,
445
- upper_iter=upper_iter)
446
-
447
- def apply(self, sample, context=None):
448
- sample['image'] = self.gridmask_op(sample['image'],
449
- sample['curr_iter'])
450
- return sample
451
-
452
-
453
- @register_op
454
- class RandomDistort(BaseOperator):
455
- """Random color distortion.
456
- Args:
457
- hue (list): hue settings. in [lower, upper, probability] format.
458
- saturation (list): saturation settings. in [lower, upper, probability] format.
459
- contrast (list): contrast settings. in [lower, upper, probability] format.
460
- brightness (list): brightness settings. in [lower, upper, probability] format.
461
- random_apply (bool): whether to apply in random (yolo) or fixed (SSD)
462
- order.
463
- count (int): the number of distortions to apply
464
- random_channel (bool): whether to swap channels randomly
465
- """
466
-
467
- def __init__(self,
468
- hue=[-18, 18, 0.5],
469
- saturation=[0.5, 1.5, 0.5],
470
- contrast=[0.5, 1.5, 0.5],
471
- brightness=[0.5, 1.5, 0.5],
472
- random_apply=True,
473
- count=4,
474
- random_channel=False):
475
- super(RandomDistort, self).__init__()
476
- self.hue = hue
477
- self.saturation = saturation
478
- self.contrast = contrast
479
- self.brightness = brightness
480
- self.random_apply = random_apply
481
- self.count = count
482
- self.random_channel = random_channel
483
-
484
- def apply_hue(self, img):
485
- low, high, prob = self.hue
486
- if np.random.uniform(0., 1.) < prob:
487
- return img
488
-
489
- img = img.astype(np.float32)
490
- # it works, but result differ from HSV version
491
- delta = np.random.uniform(low, high)
492
- u = np.cos(delta * np.pi)
493
- w = np.sin(delta * np.pi)
494
- bt = np.array([[1.0, 0.0, 0.0], [0.0, u, -w], [0.0, w, u]])
495
- tyiq = np.array([[0.299, 0.587, 0.114], [0.596, -0.274, -0.321],
496
- [0.211, -0.523, 0.311]])
497
- ityiq = np.array([[1.0, 0.956, 0.621], [1.0, -0.272, -0.647],
498
- [1.0, -1.107, 1.705]])
499
- t = np.dot(np.dot(ityiq, bt), tyiq).T
500
- img = np.dot(img, t)
501
- return img
502
-
503
- def apply_saturation(self, img):
504
- low, high, prob = self.saturation
505
- if np.random.uniform(0., 1.) < prob:
506
- return img
507
- delta = np.random.uniform(low, high)
508
- img = img.astype(np.float32)
509
- # it works, but result differ from HSV version
510
- gray = img * np.array([[[0.299, 0.587, 0.114]]], dtype=np.float32)
511
- gray = gray.sum(axis=2, keepdims=True)
512
- gray *= (1.0 - delta)
513
- img *= delta
514
- img += gray
515
- return img
516
-
517
- def apply_contrast(self, img):
518
- low, high, prob = self.contrast
519
- if np.random.uniform(0., 1.) < prob:
520
- return img
521
- delta = np.random.uniform(low, high)
522
- img = img.astype(np.float32)
523
- img *= delta
524
- return img
525
-
526
- def apply_brightness(self, img):
527
- low, high, prob = self.brightness
528
- if np.random.uniform(0., 1.) < prob:
529
- return img
530
- delta = np.random.uniform(low, high)
531
- img = img.astype(np.float32)
532
- img += delta
533
- return img
534
-
535
- def apply(self, sample, context=None):
536
- img = sample['image']
537
- if self.random_apply:
538
- functions = [
539
- self.apply_brightness, self.apply_contrast,
540
- self.apply_saturation, self.apply_hue
541
- ]
542
- distortions = np.random.permutation(functions)[:self.count]
543
- for func in distortions:
544
- img = func(img)
545
- sample['image'] = img
546
- return sample
547
-
548
- img = self.apply_brightness(img)
549
- mode = np.random.randint(0, 2)
550
-
551
- if mode:
552
- img = self.apply_contrast(img)
553
-
554
- img = self.apply_saturation(img)
555
- img = self.apply_hue(img)
556
-
557
- if not mode:
558
- img = self.apply_contrast(img)
559
-
560
- if self.random_channel:
561
- if np.random.randint(0, 2):
562
- img = img[..., np.random.permutation(3)]
563
- sample['image'] = img
564
- return sample
565
-
566
-
567
- @register_op
568
- class AutoAugment(BaseOperator):
569
- def __init__(self, autoaug_type="v1"):
570
- """
571
- Args:
572
- autoaug_type (str): autoaug type, support v0, v1, v2, v3, test
573
- """
574
- super(AutoAugment, self).__init__()
575
- self.autoaug_type = autoaug_type
576
-
577
- def apply(self, sample, context=None):
578
- """
579
- Learning Data Augmentation Strategies for Object Detection, see https://arxiv.org/abs/1906.11172
580
- """
581
- im = sample['image']
582
- gt_bbox = sample['gt_bbox']
583
- if not isinstance(im, np.ndarray):
584
- raise TypeError("{}: image is not a numpy array.".format(self))
585
- if len(im.shape) != 3:
586
- raise ImageError("{}: image is not 3-dimensional.".format(self))
587
- if len(gt_bbox) == 0:
588
- return sample
589
-
590
- height, width, _ = im.shape
591
- norm_gt_bbox = np.ones_like(gt_bbox, dtype=np.float32)
592
- norm_gt_bbox[:, 0] = gt_bbox[:, 1] / float(height)
593
- norm_gt_bbox[:, 1] = gt_bbox[:, 0] / float(width)
594
- norm_gt_bbox[:, 2] = gt_bbox[:, 3] / float(height)
595
- norm_gt_bbox[:, 3] = gt_bbox[:, 2] / float(width)
596
-
597
- from .autoaugment_utils import distort_image_with_autoaugment
598
- im, norm_gt_bbox = distort_image_with_autoaugment(im, norm_gt_bbox,
599
- self.autoaug_type)
600
-
601
- gt_bbox[:, 0] = norm_gt_bbox[:, 1] * float(width)
602
- gt_bbox[:, 1] = norm_gt_bbox[:, 0] * float(height)
603
- gt_bbox[:, 2] = norm_gt_bbox[:, 3] * float(width)
604
- gt_bbox[:, 3] = norm_gt_bbox[:, 2] * float(height)
605
-
606
- sample['image'] = im
607
- sample['gt_bbox'] = gt_bbox
608
- return sample
609
-
610
-
611
- @register_op
612
- class RandomFlip(BaseOperator):
613
- def __init__(self, prob=0.5):
614
- """
615
- Args:
616
- prob (float): the probability of flipping image
617
- """
618
- super(RandomFlip, self).__init__()
619
- self.prob = prob
620
- if not (isinstance(self.prob, float)):
621
- raise TypeError("{}: input type is invalid.".format(self))
622
-
623
- def apply_segm(self, segms, height, width):
624
- def _flip_poly(poly, width):
625
- flipped_poly = np.array(poly)
626
- flipped_poly[0::2] = width - np.array(poly[0::2])
627
- return flipped_poly.tolist()
628
-
629
- def _flip_rle(rle, height, width):
630
- if 'counts' in rle and type(rle['counts']) == list:
631
- rle = mask_util.frPyObjects(rle, height, width)
632
- mask = mask_util.decode(rle)
633
- mask = mask[:, ::-1]
634
- rle = mask_util.encode(np.array(mask, order='F', dtype=np.uint8))
635
- return rle
636
-
637
- flipped_segms = []
638
- for segm in segms:
639
- if is_poly(segm):
640
- # Polygon format
641
- flipped_segms.append(
642
- [_flip_poly(poly, width) for poly in segm])
643
- else:
644
- # RLE format
645
- import pycocotools.mask as mask_util
646
- flipped_segms.append(_flip_rle(segm, height, width))
647
- return flipped_segms
648
-
649
- def apply_keypoint(self, gt_keypoint, width):
650
- for i in range(gt_keypoint.shape[1]):
651
- if i % 2 == 0:
652
- old_x = gt_keypoint[:, i].copy()
653
- gt_keypoint[:, i] = width - old_x
654
- return gt_keypoint
655
-
656
- def apply_image(self, image):
657
- return image[:, ::-1, :]
658
-
659
- def apply_bbox(self, bbox, width):
660
- oldx1 = bbox[:, 0].copy()
661
- oldx2 = bbox[:, 2].copy()
662
- bbox[:, 0] = width - oldx2
663
- bbox[:, 2] = width - oldx1
664
- return bbox
665
-
666
- def apply_rbox(self, bbox, width):
667
- oldx1 = bbox[:, 0].copy()
668
- oldx2 = bbox[:, 2].copy()
669
- oldx3 = bbox[:, 4].copy()
670
- oldx4 = bbox[:, 6].copy()
671
- bbox[:, 0] = width - oldx1
672
- bbox[:, 2] = width - oldx2
673
- bbox[:, 4] = width - oldx3
674
- bbox[:, 6] = width - oldx4
675
- bbox = [bbox_utils.get_best_begin_point_single(e) for e in bbox]
676
- return bbox
677
-
678
- def apply(self, sample, context=None):
679
- """Filp the image and bounding box.
680
- Operators:
681
- 1. Flip the image numpy.
682
- 2. Transform the bboxes' x coordinates.
683
- (Must judge whether the coordinates are normalized!)
684
- 3. Transform the segmentations' x coordinates.
685
- (Must judge whether the coordinates are normalized!)
686
- Output:
687
- sample: the image, bounding box and segmentation part
688
- in sample are flipped.
689
- """
690
- if np.random.uniform(0, 1) < self.prob:
691
- im = sample['image']
692
- height, width = im.shape[:2]
693
- im = self.apply_image(im)
694
- if 'gt_bbox' in sample and len(sample['gt_bbox']) > 0:
695
- sample['gt_bbox'] = self.apply_bbox(sample['gt_bbox'], width)
696
- if 'gt_poly' in sample and len(sample['gt_poly']) > 0:
697
- sample['gt_poly'] = self.apply_segm(sample['gt_poly'], height,
698
- width)
699
- if 'gt_keypoint' in sample and len(sample['gt_keypoint']) > 0:
700
- sample['gt_keypoint'] = self.apply_keypoint(
701
- sample['gt_keypoint'], width)
702
-
703
- if 'semantic' in sample and sample['semantic']:
704
- sample['semantic'] = sample['semantic'][:, ::-1]
705
-
706
- if 'gt_segm' in sample and sample['gt_segm'].any():
707
- sample['gt_segm'] = sample['gt_segm'][:, :, ::-1]
708
-
709
- if 'gt_rbox2poly' in sample and sample['gt_rbox2poly'].any():
710
- sample['gt_rbox2poly'] = self.apply_rbox(
711
- sample['gt_rbox2poly'], width)
712
-
713
- sample['flipped'] = True
714
- sample['image'] = im
715
- return sample
716
-
717
-
718
- @register_op
719
- class Resize(BaseOperator):
720
- def __init__(self, target_size, keep_ratio, interp=cv2.INTER_LINEAR):
721
- """
722
- Resize the image to the target size. If keep_ratio is True,
723
- resize the image's long side to the maximum of target_size;
724
- if keep_ratio is False, resize the image to target_size (h, w).
725
- Args:
726
- target_size (int|list): image target size
727
- keep_ratio (bool): whether to keep the aspect ratio
728
- interp (int): the interpolation method
729
- """
730
- super(Resize, self).__init__()
731
- self.keep_ratio = keep_ratio
732
- self.interp = interp
733
- if not isinstance(target_size, (Integral, Sequence)):
734
- raise TypeError(
735
- "Type of target_size is invalid. Must be Integer or List or Tuple, now is {}".
736
- format(type(target_size)))
737
- if isinstance(target_size, Integral):
738
- target_size = [target_size, target_size]
739
- self.target_size = target_size
740
-
741
- def apply_image(self, image, scale):
742
- im_scale_x, im_scale_y = scale
743
-
744
- return cv2.resize(
745
- image,
746
- None,
747
- None,
748
- fx=im_scale_x,
749
- fy=im_scale_y,
750
- interpolation=self.interp)
751
-
752
- def apply_bbox(self, bbox, scale, size):
753
- im_scale_x, im_scale_y = scale
754
- resize_w, resize_h = size
755
- bbox[:, 0::2] *= im_scale_x
756
- bbox[:, 1::2] *= im_scale_y
757
- bbox[:, 0::2] = np.clip(bbox[:, 0::2], 0, resize_w)
758
- bbox[:, 1::2] = np.clip(bbox[:, 1::2], 0, resize_h)
759
- return bbox
760
-
761
- def apply_segm(self, segms, im_size, scale):
762
- def _resize_poly(poly, im_scale_x, im_scale_y):
763
- resized_poly = np.array(poly).astype('float32')
764
- resized_poly[0::2] *= im_scale_x
765
- resized_poly[1::2] *= im_scale_y
766
- return resized_poly.tolist()
767
-
768
- def _resize_rle(rle, im_h, im_w, im_scale_x, im_scale_y):
769
- if 'counts' in rle and type(rle['counts']) == list:
770
- rle = mask_util.frPyObjects(rle, im_h, im_w)
771
-
772
- mask = mask_util.decode(rle)
773
- mask = cv2.resize(
774
- mask,
775
- None,
776
- None,
777
- fx=im_scale_x,
778
- fy=im_scale_y,
779
- interpolation=self.interp)
780
- rle = mask_util.encode(np.array(mask, order='F', dtype=np.uint8))
781
- return rle
782
-
783
- im_h, im_w = im_size
784
- im_scale_x, im_scale_y = scale
785
- resized_segms = []
786
- for segm in segms:
787
- if is_poly(segm):
788
- # Polygon format
789
- resized_segms.append([
790
- _resize_poly(poly, im_scale_x, im_scale_y) for poly in segm
791
- ])
792
- else:
793
- # RLE format
794
- import pycocotools.mask as mask_util
795
- resized_segms.append(
796
- _resize_rle(segm, im_h, im_w, im_scale_x, im_scale_y))
797
-
798
- return resized_segms
799
-
800
- def apply(self, sample, context=None):
801
- """ Resize the image numpy.
802
- """
803
- im = sample['image']
804
- if not isinstance(im, np.ndarray):
805
- raise TypeError("{}: image type is not numpy.".format(self))
806
- if len(im.shape) != 3:
807
- raise ImageError('{}: image is not 3-dimensional.'.format(self))
808
-
809
- # apply image
810
- im_shape = im.shape
811
- if self.keep_ratio:
812
-
813
- im_size_min = np.min(im_shape[0:2])
814
- im_size_max = np.max(im_shape[0:2])
815
-
816
- target_size_min = np.min(self.target_size)
817
- target_size_max = np.max(self.target_size)
818
-
819
- im_scale = min(target_size_min / im_size_min,
820
- target_size_max / im_size_max)
821
-
822
- resize_h = im_scale * float(im_shape[0])
823
- resize_w = im_scale * float(im_shape[1])
824
-
825
- im_scale_x = im_scale
826
- im_scale_y = im_scale
827
- else:
828
- resize_h, resize_w = self.target_size
829
- im_scale_y = resize_h / im_shape[0]
830
- im_scale_x = resize_w / im_shape[1]
831
-
832
- im = self.apply_image(sample['image'], [im_scale_x, im_scale_y])
833
- sample['image'] = im
834
- sample['im_shape'] = np.asarray([resize_h, resize_w], dtype=np.float32)
835
- if 'scale_factor' in sample:
836
- scale_factor = sample['scale_factor']
837
- sample['scale_factor'] = np.asarray(
838
- [scale_factor[0] * im_scale_y, scale_factor[1] * im_scale_x],
839
- dtype=np.float32)
840
- else:
841
- sample['scale_factor'] = np.asarray(
842
- [im_scale_y, im_scale_x], dtype=np.float32)
843
-
844
- # apply bbox
845
- if 'gt_bbox' in sample and len(sample['gt_bbox']) > 0:
846
- sample['gt_bbox'] = self.apply_bbox(sample['gt_bbox'],
847
- [im_scale_x, im_scale_y],
848
- [resize_w, resize_h])
849
-
850
- # apply rbox
851
- if 'gt_rbox2poly' in sample:
852
- if np.array(sample['gt_rbox2poly']).shape[1] != 8:
853
- logger.warning(
854
- "gt_rbox2poly's length shoule be 8, but actually is {}".
855
- format(len(sample['gt_rbox2poly'])))
856
- sample['gt_rbox2poly'] = self.apply_bbox(sample['gt_rbox2poly'],
857
- [im_scale_x, im_scale_y],
858
- [resize_w, resize_h])
859
-
860
- # apply polygon
861
- if 'gt_poly' in sample and len(sample['gt_poly']) > 0:
862
- sample['gt_poly'] = self.apply_segm(
863
- sample['gt_poly'], im_shape[:2], [im_scale_x, im_scale_y])
864
-
865
- # apply semantic
866
- if 'semantic' in sample and sample['semantic']:
867
- semantic = sample['semantic']
868
- semantic = cv2.resize(
869
- semantic.astype('float32'),
870
- None,
871
- None,
872
- fx=im_scale_x,
873
- fy=im_scale_y,
874
- interpolation=self.interp)
875
- semantic = np.asarray(semantic).astype('int32')
876
- semantic = np.expand_dims(semantic, 0)
877
- sample['semantic'] = semantic
878
-
879
- # apply gt_segm
880
- if 'gt_segm' in sample and len(sample['gt_segm']) > 0:
881
- masks = [
882
- cv2.resize(
883
- gt_segm,
884
- None,
885
- None,
886
- fx=im_scale_x,
887
- fy=im_scale_y,
888
- interpolation=cv2.INTER_NEAREST)
889
- for gt_segm in sample['gt_segm']
890
- ]
891
- sample['gt_segm'] = np.asarray(masks).astype(np.uint8)
892
-
893
- return sample
894
-
895
-
896
- @register_op
897
- class MultiscaleTestResize(BaseOperator):
898
- def __init__(self,
899
- origin_target_size=[800, 1333],
900
- target_size=[],
901
- interp=cv2.INTER_LINEAR,
902
- use_flip=True):
903
- """
904
- Rescale the image to each size in target_size, capped at the maximum size.
905
- Args:
906
- origin_target_size (list): origin target size of image
907
- target_size (list): A list of target sizes of image.
908
- interp (int): the interpolation method.
909
- use_flip (bool): whether use flip augmentation.
910
- """
911
- super(MultiscaleTestResize, self).__init__()
912
- self.interp = interp
913
- self.use_flip = use_flip
914
-
915
- if not isinstance(target_size, Sequence):
916
- raise TypeError(
917
- "Type of target_size is invalid. Must be List or Tuple, now is {}".
918
- format(type(target_size)))
919
- self.target_size = target_size
920
-
921
- if not isinstance(origin_target_size, Sequence):
922
- raise TypeError(
923
- "Type of origin_target_size is invalid. Must be List or Tuple, now is {}".
924
- format(type(origin_target_size)))
925
-
926
- self.origin_target_size = origin_target_size
927
-
928
- def apply(self, sample, context=None):
929
- """ Resize the image numpy for multi-scale test.
930
- """
931
- samples = []
932
- resizer = Resize(
933
- self.origin_target_size, keep_ratio=True, interp=self.interp)
934
- samples.append(resizer(sample.copy(), context))
935
- if self.use_flip:
936
- flipper = RandomFlip(1.1)
937
- samples.append(flipper(sample.copy(), context=context))
938
-
939
- for size in self.target_size:
940
- resizer = Resize(size, keep_ratio=True, interp=self.interp)
941
- samples.append(resizer(sample.copy(), context))
942
-
943
- return samples
944
-
945
-
946
- @register_op
947
- class RandomResize(BaseOperator):
948
- def __init__(self,
949
- target_size,
950
- keep_ratio=True,
951
- interp=cv2.INTER_LINEAR,
952
- random_size=True,
953
- random_interp=False):
954
- """
955
- Resize image to target size randomly. random target_size and interpolation method
956
- Args:
957
- target_size (int, list, tuple): image target size; if random_size is True, it must be a list or tuple
958
- keep_ratio (bool): whether to keep the aspect ratio, default True
959
- interp (int): the interpolation method
960
- random_size (bool): whether random select target size of image
961
- random_interp (bool): whether random select interpolation method
962
- """
963
- super(RandomResize, self).__init__()
964
- self.keep_ratio = keep_ratio
965
- self.interp = interp
966
- self.interps = [
967
- cv2.INTER_NEAREST,
968
- cv2.INTER_LINEAR,
969
- cv2.INTER_AREA,
970
- cv2.INTER_CUBIC,
971
- cv2.INTER_LANCZOS4,
972
- ]
973
- assert isinstance(target_size, (
974
- Integral, Sequence)), "target_size must be Integer, List or Tuple"
975
- if random_size and not isinstance(target_size, Sequence):
976
- raise TypeError(
977
- "Type of target_size is invalid when random_size is True. Must be List or Tuple, now is {}".
978
- format(type(target_size)))
979
- self.target_size = target_size
980
- self.random_size = random_size
981
- self.random_interp = random_interp
982
-
983
- def apply(self, sample, context=None):
984
- """ Resize the image numpy.
985
- """
986
- if self.random_size:
987
- target_size = random.choice(self.target_size)
988
- else:
989
- target_size = self.target_size
990
-
991
- if self.random_interp:
992
- interp = random.choice(self.interps)
993
- else:
994
- interp = self.interp
995
-
996
- resizer = Resize(target_size, self.keep_ratio, interp)
997
- return resizer(sample, context=context)
998
-
999
-
1000
- @register_op
1001
- class RandomExpand(BaseOperator):
1002
- """Random expand the canvas.
1003
- Args:
1004
- ratio (float): maximum expansion ratio.
1005
- prob (float): probability to expand.
1006
- fill_value (list): color value used to fill the canvas. in RGB order.
1007
- """
1008
-
1009
- def __init__(self, ratio=4., prob=0.5, fill_value=(127.5, 127.5, 127.5)):
1010
- super(RandomExpand, self).__init__()
1011
- assert ratio > 1.01, "expand ratio must be larger than 1.01"
1012
- self.ratio = ratio
1013
- self.prob = prob
1014
- assert isinstance(fill_value, (Number, Sequence)), \
1015
- "fill value must be either float or sequence"
1016
- if isinstance(fill_value, Number):
1017
- fill_value = (fill_value, ) * 3
1018
- if not isinstance(fill_value, tuple):
1019
- fill_value = tuple(fill_value)
1020
- self.fill_value = fill_value
1021
-
1022
- def apply(self, sample, context=None):
1023
- if np.random.uniform(0., 1.) < self.prob:
1024
- return sample
1025
-
1026
- im = sample['image']
1027
- height, width = im.shape[:2]
1028
- ratio = np.random.uniform(1., self.ratio)
1029
- h = int(height * ratio)
1030
- w = int(width * ratio)
1031
- if not h > height or not w > width:
1032
- return sample
1033
- y = np.random.randint(0, h - height)
1034
- x = np.random.randint(0, w - width)
1035
- offsets, size = [x, y], [h, w]
1036
-
1037
- pad = Pad(size,
1038
- pad_mode=-1,
1039
- offsets=offsets,
1040
- fill_value=self.fill_value)
1041
-
1042
- return pad(sample, context=context)
1043
-
1044
-
1045
- @register_op
1046
- class CropWithSampling(BaseOperator):
1047
- def __init__(self, batch_sampler, satisfy_all=False, avoid_no_bbox=True):
1048
- """
1049
- Args:
1050
- batch_sampler (list): Multiple sets of different
1051
- parameters for cropping.
1052
- satisfy_all (bool): whether all boxes must satisfy.
1053
- e.g.[[1, 1, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0],
1054
- [1, 50, 0.3, 1.0, 0.5, 2.0, 0.1, 1.0],
1055
- [1, 50, 0.3, 1.0, 0.5, 2.0, 0.3, 1.0],
1056
- [1, 50, 0.3, 1.0, 0.5, 2.0, 0.5, 1.0],
1057
- [1, 50, 0.3, 1.0, 0.5, 2.0, 0.7, 1.0],
1058
- [1, 50, 0.3, 1.0, 0.5, 2.0, 0.9, 1.0],
1059
- [1, 50, 0.3, 1.0, 0.5, 2.0, 0.0, 1.0]]
1060
- [max sample, max trial, min scale, max scale,
1061
- min aspect ratio, max aspect ratio,
1062
- min overlap, max overlap]
1063
- avoid_no_bbox (bool): whether to avoid the
1064
- situation where the box does not appear.
1065
- """
1066
- super(CropWithSampling, self).__init__()
1067
- self.batch_sampler = batch_sampler
1068
- self.satisfy_all = satisfy_all
1069
- self.avoid_no_bbox = avoid_no_bbox
1070
-
1071
- def apply(self, sample, context):
1072
- """
1073
- Crop the image and modify bounding box.
1074
- Operators:
1075
- 1. Scale the image width and height.
1076
- 2. Crop the image according to a random sample.
1077
- 3. Rescale the bounding box.
1078
- 4. Determine if the new bbox is satisfied in the new image.
1079
- Returns:
1080
- sample: the image, bounding box are replaced.
1081
- """
1082
- assert 'image' in sample, "image data not found"
1083
- im = sample['image']
1084
- gt_bbox = sample['gt_bbox']
1085
- gt_class = sample['gt_class']
1086
- im_height, im_width = im.shape[:2]
1087
- gt_score = None
1088
- if 'gt_score' in sample:
1089
- gt_score = sample['gt_score']
1090
- sampled_bbox = []
1091
- gt_bbox = gt_bbox.tolist()
1092
- for sampler in self.batch_sampler:
1093
- found = 0
1094
- for i in range(sampler[1]):
1095
- if found >= sampler[0]:
1096
- break
1097
- sample_bbox = generate_sample_bbox(sampler)
1098
- if satisfy_sample_constraint(sampler, sample_bbox, gt_bbox,
1099
- self.satisfy_all):
1100
- sampled_bbox.append(sample_bbox)
1101
- found = found + 1
1102
- im = np.array(im)
1103
- while sampled_bbox:
1104
- idx = int(np.random.uniform(0, len(sampled_bbox)))
1105
- sample_bbox = sampled_bbox.pop(idx)
1106
- sample_bbox = clip_bbox(sample_bbox)
1107
- crop_bbox, crop_class, crop_score = \
1108
- filter_and_process(sample_bbox, gt_bbox, gt_class, scores=gt_score)
1109
- if self.avoid_no_bbox:
1110
- if len(crop_bbox) < 1:
1111
- continue
1112
- xmin = int(sample_bbox[0] * im_width)
1113
- xmax = int(sample_bbox[2] * im_width)
1114
- ymin = int(sample_bbox[1] * im_height)
1115
- ymax = int(sample_bbox[3] * im_height)
1116
- im = im[ymin:ymax, xmin:xmax]
1117
- sample['image'] = im
1118
- sample['gt_bbox'] = crop_bbox
1119
- sample['gt_class'] = crop_class
1120
- sample['gt_score'] = crop_score
1121
- return sample
1122
- return sample
1123
-
1124
-
1125
- @register_op
1126
- class CropWithDataAchorSampling(BaseOperator):
1127
- def __init__(self,
1128
- batch_sampler,
1129
- anchor_sampler=None,
1130
- target_size=None,
1131
- das_anchor_scales=[16, 32, 64, 128],
1132
- sampling_prob=0.5,
1133
- min_size=8.,
1134
- avoid_no_bbox=True):
1135
- """
1136
- Args:
1137
- anchor_sampler (list): anchor_sampling sets of different
1138
- parameters for cropping.
1139
- batch_sampler (list): Multiple sets of different
1140
- parameters for cropping.
1141
- e.g.[[1, 10, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.2, 0.0]]
1142
- [[1, 50, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0],
1143
- [1, 50, 0.3, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0],
1144
- [1, 50, 0.3, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0],
1145
- [1, 50, 0.3, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0],
1146
- [1, 50, 0.3, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0]]
1147
- [max sample, max trial, min scale, max scale,
1148
- min aspect ratio, max aspect ratio,
1149
- min overlap, max overlap, min coverage, max coverage]
1150
- target_size (int): target image size.
1151
- das_anchor_scales (list[float]): a list of anchor scales in data
1152
- anchor sampling.
1153
- min_size (float): minimum size of sampled bbox.
1154
- avoid_no_bbox (bool): whether to avoid the
1155
- situation where the box does not appear.
1156
- """
1157
- super(CropWithDataAchorSampling, self).__init__()
1158
- self.anchor_sampler = anchor_sampler
1159
- self.batch_sampler = batch_sampler
1160
- self.target_size = target_size
1161
- self.sampling_prob = sampling_prob
1162
- self.min_size = min_size
1163
- self.avoid_no_bbox = avoid_no_bbox
1164
- self.das_anchor_scales = np.array(das_anchor_scales)
1165
-
1166
- def apply(self, sample, context):
1167
- """
1168
- Crop the image and modify bounding box.
1169
- Operators:
1170
- 1. Scale the image width and height.
1171
- 2. Crop the image according to a random sample.
1172
- 3. Rescale the bounding box.
1173
- 4. Determine if the new bbox is satisfied in the new image.
1174
- Returns:
1175
- sample: the image, bounding box are replaced.
1176
- """
1177
- assert 'image' in sample, "image data not found"
1178
- im = sample['image']
1179
- gt_bbox = sample['gt_bbox']
1180
- gt_class = sample['gt_class']
1181
- image_height, image_width = im.shape[:2]
1182
- gt_bbox[:, 0] /= image_width
1183
- gt_bbox[:, 1] /= image_height
1184
- gt_bbox[:, 2] /= image_width
1185
- gt_bbox[:, 3] /= image_height
1186
- gt_score = None
1187
- if 'gt_score' in sample:
1188
- gt_score = sample['gt_score']
1189
- sampled_bbox = []
1190
- gt_bbox = gt_bbox.tolist()
1191
-
1192
- prob = np.random.uniform(0., 1.)
1193
- if prob > self.sampling_prob: # anchor sampling
1194
- assert self.anchor_sampler
1195
- for sampler in self.anchor_sampler:
1196
- found = 0
1197
- for i in range(sampler[1]):
1198
- if found >= sampler[0]:
1199
- break
1200
- sample_bbox = data_anchor_sampling(
1201
- gt_bbox, image_width, image_height,
1202
- self.das_anchor_scales, self.target_size)
1203
- if sample_bbox == 0:
1204
- break
1205
- if satisfy_sample_constraint_coverage(sampler, sample_bbox,
1206
- gt_bbox):
1207
- sampled_bbox.append(sample_bbox)
1208
- found = found + 1
1209
- im = np.array(im)
1210
- while sampled_bbox:
1211
- idx = int(np.random.uniform(0, len(sampled_bbox)))
1212
- sample_bbox = sampled_bbox.pop(idx)
1213
-
1214
- if 'gt_keypoint' in sample.keys():
1215
- keypoints = (sample['gt_keypoint'],
1216
- sample['keypoint_ignore'])
1217
- crop_bbox, crop_class, crop_score, gt_keypoints = \
1218
- filter_and_process(sample_bbox, gt_bbox, gt_class,
1219
- scores=gt_score,
1220
- keypoints=keypoints)
1221
- else:
1222
- crop_bbox, crop_class, crop_score = filter_and_process(
1223
- sample_bbox, gt_bbox, gt_class, scores=gt_score)
1224
- crop_bbox, crop_class, crop_score = bbox_area_sampling(
1225
- crop_bbox, crop_class, crop_score, self.target_size,
1226
- self.min_size)
1227
-
1228
- if self.avoid_no_bbox:
1229
- if len(crop_bbox) < 1:
1230
- continue
1231
- im = crop_image_sampling(im, sample_bbox, image_width,
1232
- image_height, self.target_size)
1233
- height, width = im.shape[:2]
1234
- crop_bbox[:, 0] *= width
1235
- crop_bbox[:, 1] *= height
1236
- crop_bbox[:, 2] *= width
1237
- crop_bbox[:, 3] *= height
1238
- sample['image'] = im
1239
- sample['gt_bbox'] = crop_bbox
1240
- sample['gt_class'] = crop_class
1241
- if 'gt_score' in sample:
1242
- sample['gt_score'] = crop_score
1243
- if 'gt_keypoint' in sample.keys():
1244
- sample['gt_keypoint'] = gt_keypoints[0]
1245
- sample['keypoint_ignore'] = gt_keypoints[1]
1246
- return sample
1247
- return sample
1248
-
1249
- else:
1250
- for sampler in self.batch_sampler:
1251
- found = 0
1252
- for i in range(sampler[1]):
1253
- if found >= sampler[0]:
1254
- break
1255
- sample_bbox = generate_sample_bbox_square(
1256
- sampler, image_width, image_height)
1257
- if satisfy_sample_constraint_coverage(sampler, sample_bbox,
1258
- gt_bbox):
1259
- sampled_bbox.append(sample_bbox)
1260
- found = found + 1
1261
- im = np.array(im)
1262
- while sampled_bbox:
1263
- idx = int(np.random.uniform(0, len(sampled_bbox)))
1264
- sample_bbox = sampled_bbox.pop(idx)
1265
- sample_bbox = clip_bbox(sample_bbox)
1266
-
1267
- if 'gt_keypoint' in sample.keys():
1268
- keypoints = (sample['gt_keypoint'],
1269
- sample['keypoint_ignore'])
1270
- crop_bbox, crop_class, crop_score, gt_keypoints = \
1271
- filter_and_process(sample_bbox, gt_bbox, gt_class,
1272
- scores=gt_score,
1273
- keypoints=keypoints)
1274
- else:
1275
- crop_bbox, crop_class, crop_score = filter_and_process(
1276
- sample_bbox, gt_bbox, gt_class, scores=gt_score)
1277
- # sampling bbox according the bbox area
1278
- crop_bbox, crop_class, crop_score = bbox_area_sampling(
1279
- crop_bbox, crop_class, crop_score, self.target_size,
1280
- self.min_size)
1281
-
1282
- if self.avoid_no_bbox:
1283
- if len(crop_bbox) < 1:
1284
- continue
1285
- xmin = int(sample_bbox[0] * image_width)
1286
- xmax = int(sample_bbox[2] * image_width)
1287
- ymin = int(sample_bbox[1] * image_height)
1288
- ymax = int(sample_bbox[3] * image_height)
1289
- im = im[ymin:ymax, xmin:xmax]
1290
- height, width = im.shape[:2]
1291
- crop_bbox[:, 0] *= width
1292
- crop_bbox[:, 1] *= height
1293
- crop_bbox[:, 2] *= width
1294
- crop_bbox[:, 3] *= height
1295
- sample['image'] = im
1296
- sample['gt_bbox'] = crop_bbox
1297
- sample['gt_class'] = crop_class
1298
- if 'gt_score' in sample:
1299
- sample['gt_score'] = crop_score
1300
- if 'gt_keypoint' in sample.keys():
1301
- sample['gt_keypoint'] = gt_keypoints[0]
1302
- sample['keypoint_ignore'] = gt_keypoints[1]
1303
- return sample
1304
- return sample
1305
-
1306
-
1307
- @register_op
1308
- class RandomCrop(BaseOperator):
1309
- """Random crop image and bboxes.
1310
- Args:
1311
- aspect_ratio (list): aspect ratio of cropped region.
1312
- in [min, max] format.
1313
- thresholds (list): iou thresholds for decide a valid bbox crop.
1314
- scaling (list): ratio between a cropped region and the original image.
1315
- in [min, max] format.
1316
- num_attempts (int): number of tries before giving up.
1317
- allow_no_crop (bool): allow return without actually cropping them.
1318
- cover_all_box (bool): ensure all bboxes are covered in the final crop.
1319
- is_mask_crop(bool): whether crop the segmentation.
1320
- """
1321
-
1322
- def __init__(self,
1323
- aspect_ratio=[.5, 2.],
1324
- thresholds=[.0, .1, .3, .5, .7, .9],
1325
- scaling=[.3, 1.],
1326
- num_attempts=50,
1327
- allow_no_crop=True,
1328
- cover_all_box=False,
1329
- is_mask_crop=False):
1330
- super(RandomCrop, self).__init__()
1331
- self.aspect_ratio = aspect_ratio
1332
- self.thresholds = thresholds
1333
- self.scaling = scaling
1334
- self.num_attempts = num_attempts
1335
- self.allow_no_crop = allow_no_crop
1336
- self.cover_all_box = cover_all_box
1337
- self.is_mask_crop = is_mask_crop
1338
-
1339
- def crop_segms(self, segms, valid_ids, crop, height, width):
1340
- def _crop_poly(segm, crop):
1341
- xmin, ymin, xmax, ymax = crop
1342
- crop_coord = [xmin, ymin, xmin, ymax, xmax, ymax, xmax, ymin]
1343
- crop_p = np.array(crop_coord).reshape(4, 2)
1344
- crop_p = Polygon(crop_p)
1345
-
1346
- crop_segm = list()
1347
- for poly in segm:
1348
- poly = np.array(poly).reshape(len(poly) // 2, 2)
1349
- polygon = Polygon(poly)
1350
- if not polygon.is_valid:
1351
- exterior = polygon.exterior
1352
- multi_lines = exterior.intersection(exterior)
1353
- polygons = shapely.ops.polygonize(multi_lines)
1354
- polygon = MultiPolygon(polygons)
1355
- multi_polygon = list()
1356
- if isinstance(polygon, MultiPolygon):
1357
- multi_polygon = copy.deepcopy(polygon)
1358
- else:
1359
- multi_polygon.append(copy.deepcopy(polygon))
1360
- for per_polygon in multi_polygon:
1361
- inter = per_polygon.intersection(crop_p)
1362
- if not inter:
1363
- continue
1364
- if isinstance(inter, (MultiPolygon, GeometryCollection)):
1365
- for part in inter:
1366
- if not isinstance(part, Polygon):
1367
- continue
1368
- part = np.squeeze(
1369
- np.array(part.exterior.coords[:-1]).reshape(
1370
- 1, -1))
1371
- part[0::2] -= xmin
1372
- part[1::2] -= ymin
1373
- crop_segm.append(part.tolist())
1374
- elif isinstance(inter, Polygon):
1375
- crop_poly = np.squeeze(
1376
- np.array(inter.exterior.coords[:-1]).reshape(1,
1377
- -1))
1378
- crop_poly[0::2] -= xmin
1379
- crop_poly[1::2] -= ymin
1380
- crop_segm.append(crop_poly.tolist())
1381
- else:
1382
- continue
1383
- return crop_segm
1384
-
1385
- def _crop_rle(rle, crop, height, width):
1386
- if 'counts' in rle and type(rle['counts']) == list:
1387
- rle = mask_util.frPyObjects(rle, height, width)
1388
- mask = mask_util.decode(rle)
1389
- mask = mask[crop[1]:crop[3], crop[0]:crop[2]]
1390
- rle = mask_util.encode(np.array(mask, order='F', dtype=np.uint8))
1391
- return rle
1392
-
1393
- crop_segms = []
1394
- for id in valid_ids:
1395
- segm = segms[id]
1396
- if is_poly(segm):
1397
- import copy
1398
- import shapely.ops
1399
- from shapely.geometry import Polygon, MultiPolygon, GeometryCollection
1400
- logging.getLogger("shapely").setLevel(logging.WARNING)
1401
- # Polygon format
1402
- crop_segms.append(_crop_poly(segm, crop))
1403
- else:
1404
- # RLE format
1405
- import pycocotools.mask as mask_util
1406
- crop_segms.append(_crop_rle(segm, crop, height, width))
1407
- return crop_segms
1408
-
1409
- def apply(self, sample, context=None):
1410
- if 'gt_bbox' in sample and len(sample['gt_bbox']) == 0:
1411
- return sample
1412
-
1413
- h, w = sample['image'].shape[:2]
1414
- gt_bbox = sample['gt_bbox']
1415
-
1416
- # NOTE Original method attempts to generate one candidate for each
1417
- # threshold then randomly sample one from the resulting list.
1418
- # Here a short circuit approach is taken, i.e., randomly choose a
1419
- # threshold and attempt to find a valid crop, and simply return the
1420
- # first one found.
1421
- # The probability is not exactly the same, kinda resembling the
1422
- # "Monty Hall" problem. Actually carrying out the attempts will affect
1423
- # observability (just like opening doors in the "Monty Hall" game).
1424
- thresholds = list(self.thresholds)
1425
- if self.allow_no_crop:
1426
- thresholds.append('no_crop')
1427
- np.random.shuffle(thresholds)
1428
-
1429
- for thresh in thresholds:
1430
- if thresh == 'no_crop':
1431
- return sample
1432
-
1433
- found = False
1434
- for i in range(self.num_attempts):
1435
- scale = np.random.uniform(*self.scaling)
1436
- if self.aspect_ratio is not None:
1437
- min_ar, max_ar = self.aspect_ratio
1438
- aspect_ratio = np.random.uniform(
1439
- max(min_ar, scale**2), min(max_ar, scale**-2))
1440
- h_scale = scale / np.sqrt(aspect_ratio)
1441
- w_scale = scale * np.sqrt(aspect_ratio)
1442
- else:
1443
- h_scale = np.random.uniform(*self.scaling)
1444
- w_scale = np.random.uniform(*self.scaling)
1445
- crop_h = h * h_scale
1446
- crop_w = w * w_scale
1447
- if self.aspect_ratio is None:
1448
- if crop_h / crop_w < 0.5 or crop_h / crop_w > 2.0:
1449
- continue
1450
-
1451
- crop_h = int(crop_h)
1452
- crop_w = int(crop_w)
1453
- crop_y = np.random.randint(0, h - crop_h)
1454
- crop_x = np.random.randint(0, w - crop_w)
1455
- crop_box = [crop_x, crop_y, crop_x + crop_w, crop_y + crop_h]
1456
- iou = self._iou_matrix(
1457
- gt_bbox, np.array(
1458
- [crop_box], dtype=np.float32))
1459
- if iou.max() < thresh:
1460
- continue
1461
-
1462
- if self.cover_all_box and iou.min() < thresh:
1463
- continue
1464
-
1465
- cropped_box, valid_ids = self._crop_box_with_center_constraint(
1466
- gt_bbox, np.array(
1467
- crop_box, dtype=np.float32))
1468
- if valid_ids.size > 0:
1469
- found = True
1470
- break
1471
-
1472
- if found:
1473
- if self.is_mask_crop and 'gt_poly' in sample and len(sample[
1474
- 'gt_poly']) > 0:
1475
- crop_polys = self.crop_segms(
1476
- sample['gt_poly'],
1477
- valid_ids,
1478
- np.array(
1479
- crop_box, dtype=np.int64),
1480
- h,
1481
- w)
1482
- if [] in crop_polys:
1483
- delete_id = list()
1484
- valid_polys = list()
1485
- for id, crop_poly in enumerate(crop_polys):
1486
- if crop_poly == []:
1487
- delete_id.append(id)
1488
- else:
1489
- valid_polys.append(crop_poly)
1490
- valid_ids = np.delete(valid_ids, delete_id)
1491
- if len(valid_polys) == 0:
1492
- return sample
1493
- sample['gt_poly'] = valid_polys
1494
- else:
1495
- sample['gt_poly'] = crop_polys
1496
-
1497
- if 'gt_segm' in sample:
1498
- sample['gt_segm'] = self._crop_segm(sample['gt_segm'],
1499
- crop_box)
1500
- sample['gt_segm'] = np.take(
1501
- sample['gt_segm'], valid_ids, axis=0)
1502
-
1503
- sample['image'] = self._crop_image(sample['image'], crop_box)
1504
- sample['gt_bbox'] = np.take(cropped_box, valid_ids, axis=0)
1505
- sample['gt_class'] = np.take(
1506
- sample['gt_class'], valid_ids, axis=0)
1507
- if 'gt_score' in sample:
1508
- sample['gt_score'] = np.take(
1509
- sample['gt_score'], valid_ids, axis=0)
1510
-
1511
- if 'is_crowd' in sample:
1512
- sample['is_crowd'] = np.take(
1513
- sample['is_crowd'], valid_ids, axis=0)
1514
- return sample
1515
-
1516
- return sample
1517
-
1518
- def _iou_matrix(self, a, b):
1519
- tl_i = np.maximum(a[:, np.newaxis, :2], b[:, :2])
1520
- br_i = np.minimum(a[:, np.newaxis, 2:], b[:, 2:])
1521
-
1522
- area_i = np.prod(br_i - tl_i, axis=2) * (tl_i < br_i).all(axis=2)
1523
- area_a = np.prod(a[:, 2:] - a[:, :2], axis=1)
1524
- area_b = np.prod(b[:, 2:] - b[:, :2], axis=1)
1525
- area_o = (area_a[:, np.newaxis] + area_b - area_i)
1526
- return area_i / (area_o + 1e-10)
1527
-
1528
- def _crop_box_with_center_constraint(self, box, crop):
1529
- cropped_box = box.copy()
1530
-
1531
- cropped_box[:, :2] = np.maximum(box[:, :2], crop[:2])
1532
- cropped_box[:, 2:] = np.minimum(box[:, 2:], crop[2:])
1533
- cropped_box[:, :2] -= crop[:2]
1534
- cropped_box[:, 2:] -= crop[:2]
1535
-
1536
- centers = (box[:, :2] + box[:, 2:]) / 2
1537
- valid = np.logical_and(crop[:2] <= centers,
1538
- centers < crop[2:]).all(axis=1)
1539
- valid = np.logical_and(
1540
- valid, (cropped_box[:, :2] < cropped_box[:, 2:]).all(axis=1))
1541
-
1542
- return cropped_box, np.where(valid)[0]
1543
-
1544
- def _crop_image(self, img, crop):
1545
- x1, y1, x2, y2 = crop
1546
- return img[y1:y2, x1:x2, :]
1547
-
1548
- def _crop_segm(self, segm, crop):
1549
- x1, y1, x2, y2 = crop
1550
- return segm[:, y1:y2, x1:x2]
1551
-
1552
-
1553
- @register_op
1554
- class RandomScaledCrop(BaseOperator):
1555
- """Resize image and bbox based on long side (with optional random scaling),
1556
- then crop or pad image to target size.
1557
- Args:
1558
- target_dim (int): target size.
1559
- scale_range (list): random scale range.
1560
- interp (int): interpolation method, default to `cv2.INTER_LINEAR`.
1561
- """
1562
-
1563
- def __init__(self,
1564
- target_dim=512,
1565
- scale_range=[.1, 2.],
1566
- interp=cv2.INTER_LINEAR):
1567
- super(RandomScaledCrop, self).__init__()
1568
- self.target_dim = target_dim
1569
- self.scale_range = scale_range
1570
- self.interp = interp
1571
-
1572
- def apply(self, sample, context=None):
1573
- img = sample['image']
1574
- h, w = img.shape[:2]
1575
- random_scale = np.random.uniform(*self.scale_range)
1576
- dim = self.target_dim
1577
- random_dim = int(dim * random_scale)
1578
- dim_max = max(h, w)
1579
- scale = random_dim / dim_max
1580
- resize_w = int(round(w * scale))
1581
- resize_h = int(round(h * scale))
1582
- offset_x = int(max(0, np.random.uniform(0., resize_w - dim)))
1583
- offset_y = int(max(0, np.random.uniform(0., resize_h - dim)))
1584
-
1585
- img = cv2.resize(img, (resize_w, resize_h), interpolation=self.interp)
1586
- img = np.array(img)
1587
- canvas = np.zeros((dim, dim, 3), dtype=img.dtype)
1588
- canvas[:min(dim, resize_h), :min(dim, resize_w), :] = img[
1589
- offset_y:offset_y + dim, offset_x:offset_x + dim, :]
1590
- sample['image'] = canvas
1591
- sample['im_shape'] = np.asarray([resize_h, resize_w], dtype=np.float32)
1592
- scale_factor = sample['scale_factor']
1593
- sample['scale_factor'] = np.asarray(
1594
- [scale_factor[0] * scale, scale_factor[1] * scale],
1595
- dtype=np.float32)
1596
-
1597
- if 'gt_bbox' in sample and len(sample['gt_bbox']) > 0:
1598
- scale_array = np.array([scale, scale] * 2, dtype=np.float32)
1599
- shift_array = np.array([offset_x, offset_y] * 2, dtype=np.float32)
1600
- boxes = sample['gt_bbox'] * scale_array - shift_array
1601
- boxes = np.clip(boxes, 0, dim - 1)
1602
- # filter boxes with no area
1603
- area = np.prod(boxes[..., 2:] - boxes[..., :2], axis=1)
1604
- valid = (area > 1.).nonzero()[0]
1605
- sample['gt_bbox'] = boxes[valid]
1606
- sample['gt_class'] = sample['gt_class'][valid]
1607
-
1608
- return sample
1609
-
1610
-
1611
- @register_op
1612
- class Cutmix(BaseOperator):
1613
- def __init__(self, alpha=1.5, beta=1.5):
1614
- """
1615
- CutMix: Regularization Strategy to Train Strong Classifiers with Localizable Features, see https://arxiv.org/abs/1905.04899
1616
- Cutmix image and gt_bbox/gt_score
1617
- Args:
1618
- alpha (float): alpha parameter of the beta distribution
1619
- beta (float): beta parameter of the beta distribution
1620
- """
1621
- super(Cutmix, self).__init__()
1622
- self.alpha = alpha
1623
- self.beta = beta
1624
- if self.alpha <= 0.0:
1625
- raise ValueError("alpha shold be positive in {}".format(self))
1626
- if self.beta <= 0.0:
1627
- raise ValueError("beta shold be positive in {}".format(self))
1628
-
1629
- def apply_image(self, img1, img2, factor):
1630
-        """Paste a random box-shaped region of img2 onto img1; the box covers about (1 - factor) of the area."""
1631
- h = max(img1.shape[0], img2.shape[0])
1632
- w = max(img1.shape[1], img2.shape[1])
1633
- cut_rat = np.sqrt(1. - factor)
1634
-
1635
- cut_w = np.int32(w * cut_rat)
1636
- cut_h = np.int32(h * cut_rat)
1637
-
1638
- # uniform
1639
- cx = np.random.randint(w)
1640
- cy = np.random.randint(h)
1641
-
1642
- bbx1 = np.clip(cx - cut_w // 2, 0, w - 1)
1643
- bby1 = np.clip(cy - cut_h // 2, 0, h - 1)
1644
- bbx2 = np.clip(cx + cut_w // 2, 0, w - 1)
1645
- bby2 = np.clip(cy + cut_h // 2, 0, h - 1)
1646
-
1647
- img_1_pad = np.zeros((h, w, img1.shape[2]), 'float32')
1648
- img_1_pad[:img1.shape[0], :img1.shape[1], :] = \
1649
- img1.astype('float32')
1650
- img_2_pad = np.zeros((h, w, img2.shape[2]), 'float32')
1651
- img_2_pad[:img2.shape[0], :img2.shape[1], :] = \
1652
- img2.astype('float32')
1653
- img_1_pad[bby1:bby2, bbx1:bbx2, :] = img_2_pad[bby1:bby2, bbx1:bbx2, :]
1654
- return img_1_pad
1655
-
1656
- def __call__(self, sample, context=None):
1657
- if not isinstance(sample, Sequence):
1658
- return sample
1659
-
1660
-        assert len(sample) == 2, 'cutmix needs two samples'
1661
-
1662
- factor = np.random.beta(self.alpha, self.beta)
1663
- factor = max(0.0, min(1.0, factor))
1664
- if factor >= 1.0:
1665
- return sample[0]
1666
- if factor <= 0.0:
1667
- return sample[1]
1668
- img1 = sample[0]['image']
1669
- img2 = sample[1]['image']
1670
- img = self.apply_image(img1, img2, factor)
1671
- gt_bbox1 = sample[0]['gt_bbox']
1672
- gt_bbox2 = sample[1]['gt_bbox']
1673
- gt_bbox = np.concatenate((gt_bbox1, gt_bbox2), axis=0)
1674
- gt_class1 = sample[0]['gt_class']
1675
- gt_class2 = sample[1]['gt_class']
1676
- gt_class = np.concatenate((gt_class1, gt_class2), axis=0)
1677
- gt_score1 = np.ones_like(sample[0]['gt_class'])
1678
- gt_score2 = np.ones_like(sample[1]['gt_class'])
1679
- gt_score = np.concatenate(
1680
- (gt_score1 * factor, gt_score2 * (1. - factor)), axis=0)
1681
- result = copy.deepcopy(sample[0])
1682
- result['image'] = img
1683
- result['gt_bbox'] = gt_bbox
1684
- result['gt_score'] = gt_score
1685
- result['gt_class'] = gt_class
1686
- if 'is_crowd' in sample[0]:
1687
- is_crowd1 = sample[0]['is_crowd']
1688
- is_crowd2 = sample[1]['is_crowd']
1689
- is_crowd = np.concatenate((is_crowd1, is_crowd2), axis=0)
1690
- result['is_crowd'] = is_crowd
1691
- if 'difficult' in sample[0]:
1692
- is_difficult1 = sample[0]['difficult']
1693
- is_difficult2 = sample[1]['difficult']
1694
- is_difficult = np.concatenate(
1695
- (is_difficult1, is_difficult2), axis=0)
1696
- result['difficult'] = is_difficult
1697
- return result
1698
-
1699
-
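The label bookkeeping in Cutmix above (concatenate boxes and classes from both samples, weight scores by the mixing factor) can be checked with a small standalone sketch; the fixed factor and box values below are assumptions for illustration, the operator draws the factor from np.random.beta.

```python
import numpy as np

# Standalone sketch of the Cutmix label bookkeeping (not the paddlex operator).
factor = 0.7                                    # roughly the fraction of image 1 that survives
gt_bbox1 = np.array([[10., 10., 50., 50.]])     # boxes from image 1
gt_bbox2 = np.array([[20., 30., 80., 90.]])     # boxes from image 2
gt_class1 = np.array([[3]])
gt_class2 = np.array([[7]])

gt_bbox = np.concatenate((gt_bbox1, gt_bbox2), axis=0)
gt_class = np.concatenate((gt_class1, gt_class2), axis=0)
gt_score = np.concatenate((np.ones_like(gt_class1) * factor,
                           np.ones_like(gt_class2) * (1. - factor)), axis=0)
print(gt_bbox.shape, gt_class.ravel(), gt_score.ravel())
# (2, 4) [3 7] [0.7 0.3]: boxes from both images are kept, weighted by factor and 1 - factor
```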
1700
- @register_op
1701
- class Mixup(BaseOperator):
1702
- def __init__(self, alpha=1.5, beta=1.5):
1703
-        """ Mixup image and gt_bbox/gt_score
1704
- Args:
1705
-            alpha (float): alpha parameter of the beta distribution
1706
-            beta (float): beta parameter of the beta distribution
1707
- """
1708
- super(Mixup, self).__init__()
1709
- self.alpha = alpha
1710
- self.beta = beta
1711
- if self.alpha <= 0.0:
1712
-            raise ValueError("alpha should be positive in {}".format(self))
1713
- if self.beta <= 0.0:
1714
-            raise ValueError("beta should be positive in {}".format(self))
1715
-
1716
- def apply_image(self, img1, img2, factor):
1717
- h = max(img1.shape[0], img2.shape[0])
1718
- w = max(img1.shape[1], img2.shape[1])
1719
- img = np.zeros((h, w, img1.shape[2]), 'float32')
1720
- img[:img1.shape[0], :img1.shape[1], :] = \
1721
- img1.astype('float32') * factor
1722
- img[:img2.shape[0], :img2.shape[1], :] += \
1723
- img2.astype('float32') * (1.0 - factor)
1724
- return img.astype('uint8')
1725
-
1726
- def __call__(self, sample, context=None):
1727
- if not isinstance(sample, Sequence):
1728
- return sample
1729
-
1730
-        assert len(sample) == 2, 'mixup needs two samples'
1731
-
1732
- factor = np.random.beta(self.alpha, self.beta)
1733
- factor = max(0.0, min(1.0, factor))
1734
- if factor >= 1.0:
1735
- return sample[0]
1736
- if factor <= 0.0:
1737
- return sample[1]
1738
- im = self.apply_image(sample[0]['image'], sample[1]['image'], factor)
1739
- result = copy.deepcopy(sample[0])
1740
- result['image'] = im
1741
- # apply bbox and score
1742
- if 'gt_bbox' in sample[0]:
1743
- gt_bbox1 = sample[0]['gt_bbox']
1744
- gt_bbox2 = sample[1]['gt_bbox']
1745
- gt_bbox = np.concatenate((gt_bbox1, gt_bbox2), axis=0)
1746
- result['gt_bbox'] = gt_bbox
1747
- if 'gt_class' in sample[0]:
1748
- gt_class1 = sample[0]['gt_class']
1749
- gt_class2 = sample[1]['gt_class']
1750
- gt_class = np.concatenate((gt_class1, gt_class2), axis=0)
1751
- result['gt_class'] = gt_class
1752
-
1753
- gt_score1 = np.ones_like(sample[0]['gt_class'])
1754
- gt_score2 = np.ones_like(sample[1]['gt_class'])
1755
- gt_score = np.concatenate(
1756
- (gt_score1 * factor, gt_score2 * (1. - factor)), axis=0)
1757
- result['gt_score'] = gt_score
1758
- if 'is_crowd' in sample[0]:
1759
- is_crowd1 = sample[0]['is_crowd']
1760
- is_crowd2 = sample[1]['is_crowd']
1761
- is_crowd = np.concatenate((is_crowd1, is_crowd2), axis=0)
1762
- result['is_crowd'] = is_crowd
1763
- if 'difficult' in sample[0]:
1764
- is_difficult1 = sample[0]['difficult']
1765
- is_difficult2 = sample[1]['difficult']
1766
- is_difficult = np.concatenate(
1767
- (is_difficult1, is_difficult2), axis=0)
1768
- result['difficult'] = is_difficult
1769
-
1770
- if 'gt_ide' in sample[0]:
1771
- gt_ide1 = sample[0]['gt_ide']
1772
- gt_ide2 = sample[1]['gt_ide']
1773
- gt_ide = np.concatenate((gt_ide1, gt_ide2), axis=0)
1774
- result['gt_ide'] = gt_ide
1775
- return result
1776
-
1777
-
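The Mixup pixel blend above is a weighted average on a zero-padded canvas large enough for both inputs. A minimal standalone sketch of that blend, with assumed toy values:

```python
import numpy as np

# Standalone sketch of the Mixup pixel blend (not the paddlex operator).
factor = 0.6
img1 = np.full((2, 2, 3), 200, dtype=np.uint8)
img2 = np.full((3, 2, 3), 100, dtype=np.uint8)   # different height on purpose

h = max(img1.shape[0], img2.shape[0])
w = max(img1.shape[1], img2.shape[1])
img = np.zeros((h, w, 3), dtype=np.float32)
img[:img1.shape[0], :img1.shape[1], :] += img1.astype(np.float32) * factor
img[:img2.shape[0], :img2.shape[1], :] += img2.astype(np.float32) * (1.0 - factor)

print(img[0, 0, 0], img[2, 0, 0])  # 160.0 (200*0.6 + 100*0.4) and 40.0 (image-2-only region)
```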
1778
- @register_op
1779
- class NormalizeBox(BaseOperator):
1780
-    """Transform the bounding box's coordinates to [0,1]."""
1781
-
1782
- def __init__(self):
1783
- super(NormalizeBox, self).__init__()
1784
-
1785
- def apply(self, sample, context):
1786
- im = sample['image']
1787
- gt_bbox = sample['gt_bbox']
1788
- height, width, _ = im.shape
1789
- for i in range(gt_bbox.shape[0]):
1790
- gt_bbox[i][0] = gt_bbox[i][0] / width
1791
- gt_bbox[i][1] = gt_bbox[i][1] / height
1792
- gt_bbox[i][2] = gt_bbox[i][2] / width
1793
- gt_bbox[i][3] = gt_bbox[i][3] / height
1794
- sample['gt_bbox'] = gt_bbox
1795
-
1796
- if 'gt_keypoint' in sample.keys():
1797
- gt_keypoint = sample['gt_keypoint']
1798
-
1799
- for i in range(gt_keypoint.shape[1]):
1800
- if i % 2:
1801
- gt_keypoint[:, i] = gt_keypoint[:, i] / height
1802
- else:
1803
- gt_keypoint[:, i] = gt_keypoint[:, i] / width
1804
- sample['gt_keypoint'] = gt_keypoint
1805
-
1806
- return sample
1807
-
1808
-
1809
- @register_op
1810
- class BboxXYXY2XYWH(BaseOperator):
1811
- """
1812
- Convert bbox XYXY format to XYWH format.
1813
- """
1814
-
1815
- def __init__(self):
1816
- super(BboxXYXY2XYWH, self).__init__()
1817
-
1818
- def apply(self, sample, context=None):
1819
- assert 'gt_bbox' in sample
1820
- bbox = sample['gt_bbox']
1821
- bbox[:, 2:4] = bbox[:, 2:4] - bbox[:, :2]
1822
- bbox[:, :2] = bbox[:, :2] + bbox[:, 2:4] / 2.
1823
- sample['gt_bbox'] = bbox
1824
- return sample
1825
-
1826
-
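Note that the two in-place steps above must run in this order: width/height first, then center, producing a center-based [cx, cy, w, h] box. A tiny standalone check of the conversion (values are illustrative):

```python
import numpy as np

# Standalone check of the XYXY -> center-based XYWH conversion (not the paddlex operator).
bbox = np.array([[10., 20., 30., 60.]])        # [x1, y1, x2, y2]
bbox[:, 2:4] = bbox[:, 2:4] - bbox[:, :2]      # -> width/height: [20., 40.]
bbox[:, :2] = bbox[:, :2] + bbox[:, 2:4] / 2.  # -> center: [20., 40.]
print(bbox)  # [[20. 40. 20. 40.]] i.e. [cx, cy, w, h]
```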
1827
- @register_op
1828
- class PadBox(BaseOperator):
1829
- def __init__(self, num_max_boxes=50):
1830
- """
1831
-        Pad zeros to bboxes if the number of bboxes is less than num_max_boxes.
1832
- Args:
1833
- num_max_boxes (int): the max number of bboxes
1834
- """
1835
- self.num_max_boxes = num_max_boxes
1836
- super(PadBox, self).__init__()
1837
-
1838
- def apply(self, sample, context=None):
1839
- assert 'gt_bbox' in sample
1840
- bbox = sample['gt_bbox']
1841
- gt_num = min(self.num_max_boxes, len(bbox))
1842
- num_max = self.num_max_boxes
1843
- # fields = context['fields'] if context else []
1844
- pad_bbox = np.zeros((num_max, 4), dtype=np.float32)
1845
- if gt_num > 0:
1846
- pad_bbox[:gt_num, :] = bbox[:gt_num, :]
1847
- sample['gt_bbox'] = pad_bbox
1848
- if 'gt_class' in sample:
1849
- pad_class = np.zeros((num_max, ), dtype=np.int32)
1850
- if gt_num > 0:
1851
- pad_class[:gt_num] = sample['gt_class'][:gt_num, 0]
1852
- sample['gt_class'] = pad_class
1853
- if 'gt_score' in sample:
1854
- pad_score = np.zeros((num_max, ), dtype=np.float32)
1855
- if gt_num > 0:
1856
- pad_score[:gt_num] = sample['gt_score'][:gt_num, 0]
1857
- sample['gt_score'] = pad_score
1858
- # in training, for example in op ExpandImage,
1859
-        # the bbox and gt_class are expanded, but the difficult is not,
1860
-        # so judge by its length
1861
- if 'difficult' in sample:
1862
- pad_diff = np.zeros((num_max, ), dtype=np.int32)
1863
- if gt_num > 0:
1864
- pad_diff[:gt_num] = sample['difficult'][:gt_num, 0]
1865
- sample['difficult'] = pad_diff
1866
- if 'is_crowd' in sample:
1867
- pad_crowd = np.zeros((num_max, ), dtype=np.int32)
1868
- if gt_num > 0:
1869
- pad_crowd[:gt_num] = sample['is_crowd'][:gt_num, 0]
1870
- sample['is_crowd'] = pad_crowd
1871
- if 'gt_ide' in sample:
1872
- pad_ide = np.zeros((num_max, ), dtype=np.int32)
1873
- if gt_num > 0:
1874
- pad_ide[:gt_num] = sample['gt_ide'][:gt_num, 0]
1875
- sample['gt_ide'] = pad_ide
1876
- return sample
1877
-
1878
-
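PadBox exists so that variable-length ground-truth arrays can be batched into fixed shapes. A standalone sketch of the padding, under assumed toy inputs:

```python
import numpy as np

# Standalone sketch of padding variable-length GT arrays to a fixed size (not the paddlex operator).
num_max_boxes = 4
gt_bbox = np.array([[1., 2., 3., 4.], [5., 6., 7., 8.]], dtype=np.float32)
gt_class = np.array([[2], [5]], dtype=np.int32)

gt_num = min(num_max_boxes, len(gt_bbox))
pad_bbox = np.zeros((num_max_boxes, 4), dtype=np.float32)
pad_bbox[:gt_num, :] = gt_bbox[:gt_num, :]
pad_class = np.zeros((num_max_boxes, ), dtype=np.int32)
pad_class[:gt_num] = gt_class[:gt_num, 0]

print(pad_bbox.shape, pad_class)  # (4, 4) [2 5 0 0] -- fixed shapes, zero padded
```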
1879
- @register_op
1880
- class DebugVisibleImage(BaseOperator):
1881
- """
1882
-    In debug mode, visualize images according to `gt_bbox`.
1883
-    (Currently only supported when the image is not cropped or flipped.)
1884
- """
1885
-
1886
- def __init__(self, output_dir='output/debug', is_normalized=False):
1887
- super(DebugVisibleImage, self).__init__()
1888
- self.is_normalized = is_normalized
1889
- self.output_dir = output_dir
1890
- if not os.path.isdir(output_dir):
1891
- os.makedirs(output_dir)
1892
- if not isinstance(self.is_normalized, bool):
1893
- raise TypeError("{}: input type is invalid.".format(self))
1894
-
1895
- def apply(self, sample, context=None):
1896
- image = Image.fromarray(sample['image'].astype(np.uint8))
1897
- out_file_name = '{:012d}.jpg'.format(sample['im_id'][0])
1898
- width = sample['w']
1899
- height = sample['h']
1900
- gt_bbox = sample['gt_bbox']
1901
- gt_class = sample['gt_class']
1902
- draw = ImageDraw.Draw(image)
1903
- for i in range(gt_bbox.shape[0]):
1904
- if self.is_normalized:
1905
- gt_bbox[i][0] = gt_bbox[i][0] * width
1906
- gt_bbox[i][1] = gt_bbox[i][1] * height
1907
- gt_bbox[i][2] = gt_bbox[i][2] * width
1908
- gt_bbox[i][3] = gt_bbox[i][3] * height
1909
-
1910
- xmin, ymin, xmax, ymax = gt_bbox[i]
1911
- draw.line(
1912
- [(xmin, ymin), (xmin, ymax), (xmax, ymax), (xmax, ymin),
1913
- (xmin, ymin)],
1914
- width=2,
1915
- fill='green')
1916
- # draw label
1917
- text = str(gt_class[i][0])
1918
- tw, th = draw.textsize(text)
1919
- draw.rectangle(
1920
- [(xmin + 1, ymin - th), (xmin + tw + 1, ymin)], fill='green')
1921
- draw.text((xmin + 1, ymin - th), text, fill=(255, 255, 255))
1922
-
1923
- if 'gt_keypoint' in sample.keys():
1924
- gt_keypoint = sample['gt_keypoint']
1925
- if self.is_normalized:
1926
- for i in range(gt_keypoint.shape[1]):
1927
- if i % 2:
1928
- gt_keypoint[:, i] = gt_keypoint[:, i] * height
1929
- else:
1930
- gt_keypoint[:, i] = gt_keypoint[:, i] * width
1931
- for i in range(gt_keypoint.shape[0]):
1932
- keypoint = gt_keypoint[i]
1933
- for j in range(int(keypoint.shape[0] / 2)):
1934
- x1 = round(keypoint[2 * j]).astype(np.int32)
1935
- y1 = round(keypoint[2 * j + 1]).astype(np.int32)
1936
- draw.ellipse(
1937
- (x1, y1, x1 + 5, y1 + 5),
1938
- fill='green',
1939
- outline='green')
1940
- save_path = os.path.join(self.output_dir, out_file_name)
1941
- image.save(save_path, quality=95)
1942
- return sample
1943
-
1944
-
1945
- @register_op
1946
- class Pad(BaseOperator):
1947
- def __init__(self,
1948
- size=None,
1949
- size_divisor=32,
1950
- pad_mode=0,
1951
- offsets=None,
1952
- fill_value=(127.5, 127.5, 127.5)):
1953
- """
1954
- Pad image to a specified size or multiple of size_divisor.
1955
- Args:
1956
- size (int, Sequence): image target size, if None, pad to multiple of size_divisor, default None
1957
- size_divisor (int): size divisor, default 32
1958
-            pad_mode (int): pad mode, currently only supports four modes [-1, 0, 1, 2]. If -1, use the specified offsets;
1959
-                if 0, only pad to the right and bottom; if 1, pad according to center; if 2, only pad to the left and top.
1960
-            offsets (list): [offset_x, offset_y], specify offset while padding, only supported when pad_mode is -1
1961
-            fill_value (tuple): RGB value of the pad area, default (127.5, 127.5, 127.5)
1962
- """
1963
- super(Pad, self).__init__()
1964
-
1965
-        if size is not None and not isinstance(size, (int, Sequence)):
1966
-            raise TypeError(
1967
-                "Type of size is invalid. Must be Integer, List or Tuple, "
1968
-                "now is {}".format(type(size)))
1969
-
1970
- if isinstance(size, int):
1971
- size = [size, size]
1972
-
1973
- assert pad_mode in [
1974
- -1, 0, 1, 2
1975
- ], 'currently only supports four modes [-1, 0, 1, 2]'
1976
- if pad_mode == -1:
1977
- assert offsets, 'if pad_mode is -1, offsets should not be None'
1978
-
1979
- self.size = size
1980
- self.size_divisor = size_divisor
1981
- self.pad_mode = pad_mode
1982
- self.fill_value = fill_value
1983
- self.offsets = offsets
1984
-
1985
- def apply_segm(self, segms, offsets, im_size, size):
1986
- def _expand_poly(poly, x, y):
1987
- expanded_poly = np.array(poly)
1988
- expanded_poly[0::2] += x
1989
- expanded_poly[1::2] += y
1990
- return expanded_poly.tolist()
1991
-
1992
- def _expand_rle(rle, x, y, height, width, h, w):
1993
- if 'counts' in rle and type(rle['counts']) == list:
1994
- rle = mask_util.frPyObjects(rle, height, width)
1995
- mask = mask_util.decode(rle)
1996
- expanded_mask = np.full((h, w), 0).astype(mask.dtype)
1997
- expanded_mask[y:y + height, x:x + width] = mask
1998
- rle = mask_util.encode(
1999
- np.array(
2000
- expanded_mask, order='F', dtype=np.uint8))
2001
- return rle
2002
-
2003
- x, y = offsets
2004
- height, width = im_size
2005
- h, w = size
2006
- expanded_segms = []
2007
- for segm in segms:
2008
- if is_poly(segm):
2009
- # Polygon format
2010
- expanded_segms.append(
2011
- [_expand_poly(poly, x, y) for poly in segm])
2012
- else:
2013
- # RLE format
2014
- import pycocotools.mask as mask_util
2015
- expanded_segms.append(
2016
- _expand_rle(segm, x, y, height, width, h, w))
2017
- return expanded_segms
2018
-
2019
- def apply_bbox(self, bbox, offsets):
2020
- return bbox + np.array(offsets * 2, dtype=np.float32)
2021
-
2022
- def apply_keypoint(self, keypoints, offsets):
2023
- n = len(keypoints[0]) // 2
2024
- return keypoints + np.array(offsets * n, dtype=np.float32)
2025
-
2026
- def apply_image(self, image, offsets, im_size, size):
2027
- x, y = offsets
2028
- im_h, im_w = im_size
2029
- h, w = size
2030
- canvas = np.ones((h, w, 3), dtype=np.float32)
2031
- canvas *= np.array(self.fill_value, dtype=np.float32)
2032
- canvas[y:y + im_h, x:x + im_w, :] = image.astype(np.float32)
2033
- return canvas
2034
-
2035
- def apply(self, sample, context=None):
2036
- im = sample['image']
2037
- im_h, im_w = im.shape[:2]
2038
- if self.size:
2039
- h, w = self.size
2040
- assert (
2041
- im_h < h and im_w < w
2042
- ), '(h, w) of target size should be greater than (im_h, im_w)'
2043
- else:
2044
-            h = int(np.ceil(im_h / self.size_divisor) * self.size_divisor)
2045
-            w = int(np.ceil(im_w / self.size_divisor) * self.size_divisor)
2046
-
2047
- if h == im_h and w == im_w:
2048
- return sample
2049
-
2050
- if self.pad_mode == -1:
2051
- offset_x, offset_y = self.offsets
2052
- elif self.pad_mode == 0:
2053
- offset_y, offset_x = 0, 0
2054
- elif self.pad_mode == 1:
2055
- offset_y, offset_x = (h - im_h) // 2, (w - im_w) // 2
2056
- else:
2057
- offset_y, offset_x = h - im_h, w - im_w
2058
-
2059
- offsets, im_size, size = [offset_x, offset_y], [im_h, im_w], [h, w]
2060
-
2061
- sample['image'] = self.apply_image(im, offsets, im_size, size)
2062
-
2063
- if self.pad_mode == 0:
2064
- return sample
2065
- if 'gt_bbox' in sample and len(sample['gt_bbox']) > 0:
2066
- sample['gt_bbox'] = self.apply_bbox(sample['gt_bbox'], offsets)
2067
-
2068
- if 'gt_poly' in sample and len(sample['gt_poly']) > 0:
2069
- sample['gt_poly'] = self.apply_segm(sample['gt_poly'], offsets,
2070
- im_size, size)
2071
-
2072
- if 'gt_keypoint' in sample and len(sample['gt_keypoint']) > 0:
2073
- sample['gt_keypoint'] = self.apply_keypoint(sample['gt_keypoint'],
2074
- offsets)
2075
-
2076
- return sample
2077
-
2078
-
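The size and offset arithmetic of Pad above can be verified in isolation; the sketch below assumes size=None (pad to a multiple of size_divisor) and pad_mode=1 (center the image), with illustrative dimensions:

```python
import numpy as np

# Standalone sketch of the Pad size/offset arithmetic (not the paddlex operator).
im_h, im_w, size_divisor = 427, 640, 32

# With size=None the target is the next multiple of size_divisor.
h = int(np.ceil(im_h / size_divisor) * size_divisor)   # 448
w = int(np.ceil(im_w / size_divisor) * size_divisor)   # 640

# pad_mode=1 centers the image; the other modes anchor it to a corner.
offset_y, offset_x = (h - im_h) // 2, (w - im_w) // 2   # (10, 0)

canvas = np.full((h, w, 3), 127.5, dtype=np.float32)
canvas[offset_y:offset_y + im_h, offset_x:offset_x + im_w, :] = 0.  # stand-in for the image
print(h, w, offset_y, offset_x)  # 448 640 10 0
```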
2079
- @register_op
2080
- class Poly2Mask(BaseOperator):
2081
- """
2082
- gt poly to mask annotations
2083
- """
2084
-
2085
- def __init__(self):
2086
- super(Poly2Mask, self).__init__()
2087
- import pycocotools.mask as maskUtils
2088
- self.maskutils = maskUtils
2089
-
2090
- def _poly2mask(self, mask_ann, img_h, img_w):
2091
- if isinstance(mask_ann, list):
2092
- # polygon -- a single object might consist of multiple parts
2093
- # we merge all parts into one mask rle code
2094
- rles = self.maskutils.frPyObjects(mask_ann, img_h, img_w)
2095
- rle = self.maskutils.merge(rles)
2096
- elif isinstance(mask_ann['counts'], list):
2097
- # uncompressed RLE
2098
- rle = self.maskutils.frPyObjects(mask_ann, img_h, img_w)
2099
- else:
2100
- # rle
2101
- rle = mask_ann
2102
- mask = self.maskutils.decode(rle)
2103
- return mask
2104
-
2105
- def apply(self, sample, context=None):
2106
- assert 'gt_poly' in sample
2107
- im_h = sample['h']
2108
- im_w = sample['w']
2109
- masks = [
2110
- self._poly2mask(gt_poly, im_h, im_w)
2111
- for gt_poly in sample['gt_poly']
2112
- ]
2113
- sample['gt_segm'] = np.asarray(masks).astype(np.uint8)
2114
- return sample
2115
-
2116
-
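Poly2Mask leans entirely on pycocotools; the following standalone sketch shows the same frPyObjects / merge / decode sequence on a toy polygon (requires pycocotools; the polygon values are assumptions):

```python
# Standalone sketch of polygon -> binary mask conversion with pycocotools
# (the same calls the operator above relies on; not the paddlex operator itself).
import pycocotools.mask as mask_util

img_h, img_w = 8, 8
# one object made of a single polygon part (flat [x0, y0, x1, y1, ...] list)
poly = [[1., 1., 6., 1., 6., 6., 1., 6.]]

rles = mask_util.frPyObjects(poly, img_h, img_w)  # one RLE per polygon part
rle = mask_util.merge(rles)                       # merge the parts into one RLE
mask = mask_util.decode(rle)                      # (img_h, img_w) uint8 array
print(mask.shape, mask.sum())                     # (8, 8) and the number of filled pixels
```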
2117
- @register_op
2118
- class Rbox2Poly(BaseOperator):
2119
- """
2120
- Convert rbbox format to poly format.
2121
- """
2122
-
2123
- def __init__(self):
2124
- super(Rbox2Poly, self).__init__()
2125
-
2126
- def apply(self, sample, context=None):
2127
- assert 'gt_rbox' in sample
2128
- assert sample['gt_rbox'].shape[1] == 5
2129
- rrects = sample['gt_rbox']
2130
- x_ctr = rrects[:, 0]
2131
- y_ctr = rrects[:, 1]
2132
- width = rrects[:, 2]
2133
- height = rrects[:, 3]
2134
- x1 = x_ctr - width / 2.0
2135
- y1 = y_ctr - height / 2.0
2136
- x2 = x_ctr + width / 2.0
2137
- y2 = y_ctr + height / 2.0
2138
- sample['gt_bbox'] = np.stack([x1, y1, x2, y2], axis=1)
2139
- polys = bbox_utils.rbox2poly_np(rrects)
2140
- sample['gt_rbox2poly'] = polys
2141
- return sample
2142
-
2143
-
2144
- @register_op
2145
- class AugmentHSV(BaseOperator):
2146
- def __init__(self, fraction=0.50, is_bgr=True):
2147
- """
2148
-        Augment the S and V channels of image data.
2149
- Args:
2150
- fraction (float): the fraction for augment. Default: 0.5.
2151
- is_bgr (bool): whether the image is BGR mode. Default: True.
2152
- """
2153
- super(AugmentHSV, self).__init__()
2154
- self.fraction = fraction
2155
- self.is_bgr = is_bgr
2156
-
2157
- def apply(self, sample, context=None):
2158
- img = sample['image']
2159
- if self.is_bgr:
2160
- img_hsv = cv2.cvtColor(img, cv2.COLOR_BGR2HSV)
2161
- else:
2162
- img_hsv = cv2.cvtColor(img, cv2.COLOR_RGB2HSV)
2163
- S = img_hsv[:, :, 1].astype(np.float32)
2164
- V = img_hsv[:, :, 2].astype(np.float32)
2165
-
2166
- a = (random.random() * 2 - 1) * self.fraction + 1
2167
- S *= a
2168
- if a > 1:
2169
- np.clip(S, a_min=0, a_max=255, out=S)
2170
-
2171
- a = (random.random() * 2 - 1) * self.fraction + 1
2172
- V *= a
2173
- if a > 1:
2174
- np.clip(V, a_min=0, a_max=255, out=V)
2175
-
2176
- img_hsv[:, :, 1] = S.astype(np.uint8)
2177
- img_hsv[:, :, 2] = V.astype(np.uint8)
2178
- if self.is_bgr:
2179
- cv2.cvtColor(img_hsv, cv2.COLOR_HSV2BGR, dst=img)
2180
- else:
2181
- cv2.cvtColor(img_hsv, cv2.COLOR_HSV2RGB, dst=img)
2182
-
2183
- sample['image'] = img
2184
- return sample
2185
-
2186
-
2187
- @register_op
2188
- class Norm2PixelBbox(BaseOperator):
2189
- """
2190
-    Transform the bounding box's coordinates which are in [0,1] to pixels.
2191
- """
2192
-
2193
- def __init__(self):
2194
- super(Norm2PixelBbox, self).__init__()
2195
-
2196
- def apply(self, sample, context=None):
2197
- assert 'gt_bbox' in sample
2198
- bbox = sample['gt_bbox']
2199
- height, width = sample['image'].shape[:2]
2200
- bbox[:, 0::2] = bbox[:, 0::2] * width
2201
- bbox[:, 1::2] = bbox[:, 1::2] * height
2202
- sample['gt_bbox'] = bbox
2203
- return sample
2204
-
2205
-
2206
- @register_op
2207
- class BboxCXCYWH2XYXY(BaseOperator):
2208
- """
2209
- Convert bbox CXCYWH format to XYXY format.
2210
- [center_x, center_y, width, height] -> [x0, y0, x1, y1]
2211
- """
2212
-
2213
- def __init__(self):
2214
- super(BboxCXCYWH2XYXY, self).__init__()
2215
-
2216
- def apply(self, sample, context=None):
2217
- assert 'gt_bbox' in sample
2218
- bbox0 = sample['gt_bbox']
2219
- bbox = bbox0.copy()
2220
-
2221
- bbox[:, :2] = bbox0[:, :2] - bbox0[:, 2:4] / 2.
2222
- bbox[:, 2:4] = bbox0[:, :2] + bbox0[:, 2:4] / 2.
2223
- sample['gt_bbox'] = bbox
2224
- return sample
2225
-
2226
-
2227
- @register_op
2228
- class RandomResizeCrop(BaseOperator):
2229
- """Random resize and crop image and bboxes.
2230
- Args:
2231
-        resizes (list): resize the image to one of the sizes in `resizes`. If keep_ratio is True and mode is
2232
-            'long', resize the image's long side to the maximum of the chosen size; if keep_ratio is
2233
-            True and mode is 'short', resize the image's short side to the minimum of the chosen size.
2234
- cropsizes (list): crop sizes after resize, [(min_crop_1, max_crop_1), ...]
2235
- mode (str): resize mode, `long` or `short`. Details see resizes.
2236
- prob (float): probability of this op.
2237
- keep_ratio (bool): whether keep_ratio or not, default true
2238
- interp (int): the interpolation method
2239
- thresholds (list): iou thresholds for decide a valid bbox crop.
2240
- num_attempts (int): number of tries before giving up.
2241
- allow_no_crop (bool): allow return without actually cropping them.
2242
- cover_all_box (bool): ensure all bboxes are covered in the final crop.
2243
-        is_mask_crop (bool): whether to crop the segmentation.
2244
- """
2245
-
2246
- def __init__(
2247
- self,
2248
- resizes,
2249
- cropsizes,
2250
- prob=0.5,
2251
- mode='short',
2252
- keep_ratio=True,
2253
- interp=cv2.INTER_LINEAR,
2254
- num_attempts=3,
2255
- cover_all_box=False,
2256
- allow_no_crop=False,
2257
- thresholds=[0.3, 0.5, 0.7],
2258
- is_mask_crop=False, ):
2259
- super(RandomResizeCrop, self).__init__()
2260
-
2261
- self.resizes = resizes
2262
- self.cropsizes = cropsizes
2263
- self.prob = prob
2264
- self.mode = mode
2265
-
2266
- self.resizer = Resize(0, keep_ratio=keep_ratio, interp=interp)
2267
- self.croper = RandomCrop(
2268
- num_attempts=num_attempts,
2269
- cover_all_box=cover_all_box,
2270
- thresholds=thresholds,
2271
- allow_no_crop=allow_no_crop,
2272
- is_mask_crop=is_mask_crop)
2273
-
2274
- def _format_size(self, size):
2275
- if isinstance(size, Integral):
2276
- size = (size, size)
2277
- return size
2278
-
2279
- def apply(self, sample, context=None):
2280
- if random.random() < self.prob:
2281
- _resize = self._format_size(random.choice(self.resizes))
2282
- _cropsize = self._format_size(random.choice(self.cropsizes))
2283
- sample = self._resize(
2284
- self.resizer,
2285
- sample,
2286
- size=_resize,
2287
- mode=self.mode,
2288
- context=context)
2289
- sample = self._random_crop(
2290
- self.croper, sample, size=_cropsize, context=context)
2291
- return sample
2292
-
2293
- @staticmethod
2294
- def _random_crop(croper, sample, size, context=None):
2295
- if 'gt_bbox' in sample and len(sample['gt_bbox']) == 0:
2296
- return sample
2297
-
2298
- self = croper
2299
- h, w = sample['image'].shape[:2]
2300
- gt_bbox = sample['gt_bbox']
2301
- cropsize = size
2302
- min_crop = min(cropsize)
2303
- max_crop = max(cropsize)
2304
-
2305
- thresholds = list(self.thresholds)
2306
- np.random.shuffle(thresholds)
2307
-
2308
- for thresh in thresholds:
2309
- found = False
2310
- for _ in range(self.num_attempts):
2311
-
2312
- crop_h = random.randint(min_crop, min(h, max_crop))
2313
- crop_w = random.randint(min_crop, min(w, max_crop))
2314
-
2315
- crop_y = random.randint(0, h - crop_h)
2316
- crop_x = random.randint(0, w - crop_w)
2317
-
2318
- crop_box = [crop_x, crop_y, crop_x + crop_w, crop_y + crop_h]
2319
- iou = self._iou_matrix(
2320
- gt_bbox, np.array(
2321
- [crop_box], dtype=np.float32))
2322
- if iou.max() < thresh:
2323
- continue
2324
-
2325
- if self.cover_all_box and iou.min() < thresh:
2326
- continue
2327
-
2328
- cropped_box, valid_ids = self._crop_box_with_center_constraint(
2329
- gt_bbox, np.array(
2330
- crop_box, dtype=np.float32))
2331
- if valid_ids.size > 0:
2332
- found = True
2333
- break
2334
-
2335
- if found:
2336
- if self.is_mask_crop and 'gt_poly' in sample and len(sample[
2337
- 'gt_poly']) > 0:
2338
- crop_polys = self.crop_segms(
2339
- sample['gt_poly'],
2340
- valid_ids,
2341
- np.array(
2342
- crop_box, dtype=np.int64),
2343
- h,
2344
- w)
2345
- if [] in crop_polys:
2346
- delete_id = list()
2347
- valid_polys = list()
2348
- for id, crop_poly in enumerate(crop_polys):
2349
- if crop_poly == []:
2350
- delete_id.append(id)
2351
- else:
2352
- valid_polys.append(crop_poly)
2353
- valid_ids = np.delete(valid_ids, delete_id)
2354
- if len(valid_polys) == 0:
2355
- return sample
2356
- sample['gt_poly'] = valid_polys
2357
- else:
2358
- sample['gt_poly'] = crop_polys
2359
-
2360
- if 'gt_segm' in sample:
2361
- sample['gt_segm'] = self._crop_segm(sample['gt_segm'],
2362
- crop_box)
2363
- sample['gt_segm'] = np.take(
2364
- sample['gt_segm'], valid_ids, axis=0)
2365
-
2366
- sample['image'] = self._crop_image(sample['image'], crop_box)
2367
- sample['gt_bbox'] = np.take(cropped_box, valid_ids, axis=0)
2368
- sample['gt_class'] = np.take(
2369
- sample['gt_class'], valid_ids, axis=0)
2370
- if 'gt_score' in sample:
2371
- sample['gt_score'] = np.take(
2372
- sample['gt_score'], valid_ids, axis=0)
2373
-
2374
- if 'is_crowd' in sample:
2375
- sample['is_crowd'] = np.take(
2376
- sample['is_crowd'], valid_ids, axis=0)
2377
- return sample
2378
-
2379
- return sample
2380
-
2381
- @staticmethod
2382
- def _resize(resizer, sample, size, mode='short', context=None):
2383
- self = resizer
2384
- im = sample['image']
2385
- target_size = size
2386
-
2387
- if not isinstance(im, np.ndarray):
2388
- raise TypeError("{}: image type is not numpy.".format(self))
2389
- if len(im.shape) != 3:
2390
- raise ImageError('{}: image is not 3-dimensional.'.format(self))
2391
-
2392
- # apply image
2393
- im_shape = im.shape
2394
- if self.keep_ratio:
2395
-
2396
- im_size_min = np.min(im_shape[0:2])
2397
- im_size_max = np.max(im_shape[0:2])
2398
-
2399
- target_size_min = np.min(target_size)
2400
- target_size_max = np.max(target_size)
2401
-
2402
- if mode == 'long':
2403
- im_scale = min(target_size_min / im_size_min,
2404
- target_size_max / im_size_max)
2405
- else:
2406
- im_scale = max(target_size_min / im_size_min,
2407
- target_size_max / im_size_max)
2408
-
2409
- resize_h = im_scale * float(im_shape[0])
2410
- resize_w = im_scale * float(im_shape[1])
2411
-
2412
- im_scale_x = im_scale
2413
- im_scale_y = im_scale
2414
- else:
2415
- resize_h, resize_w = target_size
2416
- im_scale_y = resize_h / im_shape[0]
2417
- im_scale_x = resize_w / im_shape[1]
2418
-
2419
- im = self.apply_image(sample['image'], [im_scale_x, im_scale_y])
2420
- sample['image'] = im
2421
- sample['im_shape'] = np.asarray([resize_h, resize_w], dtype=np.float32)
2422
- if 'scale_factor' in sample:
2423
- scale_factor = sample['scale_factor']
2424
- sample['scale_factor'] = np.asarray(
2425
- [scale_factor[0] * im_scale_y, scale_factor[1] * im_scale_x],
2426
- dtype=np.float32)
2427
- else:
2428
- sample['scale_factor'] = np.asarray(
2429
- [im_scale_y, im_scale_x], dtype=np.float32)
2430
-
2431
- # apply bbox
2432
- if 'gt_bbox' in sample and len(sample['gt_bbox']) > 0:
2433
- sample['gt_bbox'] = self.apply_bbox(sample['gt_bbox'],
2434
- [im_scale_x, im_scale_y],
2435
- [resize_w, resize_h])
2436
-
2437
- # apply rbox
2438
- if 'gt_rbox2poly' in sample:
2439
- if np.array(sample['gt_rbox2poly']).shape[1] != 8:
2440
- logger.warn(
2441
-                    "gt_rbox2poly's length should be 8, but actually is {}".
2442
- format(len(sample['gt_rbox2poly'])))
2443
- sample['gt_rbox2poly'] = self.apply_bbox(sample['gt_rbox2poly'],
2444
- [im_scale_x, im_scale_y],
2445
- [resize_w, resize_h])
2446
-
2447
- # apply polygon
2448
- if 'gt_poly' in sample and len(sample['gt_poly']) > 0:
2449
- sample['gt_poly'] = self.apply_segm(
2450
- sample['gt_poly'], im_shape[:2], [im_scale_x, im_scale_y])
2451
-
2452
- # apply semantic
2453
- if 'semantic' in sample and sample['semantic']:
2454
- semantic = sample['semantic']
2455
- semantic = cv2.resize(
2456
- semantic.astype('float32'),
2457
- None,
2458
- None,
2459
- fx=im_scale_x,
2460
- fy=im_scale_y,
2461
- interpolation=self.interp)
2462
- semantic = np.asarray(semantic).astype('int32')
2463
- semantic = np.expand_dims(semantic, 0)
2464
- sample['semantic'] = semantic
2465
-
2466
- # apply gt_segm
2467
- if 'gt_segm' in sample and len(sample['gt_segm']) > 0:
2468
- masks = [
2469
- cv2.resize(
2470
- gt_segm,
2471
- None,
2472
- None,
2473
- fx=im_scale_x,
2474
- fy=im_scale_y,
2475
- interpolation=cv2.INTER_NEAREST)
2476
- for gt_segm in sample['gt_segm']
2477
- ]
2478
- sample['gt_segm'] = np.asarray(masks).astype(np.uint8)
2479
-
2480
- return sample
2481
-
2482
-
2483
- @register_op
2484
- class RandomSelect(BaseOperator):
2485
- """
2486
- Randomly choose a transformation between transforms1 and transforms2,
2487
- and the probability of choosing transforms1 is p.
2488
-
2489
- The code is based on https://github.com/facebookresearch/detr/blob/main/datasets/transforms.py
2490
-
2491
- """
2492
-
2493
- def __init__(self, transforms1, transforms2, p=0.5):
2494
- super(RandomSelect, self).__init__()
2495
- self.transforms1 = Compose(transforms1)
2496
- self.transforms2 = Compose(transforms2)
2497
- self.p = p
2498
-
2499
- def apply(self, sample, context=None):
2500
- if random.random() < self.p:
2501
- return self.transforms1(sample)
2502
- return self.transforms2(sample)
2503
-
2504
-
2505
- @register_op
2506
- class RandomShortSideResize(BaseOperator):
2507
- def __init__(self,
2508
- short_side_sizes,
2509
- max_size=None,
2510
- interp=cv2.INTER_LINEAR,
2511
- random_interp=False):
2512
- """
2513
- Resize the image randomly according to the short side. If max_size is not None,
2514
-        the long side is scaled according to max_size. The whole process keeps the aspect ratio.
2515
- Args:
2516
- short_side_sizes (list|tuple): Image target short side size.
2517
- max_size (int): The size of the longest side of image after resize.
2518
- interp (int): The interpolation method.
2519
- random_interp (bool): Whether random select interpolation method.
2520
- """
2521
- super(RandomShortSideResize, self).__init__()
2522
-
2523
- assert isinstance(short_side_sizes,
2524
- Sequence), "short_side_sizes must be List or Tuple"
2525
-
2526
- self.short_side_sizes = short_side_sizes
2527
- self.max_size = max_size
2528
- self.interp = interp
2529
- self.random_interp = random_interp
2530
- self.interps = [
2531
- cv2.INTER_NEAREST,
2532
- cv2.INTER_LINEAR,
2533
- cv2.INTER_AREA,
2534
- cv2.INTER_CUBIC,
2535
- cv2.INTER_LANCZOS4,
2536
- ]
2537
-
2538
- def get_size_with_aspect_ratio(self, image_shape, size, max_size=None):
2539
- h, w = image_shape
2540
- if max_size is not None:
2541
- min_original_size = float(min((w, h)))
2542
- max_original_size = float(max((w, h)))
2543
- if max_original_size / min_original_size * size > max_size:
2544
- size = int(
2545
- round(max_size * min_original_size / max_original_size))
2546
-
2547
- if (w <= h and w == size) or (h <= w and h == size):
2548
- return (w, h)
2549
-
2550
- if w < h:
2551
- ow = size
2552
- oh = int(size * h / w)
2553
- else:
2554
- oh = size
2555
- ow = int(size * w / h)
2556
-
2557
- return (ow, oh)
2558
-
2559
- def resize(self,
2560
- sample,
2561
- target_size,
2562
- max_size=None,
2563
- interp=cv2.INTER_LINEAR):
2564
- im = sample['image']
2565
- if not isinstance(im, np.ndarray):
2566
- raise TypeError("{}: image type is not numpy.".format(self))
2567
- if len(im.shape) != 3:
2568
- raise ImageError('{}: image is not 3-dimensional.'.format(self))
2569
-
2570
- target_size = self.get_size_with_aspect_ratio(im.shape[:2],
2571
- target_size, max_size)
2572
- im_scale_y, im_scale_x = target_size[1] / im.shape[0], target_size[
2573
- 0] / im.shape[1]
2574
-
2575
- sample['image'] = cv2.resize(im, target_size, interpolation=interp)
2576
- sample['im_shape'] = np.asarray(target_size[::-1], dtype=np.float32)
2577
- if 'scale_factor' in sample:
2578
- scale_factor = sample['scale_factor']
2579
- sample['scale_factor'] = np.asarray(
2580
- [scale_factor[0] * im_scale_y, scale_factor[1] * im_scale_x],
2581
- dtype=np.float32)
2582
- else:
2583
- sample['scale_factor'] = np.asarray(
2584
- [im_scale_y, im_scale_x], dtype=np.float32)
2585
-
2586
- # apply bbox
2587
- if 'gt_bbox' in sample and len(sample['gt_bbox']) > 0:
2588
- sample['gt_bbox'] = self.apply_bbox(
2589
- sample['gt_bbox'], [im_scale_x, im_scale_y], target_size)
2590
- # apply polygon
2591
- if 'gt_poly' in sample and len(sample['gt_poly']) > 0:
2592
- sample['gt_poly'] = self.apply_segm(
2593
- sample['gt_poly'], im.shape[:2], [im_scale_x, im_scale_y])
2594
- # apply semantic
2595
- if 'semantic' in sample and sample['semantic']:
2596
- semantic = sample['semantic']
2597
- semantic = cv2.resize(
2598
- semantic.astype('float32'),
2599
- target_size,
2600
- interpolation=self.interp)
2601
- semantic = np.asarray(semantic).astype('int32')
2602
- semantic = np.expand_dims(semantic, 0)
2603
- sample['semantic'] = semantic
2604
- # apply gt_segm
2605
- if 'gt_segm' in sample and len(sample['gt_segm']) > 0:
2606
- masks = [
2607
- cv2.resize(
2608
- gt_segm, target_size, interpolation=cv2.INTER_NEAREST)
2609
- for gt_segm in sample['gt_segm']
2610
- ]
2611
- sample['gt_segm'] = np.asarray(masks).astype(np.uint8)
2612
- return sample
2613
-
2614
- def apply_bbox(self, bbox, scale, size):
2615
- im_scale_x, im_scale_y = scale
2616
- resize_w, resize_h = size
2617
- bbox[:, 0::2] *= im_scale_x
2618
- bbox[:, 1::2] *= im_scale_y
2619
- bbox[:, 0::2] = np.clip(bbox[:, 0::2], 0, resize_w)
2620
- bbox[:, 1::2] = np.clip(bbox[:, 1::2], 0, resize_h)
2621
- return bbox.astype('float32')
2622
-
2623
- def apply_segm(self, segms, im_size, scale):
2624
- def _resize_poly(poly, im_scale_x, im_scale_y):
2625
- resized_poly = np.array(poly).astype('float32')
2626
- resized_poly[0::2] *= im_scale_x
2627
- resized_poly[1::2] *= im_scale_y
2628
- return resized_poly.tolist()
2629
-
2630
- def _resize_rle(rle, im_h, im_w, im_scale_x, im_scale_y):
2631
- if 'counts' in rle and type(rle['counts']) == list:
2632
- rle = mask_util.frPyObjects(rle, im_h, im_w)
2633
-
2634
- mask = mask_util.decode(rle)
2635
- mask = cv2.resize(
2636
- mask,
2637
- None,
2638
- None,
2639
- fx=im_scale_x,
2640
- fy=im_scale_y,
2641
- interpolation=self.interp)
2642
- rle = mask_util.encode(np.array(mask, order='F', dtype=np.uint8))
2643
- return rle
2644
-
2645
- im_h, im_w = im_size
2646
- im_scale_x, im_scale_y = scale
2647
- resized_segms = []
2648
- for segm in segms:
2649
- if is_poly(segm):
2650
- # Polygon format
2651
- resized_segms.append([
2652
- _resize_poly(poly, im_scale_x, im_scale_y) for poly in segm
2653
- ])
2654
- else:
2655
- # RLE format
2656
- import pycocotools.mask as mask_util
2657
- resized_segms.append(
2658
- _resize_rle(segm, im_h, im_w, im_scale_x, im_scale_y))
2659
-
2660
- return resized_segms
2661
-
2662
- def apply(self, sample, context=None):
2663
- target_size = random.choice(self.short_side_sizes)
2664
- interp = random.choice(
2665
- self.interps) if self.random_interp else self.interp
2666
-
2667
- return self.resize(sample, target_size, self.max_size, interp)
2668
-
2669
-
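The short-side/max-size arithmetic in get_size_with_aspect_ratio above is easiest to follow with concrete numbers; the sketch below reproduces that computation standalone, with assumed input shapes:

```python
# Standalone check of the short-side / max-size arithmetic above (not the paddlex operator).
def get_size_with_aspect_ratio(image_shape, size, max_size=None):
    h, w = image_shape
    if max_size is not None:
        min_original_size = float(min((w, h)))
        max_original_size = float(max((w, h)))
        if max_original_size / min_original_size * size > max_size:
            size = int(round(max_size * min_original_size / max_original_size))
    if (w <= h and w == size) or (h <= w and h == size):
        return (w, h)
    if w < h:
        return (size, int(size * h / w))
    return (int(size * w / h), size)

print(get_size_with_aspect_ratio((600, 800), 480, max_size=800))    # (640, 480): short side -> 480
print(get_size_with_aspect_ratio((480, 640), 800, max_size=1333))   # (1066, 800): still within max_size
```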
2670
- @register_op
2671
- class RandomSizeCrop(BaseOperator):
2672
- """
2673
-    Randomly crop the image to a height and width between `min_size` and `max_size`.
2674
- """
2675
-
2676
- def __init__(self, min_size, max_size):
2677
- super(RandomSizeCrop, self).__init__()
2678
- self.min_size = min_size
2679
- self.max_size = max_size
2680
-
2681
- from paddle.vision.transforms.functional import crop as paddle_crop
2682
- self.paddle_crop = paddle_crop
2683
-
2684
- @staticmethod
2685
- def get_crop_params(img_shape, output_size):
2686
- """Get parameters for ``crop`` for a random crop.
2687
- Args:
2688
- img_shape (list|tuple): Image's height and width.
2689
- output_size (list|tuple): Expected output size of the crop.
2690
- Returns:
2691
- tuple: params (i, j, h, w) to be passed to ``crop`` for random crop.
2692
- """
2693
- h, w = img_shape
2694
- th, tw = output_size
2695
-
2696
- if h + 1 < th or w + 1 < tw:
2697
- raise ValueError(
2698
-                "Required crop size {} is larger than input image size {}".
2699
- format((th, tw), (h, w)))
2700
-
2701
- if w == tw and h == th:
2702
- return 0, 0, h, w
2703
-
2704
- i = random.randint(0, h - th + 1)
2705
- j = random.randint(0, w - tw + 1)
2706
- return i, j, th, tw
2707
-
2708
- def crop(self, sample, region):
2709
- image_shape = sample['image'].shape[:2]
2710
- sample['image'] = self.paddle_crop(sample['image'], *region)
2711
-
2712
- keep_index = None
2713
- # apply bbox
2714
- if 'gt_bbox' in sample and len(sample['gt_bbox']) > 0:
2715
- sample['gt_bbox'] = self.apply_bbox(sample['gt_bbox'], region)
2716
- bbox = sample['gt_bbox'].reshape([-1, 2, 2])
2717
- area = (bbox[:, 1, :] - bbox[:, 0, :]).prod(axis=1)
2718
- keep_index = np.where(area > 0)[0]
2719
- sample['gt_bbox'] = sample['gt_bbox'][keep_index] if len(
2720
- keep_index) > 0 else np.zeros(
2721
- [0, 4], dtype=np.float32)
2722
- sample['gt_class'] = sample['gt_class'][keep_index] if len(
2723
- keep_index) > 0 else np.zeros(
2724
- [0, 1], dtype=np.float32)
2725
- if 'gt_score' in sample:
2726
- sample['gt_score'] = sample['gt_score'][keep_index] if len(
2727
- keep_index) > 0 else np.zeros(
2728
- [0, 1], dtype=np.float32)
2729
- if 'is_crowd' in sample:
2730
- sample['is_crowd'] = sample['is_crowd'][keep_index] if len(
2731
- keep_index) > 0 else np.zeros(
2732
- [0, 1], dtype=np.float32)
2733
-
2734
- # apply polygon
2735
- if 'gt_poly' in sample and len(sample['gt_poly']) > 0:
2736
- sample['gt_poly'] = self.apply_segm(sample['gt_poly'], region,
2737
- image_shape)
2738
- if keep_index is not None:
2739
- sample['gt_poly'] = sample['gt_poly'][keep_index]
2740
- # apply gt_segm
2741
- if 'gt_segm' in sample and len(sample['gt_segm']) > 0:
2742
- i, j, h, w = region
2743
- sample['gt_segm'] = sample['gt_segm'][:, i:i + h, j:j + w]
2744
- if keep_index is not None:
2745
- sample['gt_segm'] = sample['gt_segm'][keep_index]
2746
-
2747
- return sample
2748
-
2749
- def apply_bbox(self, bbox, region):
2750
- i, j, h, w = region
2751
- region_size = np.asarray([w, h])
2752
- crop_bbox = bbox - np.asarray([j, i, j, i])
2753
- crop_bbox = np.minimum(crop_bbox.reshape([-1, 2, 2]), region_size)
2754
- crop_bbox = crop_bbox.clip(min=0)
2755
- return crop_bbox.reshape([-1, 4]).astype('float32')
2756
-
2757
- def apply_segm(self, segms, region, image_shape):
2758
- def _crop_poly(segm, crop):
2759
- xmin, ymin, xmax, ymax = crop
2760
- crop_coord = [xmin, ymin, xmin, ymax, xmax, ymax, xmax, ymin]
2761
- crop_p = np.array(crop_coord).reshape(4, 2)
2762
- crop_p = Polygon(crop_p)
2763
-
2764
- crop_segm = list()
2765
- for poly in segm:
2766
- poly = np.array(poly).reshape(len(poly) // 2, 2)
2767
- polygon = Polygon(poly)
2768
- if not polygon.is_valid:
2769
- exterior = polygon.exterior
2770
- multi_lines = exterior.intersection(exterior)
2771
- polygons = shapely.ops.polygonize(multi_lines)
2772
- polygon = MultiPolygon(polygons)
2773
- multi_polygon = list()
2774
- if isinstance(polygon, MultiPolygon):
2775
- multi_polygon = copy.deepcopy(polygon)
2776
- else:
2777
- multi_polygon.append(copy.deepcopy(polygon))
2778
- for per_polygon in multi_polygon:
2779
- inter = per_polygon.intersection(crop_p)
2780
- if not inter:
2781
- continue
2782
- if isinstance(inter, (MultiPolygon, GeometryCollection)):
2783
- for part in inter:
2784
- if not isinstance(part, Polygon):
2785
- continue
2786
- part = np.squeeze(
2787
- np.array(part.exterior.coords[:-1]).reshape(
2788
- 1, -1))
2789
- part[0::2] -= xmin
2790
- part[1::2] -= ymin
2791
- crop_segm.append(part.tolist())
2792
- elif isinstance(inter, Polygon):
2793
- crop_poly = np.squeeze(
2794
- np.array(inter.exterior.coords[:-1]).reshape(1,
2795
- -1))
2796
- crop_poly[0::2] -= xmin
2797
- crop_poly[1::2] -= ymin
2798
- crop_segm.append(crop_poly.tolist())
2799
- else:
2800
- continue
2801
- return crop_segm
2802
-
2803
- def _crop_rle(rle, crop, height, width):
2804
- if 'counts' in rle and type(rle['counts']) == list:
2805
- rle = mask_util.frPyObjects(rle, height, width)
2806
- mask = mask_util.decode(rle)
2807
- mask = mask[crop[1]:crop[3], crop[0]:crop[2]]
2808
- rle = mask_util.encode(np.array(mask, order='F', dtype=np.uint8))
2809
- return rle
2810
-
2811
- i, j, h, w = region
2812
- crop = [j, i, j + w, i + h]
2813
- height, width = image_shape
2814
- crop_segms = []
2815
- for segm in segms:
2816
- if is_poly(segm):
2817
- import copy
2818
- import shapely.ops
2819
- from shapely.geometry import Polygon, MultiPolygon, GeometryCollection
2820
- # Polygon format
2821
- crop_segms.append(_crop_poly(segm, crop))
2822
- else:
2823
- # RLE format
2824
- import pycocotools.mask as mask_util
2825
- crop_segms.append(_crop_rle(segm, crop, height, width))
2826
- return crop_segms
2827
-
2828
- def apply(self, sample, context=None):
2829
- h = random.randint(self.min_size,
2830
- min(sample['image'].shape[0], self.max_size))
2831
- w = random.randint(self.min_size,
2832
- min(sample['image'].shape[1], self.max_size))
2833
-
2834
- region = self.get_crop_params(sample['image'].shape[:2], [h, w])
2835
- return self.crop(sample, region)
2836
-
2837
-
2838
- @register_op
2839
- class WarpAffine(BaseOperator):
2840
- def __init__(self,
2841
- keep_res=False,
2842
- pad=31,
2843
- input_h=512,
2844
- input_w=512,
2845
- scale=0.4,
2846
- shift=0.1):
2847
- """WarpAffine
2848
- Warp affine the image
2849
-
2850
- The code is based on https://github.com/xingyizhou/CenterNet/blob/master/src/lib/datasets/sample/ctdet.py
2851
-
2852
-
2853
- """
2854
- super(WarpAffine, self).__init__()
2855
- self.keep_res = keep_res
2856
- self.pad = pad
2857
- self.input_h = input_h
2858
- self.input_w = input_w
2859
- self.scale = scale
2860
- self.shift = shift
2861
-
2862
- def apply(self, sample, context=None):
2863
- img = sample['image']
2864
- img = cv2.cvtColor(img, cv2.COLOR_RGB2BGR)
2865
- if 'gt_bbox' in sample and len(sample['gt_bbox']) == 0:
2866
- return sample
2867
-
2868
- h, w = img.shape[:2]
2869
-
2870
- if self.keep_res:
2871
- input_h = (h | self.pad) + 1
2872
- input_w = (w | self.pad) + 1
2873
- s = np.array([input_w, input_h], dtype=np.float32)
2874
- c = np.array([w // 2, h // 2], dtype=np.float32)
2875
-
2876
- else:
2877
- s = max(h, w) * 1.0
2878
- input_h, input_w = self.input_h, self.input_w
2879
- c = np.array([w / 2., h / 2.], dtype=np.float32)
2880
-
2881
- trans_input = get_affine_transform(c, s, 0, [input_w, input_h])
2882
- img = cv2.resize(img, (w, h))
2883
- inp = cv2.warpAffine(
2884
- img, trans_input, (input_w, input_h), flags=cv2.INTER_LINEAR)
2885
- sample['image'] = inp
2886
- return sample
2887
-
2888
-
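In the keep_res branch above, `(x | self.pad) + 1` with pad=31 is a bit trick for rounding the input size up to a 32-aligned value; a standalone check:

```python
# Standalone check of the keep_res size rounding above (not the paddlex operator):
# with pad = 31, (x | pad) + 1 is the smallest multiple of 32 strictly greater than x,
# i.e. ((x // 32) + 1) * 32, so the warped input always lands on a 32-aligned size.
pad = 31
for x in (480, 500, 512):
    assert (x | pad) + 1 == ((x // 32) + 1) * 32
    print(x, "->", (x | pad) + 1)   # 480 -> 512, 500 -> 512, 512 -> 544
```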
2889
- @register_op
2890
- class FlipWarpAffine(BaseOperator):
2891
- def __init__(self,
2892
- keep_res=False,
2893
- pad=31,
2894
- input_h=512,
2895
- input_w=512,
2896
- not_rand_crop=False,
2897
- scale=0.4,
2898
- shift=0.1,
2899
- flip=0.5,
2900
- is_scale=True,
2901
- use_random=True):
2902
- """FlipWarpAffine
2903
- 1. Random Crop
2904
-        2. Flip the image horizontally
2905
- 3. Warp affine the image
2906
- """
2907
- super(FlipWarpAffine, self).__init__()
2908
- self.keep_res = keep_res
2909
- self.pad = pad
2910
- self.input_h = input_h
2911
- self.input_w = input_w
2912
- self.not_rand_crop = not_rand_crop
2913
- self.scale = scale
2914
- self.shift = shift
2915
- self.flip = flip
2916
- self.is_scale = is_scale
2917
- self.use_random = use_random
2918
-
2919
- def apply(self, sample, context=None):
2920
- img = sample['image']
2921
- img = cv2.cvtColor(img, cv2.COLOR_RGB2BGR)
2922
- if 'gt_bbox' in sample and len(sample['gt_bbox']) == 0:
2923
- return sample
2924
-
2925
- h, w = img.shape[:2]
2926
-
2927
- if self.keep_res:
2928
- input_h = (h | self.pad) + 1
2929
- input_w = (w | self.pad) + 1
2930
- s = np.array([input_w, input_h], dtype=np.float32)
2931
- c = np.array([w // 2, h // 2], dtype=np.float32)
2932
-
2933
- else:
2934
- s = max(h, w) * 1.0
2935
- input_h, input_w = self.input_h, self.input_w
2936
- c = np.array([w / 2., h / 2.], dtype=np.float32)
2937
-
2938
- if self.use_random:
2939
- gt_bbox = sample['gt_bbox']
2940
- if not self.not_rand_crop:
2941
- s = s * np.random.choice(np.arange(0.6, 1.4, 0.1))
2942
- w_border = get_border(128, w)
2943
- h_border = get_border(128, h)
2944
- c[0] = np.random.randint(low=w_border, high=w - w_border)
2945
- c[1] = np.random.randint(low=h_border, high=h - h_border)
2946
- else:
2947
- sf = self.scale
2948
- cf = self.shift
2949
- c[0] += s * np.clip(np.random.randn() * cf, -2 * cf, 2 * cf)
2950
- c[1] += s * np.clip(np.random.randn() * cf, -2 * cf, 2 * cf)
2951
- s = s * np.clip(np.random.randn() * sf + 1, 1 - sf, 1 + sf)
2952
-
2953
- if np.random.random() < self.flip:
2954
- img = img[:, ::-1, :]
2955
- c[0] = w - c[0] - 1
2956
- oldx1 = gt_bbox[:, 0].copy()
2957
- oldx2 = gt_bbox[:, 2].copy()
2958
- gt_bbox[:, 0] = w - oldx2 - 1
2959
- gt_bbox[:, 2] = w - oldx1 - 1
2960
- sample['gt_bbox'] = gt_bbox
2961
-
2962
- trans_input = get_affine_transform(c, s, 0, [input_w, input_h])
2963
- if not self.use_random:
2964
- img = cv2.resize(img, (w, h))
2965
- inp = cv2.warpAffine(
2966
- img, trans_input, (input_w, input_h), flags=cv2.INTER_LINEAR)
2967
- if self.is_scale:
2968
- inp = (inp.astype(np.float32) / 255.)
2969
- sample['image'] = inp
2970
- sample['center'] = c
2971
- sample['scale'] = s
2972
- return sample
2973
-
2974
-
2975
- @register_op
2976
- class CenterRandColor(BaseOperator):
2977
- """Random color for CenterNet series models.
2978
- Args:
2979
- saturation (float): saturation settings.
2980
- contrast (float): contrast settings.
2981
- brightness (float): brightness settings.
2982
- """
2983
-
2984
- def __init__(self, saturation=0.4, contrast=0.4, brightness=0.4):
2985
- super(CenterRandColor, self).__init__()
2986
- self.saturation = saturation
2987
- self.contrast = contrast
2988
- self.brightness = brightness
2989
-
2990
- def apply_saturation(self, img, img_gray):
2991
- alpha = 1. + np.random.uniform(
2992
- low=-self.saturation, high=self.saturation)
2993
- self._blend(alpha, img, img_gray[:, :, None])
2994
- return img
2995
-
2996
- def apply_contrast(self, img, img_gray):
2997
- alpha = 1. + np.random.uniform(low=-self.contrast, high=self.contrast)
2998
- img_mean = img_gray.mean()
2999
- self._blend(alpha, img, img_mean)
3000
- return img
3001
-
3002
- def apply_brightness(self, img, img_gray):
3003
- alpha = 1 + np.random.uniform(
3004
- low=-self.brightness, high=self.brightness)
3005
- img *= alpha
3006
- return img
3007
-
3008
- def _blend(self, alpha, img, img_mean):
3009
- img *= alpha
3010
- img_mean *= (1 - alpha)
3011
- img += img_mean
3012
-
3013
- def __call__(self, sample, context=None):
3014
- img = sample['image']
3015
- img_gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
3016
- functions = [
3017
- self.apply_brightness,
3018
- self.apply_contrast,
3019
- self.apply_saturation,
3020
- ]
3021
- distortions = np.random.permutation(functions)
3022
- for func in distortions:
3023
- img = func(img, img_gray)
3024
- sample['image'] = img
3025
- return sample
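The _blend helper above computes, in place, alpha * img + (1 - alpha) * reference, which assumes a float image; a standalone sketch of that arithmetic with assumed values:

```python
import numpy as np

# Standalone sketch of the blend used by CenterRandColor (not the paddlex operator):
# alpha > 1 amplifies the distance from the reference (gray image or gray mean),
# alpha < 1 shrinks it.
alpha = 1.2
img = np.array([[[100., 150., 200.]]], dtype=np.float32)
reference = np.float32(128.0)   # e.g. the gray-image mean, as in apply_contrast

blended = alpha * img + (1.0 - alpha) * reference
print(blended)  # [[[ 94.4 154.4 214.4]]]
```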