PyPI - paddlex - Versions diffs - 2.0.0rc4__py3-none-any.whl → 3.0.0b2__py3-none-any.whl - Mend

paddlex 2.0.0rc4__py3-none-any.whl → 3.0.0b2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (1087)

paddlex/.version +1 -0
paddlex/__init__.py +51 -18
paddlex/__main__.py +40 -0
paddlex/configs/anomaly_detection/STFPM.yaml +41 -0
paddlex/configs/doc_text_orientation/PP-LCNet_x1_0_doc_ori.yaml +41 -0
paddlex/configs/face_detection/BlazeFace-FPN-SSH.yaml +40 -0
paddlex/configs/face_detection/BlazeFace.yaml +40 -0
paddlex/configs/face_detection/PP-YOLOE_plus-S_face.yaml +40 -0
paddlex/configs/face_detection/PicoDet_LCNet_x2_5_face.yaml +40 -0
paddlex/configs/face_recognition/MobileFaceNet.yaml +44 -0
paddlex/configs/face_recognition/ResNet50_face.yaml +44 -0
paddlex/configs/formula_recognition/LaTeX_OCR_rec.yaml +40 -0
paddlex/configs/general_recognition/PP-ShiTuV2_rec.yaml +42 -0
paddlex/configs/general_recognition/PP-ShiTuV2_rec_CLIP_vit_base.yaml +42 -0
paddlex/configs/general_recognition/PP-ShiTuV2_rec_CLIP_vit_large.yaml +41 -0
paddlex/configs/human_detection/PP-YOLOE-L_human.yaml +42 -0
paddlex/configs/human_detection/PP-YOLOE-S_human.yaml +42 -0
paddlex/configs/image_classification/CLIP_vit_base_patch16_224.yaml +41 -0
paddlex/configs/image_classification/CLIP_vit_large_patch14_224.yaml +41 -0
paddlex/configs/image_classification/ConvNeXt_base_224.yaml +41 -0
paddlex/configs/image_classification/ConvNeXt_base_384.yaml +41 -0
paddlex/configs/image_classification/ConvNeXt_large_224.yaml +41 -0
paddlex/configs/image_classification/ConvNeXt_large_384.yaml +41 -0
paddlex/configs/image_classification/ConvNeXt_small.yaml +41 -0
paddlex/configs/image_classification/ConvNeXt_tiny.yaml +41 -0
paddlex/configs/image_classification/FasterNet-L.yaml +40 -0
paddlex/configs/image_classification/FasterNet-M.yaml +40 -0
paddlex/configs/image_classification/FasterNet-S.yaml +40 -0
paddlex/configs/image_classification/FasterNet-T0.yaml +40 -0
paddlex/configs/image_classification/FasterNet-T1.yaml +40 -0
paddlex/configs/image_classification/FasterNet-T2.yaml +40 -0
paddlex/configs/image_classification/MobileNetV1_x0_25.yaml +41 -0
paddlex/configs/image_classification/MobileNetV1_x0_5.yaml +41 -0
paddlex/configs/image_classification/MobileNetV1_x0_75.yaml +41 -0
paddlex/configs/image_classification/MobileNetV1_x1_0.yaml +41 -0
paddlex/configs/image_classification/MobileNetV2_x0_25.yaml +41 -0
paddlex/configs/image_classification/MobileNetV2_x0_5.yaml +41 -0
paddlex/configs/image_classification/MobileNetV2_x1_0.yaml +41 -0
paddlex/configs/image_classification/MobileNetV2_x1_5.yaml +41 -0
paddlex/configs/image_classification/MobileNetV2_x2_0.yaml +41 -0
paddlex/configs/image_classification/MobileNetV3_large_x0_35.yaml +41 -0
paddlex/configs/image_classification/MobileNetV3_large_x0_5.yaml +41 -0
paddlex/configs/image_classification/MobileNetV3_large_x0_75.yaml +41 -0
paddlex/configs/image_classification/MobileNetV3_large_x1_0.yaml +41 -0
paddlex/configs/image_classification/MobileNetV3_large_x1_25.yaml +41 -0
paddlex/configs/image_classification/MobileNetV3_small_x0_35.yaml +41 -0
paddlex/configs/image_classification/MobileNetV3_small_x0_5.yaml +41 -0
paddlex/configs/image_classification/MobileNetV3_small_x0_75.yaml +41 -0
paddlex/configs/image_classification/MobileNetV3_small_x1_0.yaml +41 -0
paddlex/configs/image_classification/MobileNetV3_small_x1_25.yaml +41 -0
paddlex/configs/image_classification/MobileNetV4_conv_large.yaml +41 -0
paddlex/configs/image_classification/MobileNetV4_conv_medium.yaml +41 -0
paddlex/configs/image_classification/MobileNetV4_conv_small.yaml +41 -0
paddlex/configs/image_classification/MobileNetV4_hybrid_large.yaml +41 -0
paddlex/configs/image_classification/MobileNetV4_hybrid_medium.yaml +41 -0
paddlex/configs/image_classification/PP-HGNetV2-B0.yaml +41 -0
paddlex/configs/image_classification/PP-HGNetV2-B1.yaml +41 -0
paddlex/configs/image_classification/PP-HGNetV2-B2.yaml +41 -0
paddlex/configs/image_classification/PP-HGNetV2-B3.yaml +41 -0
paddlex/configs/image_classification/PP-HGNetV2-B4.yaml +41 -0
paddlex/configs/image_classification/PP-HGNetV2-B5.yaml +41 -0
paddlex/configs/image_classification/PP-HGNetV2-B6.yaml +41 -0
paddlex/configs/image_classification/PP-HGNet_base.yaml +41 -0
paddlex/configs/image_classification/PP-HGNet_small.yaml +41 -0
paddlex/configs/image_classification/PP-HGNet_tiny.yaml +41 -0
paddlex/configs/image_classification/PP-LCNetV2_base.yaml +41 -0
paddlex/configs/image_classification/PP-LCNetV2_large.yaml +41 -0
paddlex/configs/image_classification/PP-LCNetV2_small.yaml +41 -0
paddlex/configs/image_classification/PP-LCNet_x0_25.yaml +41 -0
paddlex/configs/image_classification/PP-LCNet_x0_35.yaml +41 -0
paddlex/configs/image_classification/PP-LCNet_x0_5.yaml +41 -0
paddlex/configs/image_classification/PP-LCNet_x0_75.yaml +41 -0
paddlex/configs/image_classification/PP-LCNet_x1_0.yaml +41 -0
paddlex/configs/image_classification/PP-LCNet_x1_5.yaml +41 -0
paddlex/configs/image_classification/PP-LCNet_x2_0.yaml +41 -0
paddlex/configs/image_classification/PP-LCNet_x2_5.yaml +41 -0
paddlex/configs/image_classification/ResNet101.yaml +41 -0
paddlex/configs/image_classification/ResNet101_vd.yaml +41 -0
paddlex/configs/image_classification/ResNet152.yaml +41 -0
paddlex/configs/image_classification/ResNet152_vd.yaml +41 -0
paddlex/configs/image_classification/ResNet18.yaml +41 -0
paddlex/configs/image_classification/ResNet18_vd.yaml +41 -0
paddlex/configs/image_classification/ResNet200_vd.yaml +41 -0
paddlex/configs/image_classification/ResNet34.yaml +41 -0
paddlex/configs/image_classification/ResNet34_vd.yaml +41 -0
paddlex/configs/image_classification/ResNet50.yaml +41 -0
paddlex/configs/image_classification/ResNet50_vd.yaml +41 -0
paddlex/configs/image_classification/StarNet-S1.yaml +41 -0
paddlex/configs/image_classification/StarNet-S2.yaml +41 -0
paddlex/configs/image_classification/StarNet-S3.yaml +41 -0
paddlex/configs/image_classification/StarNet-S4.yaml +41 -0
paddlex/configs/image_classification/SwinTransformer_base_patch4_window12_384.yaml +41 -0
paddlex/configs/image_classification/SwinTransformer_base_patch4_window7_224.yaml +41 -0
paddlex/configs/image_classification/SwinTransformer_large_patch4_window12_384.yaml +41 -0
paddlex/configs/image_classification/SwinTransformer_large_patch4_window7_224.yaml +41 -0
paddlex/configs/image_classification/SwinTransformer_small_patch4_window7_224.yaml +41 -0
paddlex/configs/image_classification/SwinTransformer_tiny_patch4_window7_224.yaml +41 -0
paddlex/configs/image_unwarping/UVDoc.yaml +12 -0
paddlex/configs/instance_segmentation/Cascade-MaskRCNN-ResNet50-FPN.yaml +40 -0
paddlex/configs/instance_segmentation/Cascade-MaskRCNN-ResNet50-vd-SSLDv2-FPN.yaml +40 -0
paddlex/configs/instance_segmentation/Mask-RT-DETR-H.yaml +40 -0
paddlex/configs/instance_segmentation/Mask-RT-DETR-L.yaml +40 -0
paddlex/configs/instance_segmentation/Mask-RT-DETR-M.yaml +40 -0
paddlex/configs/instance_segmentation/Mask-RT-DETR-S.yaml +40 -0
paddlex/configs/instance_segmentation/Mask-RT-DETR-X.yaml +40 -0
paddlex/configs/instance_segmentation/MaskRCNN-ResNeXt101-vd-FPN.yaml +39 -0
paddlex/configs/instance_segmentation/MaskRCNN-ResNet101-FPN.yaml +40 -0
paddlex/configs/instance_segmentation/MaskRCNN-ResNet101-vd-FPN.yaml +40 -0
paddlex/configs/instance_segmentation/MaskRCNN-ResNet50-FPN.yaml +40 -0
paddlex/configs/instance_segmentation/MaskRCNN-ResNet50-vd-FPN.yaml +40 -0
paddlex/configs/instance_segmentation/MaskRCNN-ResNet50.yaml +40 -0
paddlex/configs/instance_segmentation/PP-YOLOE_seg-S.yaml +40 -0
paddlex/configs/instance_segmentation/SOLOv2.yaml +40 -0
paddlex/configs/mainbody_detection/PP-ShiTuV2_det.yaml +41 -0
paddlex/configs/multilabel_classification/CLIP_vit_base_patch16_448_ML.yaml +41 -0
paddlex/configs/multilabel_classification/PP-HGNetV2-B0_ML.yaml +41 -0
paddlex/configs/multilabel_classification/PP-HGNetV2-B4_ML.yaml +41 -0
paddlex/configs/multilabel_classification/PP-HGNetV2-B6_ML.yaml +41 -0
paddlex/configs/multilabel_classification/PP-LCNet_x1_0_ML.yaml +41 -0
paddlex/configs/multilabel_classification/ResNet50_ML.yaml +41 -0
paddlex/configs/object_detection/Cascade-FasterRCNN-ResNet50-FPN.yaml +41 -0
paddlex/configs/object_detection/Cascade-FasterRCNN-ResNet50-vd-SSLDv2-FPN.yaml +42 -0
paddlex/configs/object_detection/CenterNet-DLA-34.yaml +41 -0
paddlex/configs/object_detection/CenterNet-ResNet50.yaml +41 -0
paddlex/configs/object_detection/DETR-R50.yaml +42 -0
paddlex/configs/object_detection/FCOS-ResNet50.yaml +41 -0
paddlex/configs/object_detection/FasterRCNN-ResNeXt101-vd-FPN.yaml +42 -0
paddlex/configs/object_detection/FasterRCNN-ResNet101-FPN.yaml +42 -0
paddlex/configs/object_detection/FasterRCNN-ResNet101.yaml +42 -0
paddlex/configs/object_detection/FasterRCNN-ResNet34-FPN.yaml +42 -0
paddlex/configs/object_detection/FasterRCNN-ResNet50-FPN.yaml +42 -0
paddlex/configs/object_detection/FasterRCNN-ResNet50-vd-FPN.yaml +42 -0
paddlex/configs/object_detection/FasterRCNN-ResNet50-vd-SSLDv2-FPN.yaml +42 -0
paddlex/configs/object_detection/FasterRCNN-ResNet50.yaml +42 -0
paddlex/configs/object_detection/FasterRCNN-Swin-Tiny-FPN.yaml +42 -0
paddlex/configs/object_detection/PP-YOLOE_plus-L.yaml +40 -0
paddlex/configs/object_detection/PP-YOLOE_plus-M.yaml +40 -0
paddlex/configs/object_detection/PP-YOLOE_plus-S.yaml +40 -0
paddlex/configs/object_detection/PP-YOLOE_plus-X.yaml +40 -0
paddlex/configs/object_detection/PicoDet-L.yaml +40 -0
paddlex/configs/object_detection/PicoDet-M.yaml +42 -0
paddlex/configs/object_detection/PicoDet-S.yaml +40 -0
paddlex/configs/object_detection/PicoDet-XS.yaml +42 -0
paddlex/configs/object_detection/RT-DETR-H.yaml +40 -0
paddlex/configs/object_detection/RT-DETR-L.yaml +40 -0
paddlex/configs/object_detection/RT-DETR-R18.yaml +40 -0
paddlex/configs/object_detection/RT-DETR-R50.yaml +40 -0
paddlex/configs/object_detection/RT-DETR-X.yaml +40 -0
paddlex/configs/object_detection/YOLOX-L.yaml +40 -0
paddlex/configs/object_detection/YOLOX-M.yaml +40 -0
paddlex/configs/object_detection/YOLOX-N.yaml +40 -0
paddlex/configs/object_detection/YOLOX-S.yaml +40 -0
paddlex/configs/object_detection/YOLOX-T.yaml +40 -0
paddlex/configs/object_detection/YOLOX-X.yaml +40 -0
paddlex/configs/object_detection/YOLOv3-DarkNet53.yaml +40 -0
paddlex/configs/object_detection/YOLOv3-MobileNetV3.yaml +40 -0
paddlex/configs/object_detection/YOLOv3-ResNet50_vd_DCN.yaml +40 -0
paddlex/configs/pedestrian_attribute/PP-LCNet_x1_0_pedestrian_attribute.yaml +41 -0
paddlex/configs/semantic_segmentation/Deeplabv3-R101.yaml +40 -0
paddlex/configs/semantic_segmentation/Deeplabv3-R50.yaml +40 -0
paddlex/configs/semantic_segmentation/Deeplabv3_Plus-R101.yaml +40 -0
paddlex/configs/semantic_segmentation/Deeplabv3_Plus-R50.yaml +40 -0
paddlex/configs/semantic_segmentation/OCRNet_HRNet-W18.yaml +40 -0
paddlex/configs/semantic_segmentation/OCRNet_HRNet-W48.yaml +40 -0
paddlex/configs/semantic_segmentation/PP-LiteSeg-B.yaml +41 -0
paddlex/configs/semantic_segmentation/PP-LiteSeg-T.yaml +40 -0
paddlex/configs/semantic_segmentation/SeaFormer_base.yaml +40 -0
paddlex/configs/semantic_segmentation/SeaFormer_large.yaml +40 -0
paddlex/configs/semantic_segmentation/SeaFormer_small.yaml +40 -0
paddlex/configs/semantic_segmentation/SeaFormer_tiny.yaml +40 -0
paddlex/configs/semantic_segmentation/SegFormer-B0.yaml +40 -0
paddlex/configs/semantic_segmentation/SegFormer-B1.yaml +40 -0
paddlex/configs/semantic_segmentation/SegFormer-B2.yaml +40 -0
paddlex/configs/semantic_segmentation/SegFormer-B3.yaml +40 -0
paddlex/configs/semantic_segmentation/SegFormer-B4.yaml +40 -0
paddlex/configs/semantic_segmentation/SegFormer-B5.yaml +40 -0
paddlex/configs/small_object_detection/PP-YOLOE_plus_SOD-L.yaml +42 -0
paddlex/configs/small_object_detection/PP-YOLOE_plus_SOD-S.yaml +42 -0
paddlex/configs/small_object_detection/PP-YOLOE_plus_SOD-largesize-L.yaml +42 -0
paddlex/configs/structure_analysis/PicoDet-L_layout_17cls.yaml +40 -0
paddlex/configs/structure_analysis/PicoDet-L_layout_3cls.yaml +40 -0
paddlex/configs/structure_analysis/PicoDet-S_layout_17cls.yaml +40 -0
paddlex/configs/structure_analysis/PicoDet-S_layout_3cls.yaml +40 -0
paddlex/configs/structure_analysis/PicoDet_layout_1x.yaml +40 -0
paddlex/configs/structure_analysis/PicoDet_layout_1x_table.yaml +40 -0
paddlex/configs/structure_analysis/RT-DETR-H_layout_17cls.yaml +40 -0
paddlex/configs/structure_analysis/RT-DETR-H_layout_3cls.yaml +40 -0
paddlex/configs/table_recognition/SLANet.yaml +39 -0
paddlex/configs/table_recognition/SLANet_plus.yaml +39 -0
paddlex/configs/text_detection/PP-OCRv4_mobile_det.yaml +40 -0
paddlex/configs/text_detection/PP-OCRv4_server_det.yaml +40 -0
paddlex/configs/text_detection_seal/PP-OCRv4_mobile_seal_det.yaml +40 -0
paddlex/configs/text_detection_seal/PP-OCRv4_server_seal_det.yaml +40 -0
paddlex/configs/text_recognition/PP-OCRv4_mobile_rec.yaml +39 -0
paddlex/configs/text_recognition/PP-OCRv4_server_rec.yaml +39 -0
paddlex/configs/text_recognition/ch_RepSVTR_rec.yaml +39 -0
paddlex/configs/text_recognition/ch_SVTRv2_rec.yaml +39 -0
paddlex/configs/ts_anomaly_detection/AutoEncoder_ad.yaml +37 -0
paddlex/configs/ts_anomaly_detection/DLinear_ad.yaml +37 -0
paddlex/configs/ts_anomaly_detection/Nonstationary_ad.yaml +37 -0
paddlex/configs/ts_anomaly_detection/PatchTST_ad.yaml +37 -0
paddlex/configs/ts_anomaly_detection/TimesNet_ad.yaml +37 -0
paddlex/configs/ts_classification/TimesNet_cls.yaml +37 -0
paddlex/configs/ts_forecast/DLinear.yaml +38 -0
paddlex/configs/ts_forecast/NLinear.yaml +38 -0
paddlex/configs/ts_forecast/Nonstationary.yaml +38 -0
paddlex/configs/ts_forecast/PatchTST.yaml +38 -0
paddlex/configs/ts_forecast/RLinear.yaml +38 -0
paddlex/configs/ts_forecast/TiDE.yaml +38 -0
paddlex/configs/ts_forecast/TimesNet.yaml +38 -0
paddlex/configs/vehicle_attribute/PP-LCNet_x1_0_vehicle_attribute.yaml +41 -0
paddlex/configs/vehicle_detection/PP-YOLOE-L_vehicle.yaml +41 -0
paddlex/configs/vehicle_detection/PP-YOLOE-S_vehicle.yaml +42 -0
paddlex/engine.py +54 -0
paddlex/inference/__init__.py +17 -0
paddlex/inference/components/__init__.py +18 -0
paddlex/inference/components/base.py +292 -0
paddlex/inference/components/llm/__init__.py +25 -0
paddlex/inference/components/llm/base.py +65 -0
paddlex/inference/components/llm/erniebot.py +212 -0
paddlex/inference/components/paddle_predictor/__init__.py +20 -0
paddlex/inference/components/paddle_predictor/predictor.py +332 -0
paddlex/inference/components/retrieval/__init__.py +15 -0
paddlex/inference/components/retrieval/faiss.py +359 -0
paddlex/inference/components/task_related/__init__.py +33 -0
paddlex/inference/components/task_related/clas.py +124 -0
paddlex/inference/components/task_related/det.py +284 -0
paddlex/inference/components/task_related/instance_seg.py +89 -0
paddlex/inference/components/task_related/seal_det_warp.py +940 -0
paddlex/inference/components/task_related/seg.py +40 -0
paddlex/inference/components/task_related/table_rec.py +191 -0
paddlex/inference/components/task_related/text_det.py +895 -0
paddlex/inference/components/task_related/text_rec.py +353 -0
paddlex/inference/components/task_related/warp.py +43 -0
paddlex/inference/components/transforms/__init__.py +16 -0
paddlex/inference/components/transforms/image/__init__.py +15 -0
paddlex/inference/components/transforms/image/common.py +598 -0
paddlex/inference/components/transforms/image/funcs.py +58 -0
paddlex/inference/components/transforms/read_data.py +67 -0
paddlex/inference/components/transforms/ts/__init__.py +15 -0
paddlex/inference/components/transforms/ts/common.py +393 -0
paddlex/inference/components/transforms/ts/funcs.py +424 -0
paddlex/inference/models/__init__.py +106 -0
paddlex/inference/models/anomaly_detection.py +87 -0
paddlex/inference/models/base/__init__.py +16 -0
paddlex/inference/models/base/base_predictor.py +76 -0
paddlex/inference/models/base/basic_predictor.py +122 -0
paddlex/inference/models/face_recognition.py +21 -0
paddlex/inference/models/formula_recognition.py +55 -0
paddlex/inference/models/general_recognition.py +99 -0
paddlex/inference/models/image_classification.py +101 -0
paddlex/inference/models/image_unwarping.py +43 -0
paddlex/inference/models/instance_segmentation.py +66 -0
paddlex/inference/models/multilabel_classification.py +33 -0
paddlex/inference/models/object_detection.py +129 -0
paddlex/inference/models/semantic_segmentation.py +86 -0
paddlex/inference/models/table_recognition.py +106 -0
paddlex/inference/models/text_detection.py +105 -0
paddlex/inference/models/text_recognition.py +78 -0
paddlex/inference/models/ts_ad.py +68 -0
paddlex/inference/models/ts_cls.py +57 -0
paddlex/inference/models/ts_fc.py +73 -0
paddlex/inference/pipelines/__init__.py +127 -0
paddlex/inference/pipelines/attribute_recognition.py +92 -0
paddlex/inference/pipelines/base.py +86 -0
paddlex/inference/pipelines/face_recognition.py +49 -0
paddlex/inference/pipelines/formula_recognition.py +102 -0
paddlex/inference/pipelines/layout_parsing/__init__.py +15 -0
paddlex/inference/pipelines/layout_parsing/layout_parsing.py +362 -0
paddlex/inference/pipelines/ocr.py +80 -0
paddlex/inference/pipelines/pp_shitu_v2.py +152 -0
paddlex/inference/pipelines/ppchatocrv3/__init__.py +15 -0
paddlex/inference/pipelines/ppchatocrv3/ch_prompt.yaml +14 -0
paddlex/inference/pipelines/ppchatocrv3/ppchatocrv3.py +717 -0
paddlex/inference/pipelines/ppchatocrv3/utils.py +168 -0
paddlex/inference/pipelines/seal_recognition.py +152 -0
paddlex/inference/pipelines/serving/__init__.py +17 -0
paddlex/inference/pipelines/serving/_pipeline_apps/__init__.py +205 -0
paddlex/inference/pipelines/serving/_pipeline_apps/anomaly_detection.py +80 -0
paddlex/inference/pipelines/serving/_pipeline_apps/face_recognition.py +317 -0
paddlex/inference/pipelines/serving/_pipeline_apps/formula_recognition.py +119 -0
paddlex/inference/pipelines/serving/_pipeline_apps/image_classification.py +101 -0
paddlex/inference/pipelines/serving/_pipeline_apps/instance_segmentation.py +112 -0
paddlex/inference/pipelines/serving/_pipeline_apps/layout_parsing.py +205 -0
paddlex/inference/pipelines/serving/_pipeline_apps/multi_label_image_classification.py +90 -0
paddlex/inference/pipelines/serving/_pipeline_apps/object_detection.py +90 -0
paddlex/inference/pipelines/serving/_pipeline_apps/ocr.py +98 -0
paddlex/inference/pipelines/serving/_pipeline_apps/pedestrian_attribute_recognition.py +102 -0
paddlex/inference/pipelines/serving/_pipeline_apps/pp_shitu_v2.py +319 -0
paddlex/inference/pipelines/serving/_pipeline_apps/ppchatocrv3.py +445 -0
paddlex/inference/pipelines/serving/_pipeline_apps/seal_recognition.py +110 -0
paddlex/inference/pipelines/serving/_pipeline_apps/semantic_segmentation.py +82 -0
paddlex/inference/pipelines/serving/_pipeline_apps/small_object_detection.py +92 -0
paddlex/inference/pipelines/serving/_pipeline_apps/table_recognition.py +110 -0
paddlex/inference/pipelines/serving/_pipeline_apps/ts_ad.py +68 -0
paddlex/inference/pipelines/serving/_pipeline_apps/ts_cls.py +68 -0
paddlex/inference/pipelines/serving/_pipeline_apps/ts_fc.py +68 -0
paddlex/inference/pipelines/serving/_pipeline_apps/vehicle_attribute_recognition.py +102 -0
paddlex/inference/pipelines/serving/app.py +164 -0
paddlex/inference/pipelines/serving/models.py +30 -0
paddlex/inference/pipelines/serving/server.py +25 -0
paddlex/inference/pipelines/serving/storage.py +161 -0
paddlex/inference/pipelines/serving/utils.py +190 -0
paddlex/inference/pipelines/single_model_pipeline.py +76 -0
paddlex/inference/pipelines/table_recognition/__init__.py +15 -0
paddlex/inference/pipelines/table_recognition/table_recognition.py +193 -0
paddlex/inference/pipelines/table_recognition/utils.py +457 -0
paddlex/inference/results/__init__.py +31 -0
paddlex/inference/results/attribute_rec.py +89 -0
paddlex/inference/results/base.py +43 -0
paddlex/inference/results/chat_ocr.py +158 -0
paddlex/inference/results/clas.py +133 -0
paddlex/inference/results/det.py +86 -0
paddlex/inference/results/face_rec.py +34 -0
paddlex/inference/results/formula_rec.py +363 -0
paddlex/inference/results/instance_seg.py +152 -0
paddlex/inference/results/ocr.py +157 -0
paddlex/inference/results/seal_rec.py +50 -0
paddlex/inference/results/seg.py +72 -0
paddlex/inference/results/shitu.py +35 -0
paddlex/inference/results/table_rec.py +109 -0
paddlex/inference/results/text_det.py +33 -0
paddlex/inference/results/text_rec.py +66 -0
paddlex/inference/results/ts.py +37 -0
paddlex/inference/results/utils/__init__.py +13 -0
paddlex/inference/results/utils/mixin.py +204 -0
paddlex/inference/results/warp.py +31 -0
paddlex/inference/utils/__init__.py +13 -0
paddlex/inference/utils/benchmark.py +214 -0
paddlex/inference/utils/color_map.py +123 -0
paddlex/inference/utils/get_pipeline_path.py +26 -0
paddlex/inference/utils/io/__init__.py +33 -0
paddlex/inference/utils/io/readers.py +353 -0
paddlex/inference/utils/io/style.py +374 -0
paddlex/inference/utils/io/tablepyxl.py +149 -0
paddlex/inference/utils/io/writers.py +376 -0
paddlex/inference/utils/new_ir_blacklist.py +22 -0
paddlex/inference/utils/official_models.py +286 -0
paddlex/inference/utils/pp_option.py +236 -0
paddlex/inference/utils/process_hook.py +54 -0
paddlex/model.py +106 -0
paddlex/modules/__init__.py +105 -0
paddlex/modules/anomaly_detection/__init__.py +18 -0
paddlex/modules/anomaly_detection/dataset_checker/__init__.py +95 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/analyse_dataset.py +79 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/check_dataset.py +87 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/convert_dataset.py +230 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/split_dataset.py +87 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/utils/visualizer.py +71 -0
paddlex/modules/anomaly_detection/evaluator.py +58 -0
paddlex/modules/anomaly_detection/exportor.py +22 -0
paddlex/modules/anomaly_detection/model_list.py +16 -0
paddlex/modules/anomaly_detection/trainer.py +71 -0
paddlex/modules/base/__init__.py +18 -0
paddlex/modules/base/build_model.py +34 -0
paddlex/modules/base/dataset_checker/__init__.py +16 -0
paddlex/modules/base/dataset_checker/dataset_checker.py +164 -0
paddlex/modules/base/dataset_checker/utils.py +110 -0
paddlex/modules/base/evaluator.py +154 -0
paddlex/modules/base/exportor.py +121 -0
paddlex/modules/base/trainer.py +111 -0
paddlex/modules/face_recognition/__init__.py +18 -0
paddlex/modules/face_recognition/dataset_checker/__init__.py +71 -0
paddlex/modules/face_recognition/dataset_checker/dataset_src/__init__.py +16 -0
paddlex/modules/face_recognition/dataset_checker/dataset_src/check_dataset.py +174 -0
paddlex/modules/face_recognition/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/face_recognition/dataset_checker/dataset_src/utils/visualizer.py +156 -0
paddlex/modules/face_recognition/evaluator.py +52 -0
paddlex/modules/face_recognition/exportor.py +22 -0
paddlex/modules/face_recognition/model_list.py +15 -0
paddlex/modules/face_recognition/trainer.py +97 -0
paddlex/modules/formula_recognition/__init__.py +13 -0
paddlex/modules/formula_recognition/model_list.py +17 -0
paddlex/modules/general_recognition/__init__.py +18 -0
paddlex/modules/general_recognition/dataset_checker/__init__.py +107 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/analyse_dataset.py +98 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/check_dataset.py +100 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/convert_dataset.py +99 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/split_dataset.py +82 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/utils/visualizer.py +150 -0
paddlex/modules/general_recognition/evaluator.py +31 -0
paddlex/modules/general_recognition/exportor.py +22 -0
paddlex/modules/general_recognition/model_list.py +19 -0
paddlex/modules/general_recognition/trainer.py +52 -0
paddlex/modules/image_classification/__init__.py +18 -0
paddlex/modules/image_classification/dataset_checker/__init__.py +104 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/analyse_dataset.py +93 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/check_dataset.py +131 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/convert_dataset.py +51 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/split_dataset.py +81 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/utils/visualizer.py +156 -0
paddlex/modules/image_classification/evaluator.py +43 -0
paddlex/modules/image_classification/exportor.py +22 -0
paddlex/modules/image_classification/model_list.py +97 -0
paddlex/modules/image_classification/trainer.py +82 -0
paddlex/modules/image_unwarping/__init__.py +13 -0
paddlex/modules/image_unwarping/model_list.py +17 -0
paddlex/modules/instance_segmentation/__init__.py +18 -0
paddlex/modules/instance_segmentation/dataset_checker/__init__.py +93 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/analyse_dataset.py +78 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/check_dataset.py +92 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/convert_dataset.py +241 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/split_dataset.py +119 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/utils/visualizer.py +221 -0
paddlex/modules/instance_segmentation/evaluator.py +32 -0
paddlex/modules/instance_segmentation/exportor.py +22 -0
paddlex/modules/instance_segmentation/model_list.py +33 -0
paddlex/modules/instance_segmentation/trainer.py +31 -0
paddlex/modules/multilabel_classification/__init__.py +18 -0
paddlex/modules/multilabel_classification/dataset_checker/__init__.py +106 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/analyse_dataset.py +95 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/check_dataset.py +131 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/convert_dataset.py +117 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/split_dataset.py +81 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/utils/visualizer.py +153 -0
paddlex/modules/multilabel_classification/evaluator.py +43 -0
paddlex/modules/multilabel_classification/exportor.py +22 -0
paddlex/modules/multilabel_classification/model_list.py +24 -0
paddlex/modules/multilabel_classification/trainer.py +85 -0
paddlex/modules/object_detection/__init__.py +18 -0
paddlex/modules/object_detection/dataset_checker/__init__.py +115 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/analyse_dataset.py +80 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/check_dataset.py +86 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/convert_dataset.py +433 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/split_dataset.py +119 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/utils/visualizer.py +192 -0
paddlex/modules/object_detection/evaluator.py +41 -0
paddlex/modules/object_detection/exportor.py +22 -0
paddlex/modules/object_detection/model_list.py +74 -0
paddlex/modules/object_detection/trainer.py +85 -0
paddlex/modules/semantic_segmentation/__init__.py +18 -0
paddlex/modules/semantic_segmentation/dataset_checker/__init__.py +95 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/analyse_dataset.py +73 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/check_dataset.py +80 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/convert_dataset.py +162 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/split_dataset.py +87 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/utils/visualizer.py +71 -0
paddlex/modules/semantic_segmentation/evaluator.py +58 -0
paddlex/modules/semantic_segmentation/exportor.py +22 -0
paddlex/modules/semantic_segmentation/model_list.py +35 -0
paddlex/modules/semantic_segmentation/trainer.py +71 -0
paddlex/modules/table_recognition/__init__.py +18 -0
paddlex/modules/table_recognition/dataset_checker/__init__.py +83 -0
paddlex/modules/table_recognition/dataset_checker/dataset_src/__init__.py +18 -0
paddlex/modules/table_recognition/dataset_checker/dataset_src/analyse_dataset.py +58 -0
paddlex/modules/table_recognition/dataset_checker/dataset_src/check_dataset.py +87 -0
paddlex/modules/table_recognition/dataset_checker/dataset_src/split_dataset.py +79 -0
paddlex/modules/table_recognition/evaluator.py +43 -0
paddlex/modules/table_recognition/exportor.py +22 -0
paddlex/modules/table_recognition/model_list.py +19 -0
paddlex/modules/table_recognition/trainer.py +70 -0
paddlex/modules/text_detection/__init__.py +18 -0
paddlex/modules/text_detection/dataset_checker/__init__.py +94 -0
paddlex/modules/text_detection/dataset_checker/dataset_src/__init__.py +18 -0
paddlex/modules/text_detection/dataset_checker/dataset_src/analyse_dataset.py +217 -0
paddlex/modules/text_detection/dataset_checker/dataset_src/check_dataset.py +96 -0
paddlex/modules/text_detection/dataset_checker/dataset_src/split_dataset.py +140 -0
paddlex/modules/text_detection/evaluator.py +41 -0
paddlex/modules/text_detection/exportor.py +22 -0
paddlex/modules/text_detection/model_list.py +22 -0
paddlex/modules/text_detection/trainer.py +68 -0
paddlex/modules/text_recognition/__init__.py +18 -0
paddlex/modules/text_recognition/dataset_checker/__init__.py +114 -0
paddlex/modules/text_recognition/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/text_recognition/dataset_checker/dataset_src/analyse_dataset.py +161 -0
paddlex/modules/text_recognition/dataset_checker/dataset_src/check_dataset.py +97 -0
paddlex/modules/text_recognition/dataset_checker/dataset_src/convert_dataset.py +94 -0
paddlex/modules/text_recognition/dataset_checker/dataset_src/split_dataset.py +81 -0
paddlex/modules/text_recognition/evaluator.py +63 -0
paddlex/modules/text_recognition/exportor.py +25 -0
paddlex/modules/text_recognition/model_list.py +20 -0
paddlex/modules/text_recognition/trainer.py +105 -0
paddlex/modules/ts_anomaly_detection/__init__.py +19 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/__init__.py +97 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/analyse_dataset.py +27 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/check_dataset.py +64 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/convert_dataset.py +78 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/split_dataset.py +63 -0
paddlex/modules/ts_anomaly_detection/evaluator.py +67 -0
paddlex/modules/ts_anomaly_detection/exportor.py +45 -0
paddlex/modules/ts_anomaly_detection/model_list.py +22 -0
paddlex/modules/ts_anomaly_detection/trainer.py +97 -0
paddlex/modules/ts_classification/__init__.py +19 -0
paddlex/modules/ts_classification/dataset_checker/__init__.py +97 -0
paddlex/modules/ts_classification/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/ts_classification/dataset_checker/dataset_src/analyse_dataset.py +74 -0
paddlex/modules/ts_classification/dataset_checker/dataset_src/check_dataset.py +64 -0
paddlex/modules/ts_classification/dataset_checker/dataset_src/convert_dataset.py +78 -0
paddlex/modules/ts_classification/dataset_checker/dataset_src/split_dataset.py +88 -0
paddlex/modules/ts_classification/evaluator.py +66 -0
paddlex/modules/ts_classification/exportor.py +45 -0
paddlex/modules/ts_classification/model_list.py +18 -0
paddlex/modules/ts_classification/trainer.py +92 -0
paddlex/modules/ts_forecast/__init__.py +19 -0
paddlex/modules/ts_forecast/dataset_checker/__init__.py +97 -0
paddlex/modules/ts_forecast/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/ts_forecast/dataset_checker/dataset_src/analyse_dataset.py +27 -0
paddlex/modules/ts_forecast/dataset_checker/dataset_src/check_dataset.py +64 -0
paddlex/modules/ts_forecast/dataset_checker/dataset_src/convert_dataset.py +77 -0
paddlex/modules/ts_forecast/dataset_checker/dataset_src/split_dataset.py +63 -0
paddlex/modules/ts_forecast/evaluator.py +66 -0
paddlex/modules/ts_forecast/exportor.py +45 -0
paddlex/modules/ts_forecast/model_list.py +24 -0
paddlex/modules/ts_forecast/trainer.py +92 -0
paddlex/paddlex_cli.py +197 -0
paddlex/pipelines/OCR.yaml +8 -0
paddlex/pipelines/PP-ChatOCRv3-doc.yaml +27 -0
paddlex/pipelines/PP-ShiTuV2.yaml +13 -0
paddlex/pipelines/anomaly_detection.yaml +7 -0
paddlex/pipelines/face_recognition.yaml +13 -0
paddlex/pipelines/formula_recognition.yaml +8 -0
paddlex/pipelines/image_classification.yaml +7 -0
paddlex/pipelines/instance_segmentation.yaml +7 -0
paddlex/pipelines/layout_parsing.yaml +14 -0
paddlex/pipelines/multi_label_image_classification.yaml +7 -0
paddlex/pipelines/object_detection.yaml +7 -0
paddlex/pipelines/pedestrian_attribute_recognition.yaml +7 -0
paddlex/pipelines/seal_recognition.yaml +10 -0
paddlex/pipelines/semantic_segmentation.yaml +7 -0
paddlex/pipelines/small_object_detection.yaml +7 -0
paddlex/pipelines/table_recognition.yaml +12 -0
paddlex/pipelines/ts_ad.yaml +7 -0
paddlex/pipelines/ts_cls.yaml +7 -0
paddlex/pipelines/ts_fc.yaml +7 -0
paddlex/pipelines/vehicle_attribute_recognition.yaml +7 -0
paddlex/repo_apis/PaddleClas_api/__init__.py +17 -0
paddlex/repo_apis/PaddleClas_api/cls/__init__.py +19 -0
paddlex/repo_apis/PaddleClas_api/cls/config.py +594 -0
paddlex/repo_apis/PaddleClas_api/cls/model.py +349 -0
paddlex/repo_apis/PaddleClas_api/cls/register.py +890 -0
paddlex/repo_apis/PaddleClas_api/cls/runner.py +219 -0
paddlex/repo_apis/PaddleClas_api/shitu_rec/__init__.py +18 -0
paddlex/repo_apis/PaddleClas_api/shitu_rec/config.py +141 -0
paddlex/repo_apis/PaddleClas_api/shitu_rec/model.py +23 -0
paddlex/repo_apis/PaddleClas_api/shitu_rec/register.py +68 -0
paddlex/repo_apis/PaddleClas_api/shitu_rec/runner.py +55 -0
paddlex/repo_apis/PaddleDetection_api/__init__.py +17 -0
paddlex/repo_apis/PaddleDetection_api/config_helper.py +280 -0
paddlex/repo_apis/PaddleDetection_api/instance_seg/__init__.py +18 -0
paddlex/repo_apis/PaddleDetection_api/instance_seg/config.py +454 -0
paddlex/repo_apis/PaddleDetection_api/instance_seg/model.py +397 -0
paddlex/repo_apis/PaddleDetection_api/instance_seg/register.py +263 -0
paddlex/repo_apis/PaddleDetection_api/instance_seg/runner.py +226 -0
paddlex/repo_apis/PaddleDetection_api/object_det/__init__.py +19 -0
paddlex/repo_apis/PaddleDetection_api/object_det/config.py +517 -0
paddlex/repo_apis/PaddleDetection_api/object_det/model.py +424 -0
paddlex/repo_apis/PaddleDetection_api/object_det/official_categories.py +139 -0
paddlex/repo_apis/PaddleDetection_api/object_det/register.py +927 -0
paddlex/repo_apis/PaddleDetection_api/object_det/runner.py +226 -0
paddlex/repo_apis/PaddleNLP_api/__init__.py +13 -0
paddlex/repo_apis/PaddleOCR_api/__init__.py +20 -0
paddlex/repo_apis/PaddleOCR_api/config_utils.py +53 -0
paddlex/repo_apis/PaddleOCR_api/table_rec/__init__.py +16 -0
paddlex/repo_apis/PaddleOCR_api/table_rec/config.py +64 -0
paddlex/repo_apis/PaddleOCR_api/table_rec/model.py +126 -0
paddlex/repo_apis/PaddleOCR_api/table_rec/register.py +53 -0
paddlex/repo_apis/PaddleOCR_api/table_rec/runner.py +51 -0
paddlex/repo_apis/PaddleOCR_api/text_det/__init__.py +16 -0
paddlex/repo_apis/PaddleOCR_api/text_det/config.py +62 -0
paddlex/repo_apis/PaddleOCR_api/text_det/model.py +72 -0
paddlex/repo_apis/PaddleOCR_api/text_det/register.py +72 -0
paddlex/repo_apis/PaddleOCR_api/text_det/runner.py +53 -0
paddlex/repo_apis/PaddleOCR_api/text_rec/__init__.py +16 -0
paddlex/repo_apis/PaddleOCR_api/text_rec/config.py +542 -0
paddlex/repo_apis/PaddleOCR_api/text_rec/model.py +396 -0
paddlex/repo_apis/PaddleOCR_api/text_rec/register.py +80 -0
paddlex/repo_apis/PaddleOCR_api/text_rec/runner.py +240 -0
paddlex/repo_apis/PaddleSeg_api/__init__.py +16 -0
paddlex/repo_apis/PaddleSeg_api/base_seg_config.py +134 -0
paddlex/repo_apis/PaddleSeg_api/seg/__init__.py +16 -0
paddlex/repo_apis/PaddleSeg_api/seg/config.py +177 -0
paddlex/repo_apis/PaddleSeg_api/seg/model.py +481 -0
paddlex/repo_apis/PaddleSeg_api/seg/register.py +253 -0
paddlex/repo_apis/PaddleSeg_api/seg/runner.py +262 -0
paddlex/repo_apis/PaddleTS_api/__init__.py +19 -0
paddlex/repo_apis/PaddleTS_api/ts_ad/__init__.py +16 -0
paddlex/repo_apis/PaddleTS_api/ts_ad/config.py +89 -0
paddlex/repo_apis/PaddleTS_api/ts_ad/register.py +146 -0
paddlex/repo_apis/PaddleTS_api/ts_ad/runner.py +158 -0
paddlex/repo_apis/PaddleTS_api/ts_base/__init__.py +13 -0
paddlex/repo_apis/PaddleTS_api/ts_base/config.py +222 -0
paddlex/repo_apis/PaddleTS_api/ts_base/model.py +272 -0
paddlex/repo_apis/PaddleTS_api/ts_base/runner.py +158 -0
paddlex/repo_apis/PaddleTS_api/ts_cls/__init__.py +16 -0
paddlex/repo_apis/PaddleTS_api/ts_cls/config.py +73 -0
paddlex/repo_apis/PaddleTS_api/ts_cls/register.py +59 -0
paddlex/repo_apis/PaddleTS_api/ts_cls/runner.py +158 -0
paddlex/repo_apis/PaddleTS_api/ts_fc/__init__.py +16 -0
paddlex/repo_apis/PaddleTS_api/ts_fc/config.py +137 -0
paddlex/repo_apis/PaddleTS_api/ts_fc/register.py +186 -0
paddlex/repo_apis/__init__.py +13 -0
paddlex/repo_apis/base/__init__.py +23 -0
paddlex/repo_apis/base/config.py +238 -0
paddlex/repo_apis/base/model.py +571 -0
paddlex/repo_apis/base/register.py +135 -0
paddlex/repo_apis/base/runner.py +390 -0
paddlex/repo_apis/base/utils/__init__.py +13 -0
paddlex/repo_apis/base/utils/arg.py +64 -0
paddlex/repo_apis/base/utils/subprocess.py +107 -0
paddlex/repo_manager/__init__.py +24 -0
paddlex/repo_manager/core.py +271 -0
paddlex/repo_manager/meta.py +143 -0
paddlex/repo_manager/repo.py +396 -0
paddlex/repo_manager/requirements.txt +18 -0
paddlex/repo_manager/utils.py +298 -0
paddlex/utils/__init__.py +1 -12
paddlex/utils/cache.py +148 -0
paddlex/utils/config.py +214 -0
paddlex/utils/device.py +103 -0
paddlex/utils/download.py +168 -182
paddlex/utils/errors/__init__.py +17 -0
paddlex/utils/errors/dataset_checker.py +78 -0
paddlex/utils/errors/others.py +152 -0
paddlex/utils/file_interface.py +212 -0
paddlex/utils/flags.py +61 -0
paddlex/utils/fonts/PingFang-SC-Regular.ttf +0 -0
paddlex/utils/fonts/__init__.py +24 -0
paddlex/utils/func_register.py +41 -0
paddlex/utils/interactive_get_pipeline.py +55 -0
paddlex/utils/lazy_loader.py +66 -0
paddlex/utils/logging.py +132 -33
paddlex/utils/misc.py +201 -0
paddlex/utils/result_saver.py +59 -0
paddlex/utils/subclass_register.py +101 -0
paddlex/version.py +54 -0
paddlex-3.0.0b2.dist-info/LICENSE +169 -0
paddlex-3.0.0b2.dist-info/METADATA +760 -0
paddlex-3.0.0b2.dist-info/RECORD +646 -0
paddlex-3.0.0b2.dist-info/WHEEL +5 -0
paddlex-3.0.0b2.dist-info/entry_points.txt +2 -0
paddlex-3.0.0b2.dist-info/top_level.txt +1 -0
PaddleClas/__init__.py +0 -16
PaddleClas/paddleclas.py +0 -375
PaddleClas/ppcls/__init__.py +0 -20
PaddleClas/ppcls/data/__init__.py +0 -15
PaddleClas/ppcls/data/imaug/__init__.py +0 -94
PaddleClas/ppcls/data/imaug/autoaugment.py +0 -264
PaddleClas/ppcls/data/imaug/batch_operators.py +0 -117
PaddleClas/ppcls/data/imaug/cutout.py +0 -41
PaddleClas/ppcls/data/imaug/fmix.py +0 -217
PaddleClas/ppcls/data/imaug/grid.py +0 -89
PaddleClas/ppcls/data/imaug/hide_and_seek.py +0 -44
PaddleClas/ppcls/data/imaug/operators.py +0 -244
PaddleClas/ppcls/data/imaug/randaugment.py +0 -106
PaddleClas/ppcls/data/imaug/random_erasing.py +0 -55
PaddleClas/ppcls/data/reader.py +0 -318
PaddleClas/ppcls/modeling/__init__.py +0 -20
PaddleClas/ppcls/modeling/architectures/__init__.py +0 -51
PaddleClas/ppcls/modeling/architectures/alexnet.py +0 -132
PaddleClas/ppcls/modeling/architectures/darknet.py +0 -161
PaddleClas/ppcls/modeling/architectures/densenet.py +0 -308
PaddleClas/ppcls/modeling/architectures/distillation_models.py +0 -65
PaddleClas/ppcls/modeling/architectures/distilled_vision_transformer.py +0 -196
PaddleClas/ppcls/modeling/architectures/dpn.py +0 -425
PaddleClas/ppcls/modeling/architectures/efficientnet.py +0 -901
PaddleClas/ppcls/modeling/architectures/ghostnet.py +0 -331
PaddleClas/ppcls/modeling/architectures/googlenet.py +0 -207
PaddleClas/ppcls/modeling/architectures/hrnet.py +0 -742
PaddleClas/ppcls/modeling/architectures/inception_v3.py +0 -481
PaddleClas/ppcls/modeling/architectures/inception_v4.py +0 -455
PaddleClas/ppcls/modeling/architectures/mixnet.py +0 -782
PaddleClas/ppcls/modeling/architectures/mobilenet_v1.py +0 -266
PaddleClas/ppcls/modeling/architectures/mobilenet_v2.py +0 -248
PaddleClas/ppcls/modeling/architectures/mobilenet_v3.py +0 -359
PaddleClas/ppcls/modeling/architectures/regnet.py +0 -383
PaddleClas/ppcls/modeling/architectures/repvgg.py +0 -339
PaddleClas/ppcls/modeling/architectures/res2net.py +0 -272
PaddleClas/ppcls/modeling/architectures/res2net_vd.py +0 -295
PaddleClas/ppcls/modeling/architectures/resnest.py +0 -705
PaddleClas/ppcls/modeling/architectures/resnet.py +0 -316
PaddleClas/ppcls/modeling/architectures/resnet_vc.py +0 -309
PaddleClas/ppcls/modeling/architectures/resnet_vd.py +0 -354
PaddleClas/ppcls/modeling/architectures/resnext.py +0 -253
PaddleClas/ppcls/modeling/architectures/resnext101_wsl.py +0 -447
PaddleClas/ppcls/modeling/architectures/resnext_vd.py +0 -266
PaddleClas/ppcls/modeling/architectures/rexnet.py +0 -240
PaddleClas/ppcls/modeling/architectures/se_resnet_vd.py +0 -378
PaddleClas/ppcls/modeling/architectures/se_resnext.py +0 -290
PaddleClas/ppcls/modeling/architectures/se_resnext_vd.py +0 -285
PaddleClas/ppcls/modeling/architectures/shufflenet_v2.py +0 -320
PaddleClas/ppcls/modeling/architectures/squeezenet.py +0 -154
PaddleClas/ppcls/modeling/architectures/vgg.py +0 -152
PaddleClas/ppcls/modeling/architectures/vision_transformer.py +0 -402
PaddleClas/ppcls/modeling/architectures/xception.py +0 -345
PaddleClas/ppcls/modeling/architectures/xception_deeplab.py +0 -386
PaddleClas/ppcls/modeling/loss.py +0 -154
PaddleClas/ppcls/modeling/utils.py +0 -53
PaddleClas/ppcls/optimizer/__init__.py +0 -19
PaddleClas/ppcls/optimizer/learning_rate.py +0 -159
PaddleClas/ppcls/optimizer/optimizer.py +0 -165
PaddleClas/ppcls/utils/__init__.py +0 -27
PaddleClas/ppcls/utils/check.py +0 -151
PaddleClas/ppcls/utils/config.py +0 -201
PaddleClas/ppcls/utils/logger.py +0 -120
PaddleClas/ppcls/utils/metrics.py +0 -107
PaddleClas/ppcls/utils/misc.py +0 -62
PaddleClas/ppcls/utils/model_zoo.py +0 -213
PaddleClas/ppcls/utils/save_load.py +0 -163
PaddleClas/setup.py +0 -55
PaddleClas/tools/__init__.py +0 -15
PaddleClas/tools/download.py +0 -50
PaddleClas/tools/ema.py +0 -58
PaddleClas/tools/eval.py +0 -112
PaddleClas/tools/export_model.py +0 -85
PaddleClas/tools/export_serving_model.py +0 -76
PaddleClas/tools/infer/__init__.py +0 -16
PaddleClas/tools/infer/infer.py +0 -94
PaddleClas/tools/infer/predict.py +0 -117
PaddleClas/tools/infer/utils.py +0 -233
PaddleClas/tools/program.py +0 -444
PaddleClas/tools/test_hubserving.py +0 -113
PaddleClas/tools/train.py +0 -141
paddlex/cls.py +0 -76
paddlex/command.py +0 -215
paddlex/cv/__init__.py +0 -17
paddlex/cv/datasets/__init__.py +0 -18
paddlex/cv/datasets/coco.py +0 -169
paddlex/cv/datasets/imagenet.py +0 -88
paddlex/cv/datasets/seg_dataset.py +0 -91
paddlex/cv/datasets/voc.py +0 -301
paddlex/cv/models/__init__.py +0 -18
paddlex/cv/models/base.py +0 -623
paddlex/cv/models/classifier.py +0 -814
paddlex/cv/models/detector.py +0 -1747
paddlex/cv/models/load_model.py +0 -126
paddlex/cv/models/segmenter.py +0 -673
paddlex/cv/models/slim/__init__.py +0 -13
paddlex/cv/models/slim/prune.py +0 -55
paddlex/cv/models/utils/__init__.py +0 -13
paddlex/cv/models/utils/det_metrics/__init__.py +0 -15
paddlex/cv/models/utils/det_metrics/coco_utils.py +0 -217
paddlex/cv/models/utils/det_metrics/metrics.py +0 -220
paddlex/cv/models/utils/ema.py +0 -48
paddlex/cv/models/utils/seg_metrics.py +0 -62
paddlex/cv/models/utils/visualize.py +0 -394
paddlex/cv/transforms/__init__.py +0 -46
paddlex/cv/transforms/batch_operators.py +0 -286
paddlex/cv/transforms/box_utils.py +0 -41
paddlex/cv/transforms/functions.py +0 -193
paddlex/cv/transforms/operators.py +0 -1402
paddlex/det.py +0 -43
paddlex/paddleseg/__init__.py +0 -17
paddlex/paddleseg/core/__init__.py +0 -20
paddlex/paddleseg/core/infer.py +0 -289
paddlex/paddleseg/core/predict.py +0 -145
paddlex/paddleseg/core/train.py +0 -258
paddlex/paddleseg/core/val.py +0 -172
paddlex/paddleseg/cvlibs/__init__.py +0 -17
paddlex/paddleseg/cvlibs/callbacks.py +0 -279
paddlex/paddleseg/cvlibs/config.py +0 -359
paddlex/paddleseg/cvlibs/manager.py +0 -142
paddlex/paddleseg/cvlibs/param_init.py +0 -91
paddlex/paddleseg/datasets/__init__.py +0 -21
paddlex/paddleseg/datasets/ade.py +0 -112
paddlex/paddleseg/datasets/cityscapes.py +0 -86
paddlex/paddleseg/datasets/cocostuff.py +0 -79
paddlex/paddleseg/datasets/dataset.py +0 -164
paddlex/paddleseg/datasets/mini_deep_globe_road_extraction.py +0 -95
paddlex/paddleseg/datasets/optic_disc_seg.py +0 -97
paddlex/paddleseg/datasets/pascal_context.py +0 -80
paddlex/paddleseg/datasets/voc.py +0 -113
paddlex/paddleseg/models/__init__.py +0 -39
paddlex/paddleseg/models/ann.py +0 -436
paddlex/paddleseg/models/attention_unet.py +0 -189
paddlex/paddleseg/models/backbones/__init__.py +0 -18
paddlex/paddleseg/models/backbones/hrnet.py +0 -815
paddlex/paddleseg/models/backbones/mobilenetv3.py +0 -365
paddlex/paddleseg/models/backbones/resnet_vd.py +0 -364
paddlex/paddleseg/models/backbones/xception_deeplab.py +0 -415
paddlex/paddleseg/models/bisenet.py +0 -311
paddlex/paddleseg/models/danet.py +0 -220
paddlex/paddleseg/models/decoupled_segnet.py +0 -233
paddlex/paddleseg/models/deeplab.py +0 -258
paddlex/paddleseg/models/dnlnet.py +0 -231
paddlex/paddleseg/models/emanet.py +0 -219
paddlex/paddleseg/models/fast_scnn.py +0 -318
paddlex/paddleseg/models/fcn.py +0 -135
paddlex/paddleseg/models/gcnet.py +0 -223
paddlex/paddleseg/models/gscnn.py +0 -357
paddlex/paddleseg/models/hardnet.py +0 -309
paddlex/paddleseg/models/isanet.py +0 -202
paddlex/paddleseg/models/layers/__init__.py +0 -19
paddlex/paddleseg/models/layers/activation.py +0 -73
paddlex/paddleseg/models/layers/attention.py +0 -146
paddlex/paddleseg/models/layers/layer_libs.py +0 -168
paddlex/paddleseg/models/layers/nonlocal2d.py +0 -155
paddlex/paddleseg/models/layers/pyramid_pool.py +0 -182
paddlex/paddleseg/models/losses/__init__.py +0 -27
paddlex/paddleseg/models/losses/binary_cross_entropy_loss.py +0 -174
paddlex/paddleseg/models/losses/bootstrapped_cross_entropy.py +0 -73
paddlex/paddleseg/models/losses/cross_entropy_loss.py +0 -94
paddlex/paddleseg/models/losses/decoupledsegnet_relax_boundary_loss.py +0 -129
paddlex/paddleseg/models/losses/dice_loss.py +0 -61
paddlex/paddleseg/models/losses/edge_attention_loss.py +0 -78
paddlex/paddleseg/models/losses/gscnn_dual_task_loss.py +0 -141
paddlex/paddleseg/models/losses/l1_loss.py +0 -76
paddlex/paddleseg/models/losses/lovasz_loss.py +0 -222
paddlex/paddleseg/models/losses/mean_square_error_loss.py +0 -65
paddlex/paddleseg/models/losses/mixed_loss.py +0 -58
paddlex/paddleseg/models/losses/ohem_cross_entropy_loss.py +0 -99
paddlex/paddleseg/models/losses/ohem_edge_attention_loss.py +0 -114
paddlex/paddleseg/models/ocrnet.py +0 -248
paddlex/paddleseg/models/pspnet.py +0 -147
paddlex/paddleseg/models/sfnet.py +0 -236
paddlex/paddleseg/models/shufflenet_slim.py +0 -268
paddlex/paddleseg/models/u2net.py +0 -574
paddlex/paddleseg/models/unet.py +0 -155
paddlex/paddleseg/models/unet_3plus.py +0 -316
paddlex/paddleseg/models/unet_plusplus.py +0 -237
paddlex/paddleseg/transforms/__init__.py +0 -16
paddlex/paddleseg/transforms/functional.py +0 -161
paddlex/paddleseg/transforms/transforms.py +0 -937
paddlex/paddleseg/utils/__init__.py +0 -22
paddlex/paddleseg/utils/config_check.py +0 -60
paddlex/paddleseg/utils/download.py +0 -163
paddlex/paddleseg/utils/env/__init__.py +0 -16
paddlex/paddleseg/utils/env/seg_env.py +0 -56
paddlex/paddleseg/utils/env/sys_env.py +0 -122
paddlex/paddleseg/utils/logger.py +0 -48
paddlex/paddleseg/utils/metrics.py +0 -146
paddlex/paddleseg/utils/progbar.py +0 -212
paddlex/paddleseg/utils/timer.py +0 -53
paddlex/paddleseg/utils/utils.py +0 -120
paddlex/paddleseg/utils/visualize.py +0 -90
paddlex/ppcls/__init__.py +0 -20
paddlex/ppcls/data/__init__.py +0 -15
paddlex/ppcls/data/imaug/__init__.py +0 -94
paddlex/ppcls/data/imaug/autoaugment.py +0 -264
paddlex/ppcls/data/imaug/batch_operators.py +0 -117
paddlex/ppcls/data/imaug/cutout.py +0 -41
paddlex/ppcls/data/imaug/fmix.py +0 -217
paddlex/ppcls/data/imaug/grid.py +0 -89
paddlex/ppcls/data/imaug/hide_and_seek.py +0 -44
paddlex/ppcls/data/imaug/operators.py +0 -256
paddlex/ppcls/data/imaug/randaugment.py +0 -106
paddlex/ppcls/data/imaug/random_erasing.py +0 -55
paddlex/ppcls/data/reader.py +0 -318
paddlex/ppcls/modeling/__init__.py +0 -20
paddlex/ppcls/modeling/architectures/__init__.py +0 -51
paddlex/ppcls/modeling/architectures/alexnet.py +0 -132
paddlex/ppcls/modeling/architectures/darknet.py +0 -161
paddlex/ppcls/modeling/architectures/densenet.py +0 -308
paddlex/ppcls/modeling/architectures/distillation_models.py +0 -65
paddlex/ppcls/modeling/architectures/distilled_vision_transformer.py +0 -196
paddlex/ppcls/modeling/architectures/dpn.py +0 -425
paddlex/ppcls/modeling/architectures/efficientnet.py +0 -901
paddlex/ppcls/modeling/architectures/ghostnet.py +0 -331
paddlex/ppcls/modeling/architectures/googlenet.py +0 -207
paddlex/ppcls/modeling/architectures/hrnet.py +0 -742
paddlex/ppcls/modeling/architectures/inception_v3.py +0 -541
paddlex/ppcls/modeling/architectures/inception_v4.py +0 -455
paddlex/ppcls/modeling/architectures/mixnet.py +0 -782
paddlex/ppcls/modeling/architectures/mobilenet_v1.py +0 -266
paddlex/ppcls/modeling/architectures/mobilenet_v2.py +0 -248
paddlex/ppcls/modeling/architectures/mobilenet_v3.py +0 -359
paddlex/ppcls/modeling/architectures/regnet.py +0 -383
paddlex/ppcls/modeling/architectures/repvgg.py +0 -339
paddlex/ppcls/modeling/architectures/res2net.py +0 -272
paddlex/ppcls/modeling/architectures/res2net_vd.py +0 -295
paddlex/ppcls/modeling/architectures/resnest.py +0 -705
paddlex/ppcls/modeling/architectures/resnet.py +0 -317
paddlex/ppcls/modeling/architectures/resnet_vc.py +0 -309
paddlex/ppcls/modeling/architectures/resnet_vd.py +0 -354
paddlex/ppcls/modeling/architectures/resnext.py +0 -259
paddlex/ppcls/modeling/architectures/resnext101_wsl.py +0 -447
paddlex/ppcls/modeling/architectures/resnext_vd.py +0 -266
paddlex/ppcls/modeling/architectures/rexnet.py +0 -240
paddlex/ppcls/modeling/architectures/se_resnet_vd.py +0 -378
paddlex/ppcls/modeling/architectures/se_resnext.py +0 -290
paddlex/ppcls/modeling/architectures/se_resnext_vd.py +0 -285
paddlex/ppcls/modeling/architectures/shufflenet_v2.py +0 -320
paddlex/ppcls/modeling/architectures/squeezenet.py +0 -154
paddlex/ppcls/modeling/architectures/vgg.py +0 -152
paddlex/ppcls/modeling/architectures/vision_transformer.py +0 -402
paddlex/ppcls/modeling/architectures/xception.py +0 -345
paddlex/ppcls/modeling/architectures/xception_deeplab.py +0 -386
paddlex/ppcls/modeling/loss.py +0 -158
paddlex/ppcls/modeling/utils.py +0 -53
paddlex/ppcls/optimizer/__init__.py +0 -19
paddlex/ppcls/optimizer/learning_rate.py +0 -159
paddlex/ppcls/optimizer/optimizer.py +0 -165
paddlex/ppcls/utils/__init__.py +0 -27
paddlex/ppcls/utils/check.py +0 -151
paddlex/ppcls/utils/config.py +0 -201
paddlex/ppcls/utils/logger.py +0 -120
paddlex/ppcls/utils/metrics.py +0 -112
paddlex/ppcls/utils/misc.py +0 -62
paddlex/ppcls/utils/model_zoo.py +0 -213
paddlex/ppcls/utils/save_load.py +0 -163
paddlex/ppdet/__init__.py +0 -16
paddlex/ppdet/core/__init__.py +0 -15
paddlex/ppdet/core/config/__init__.py +0 -13
paddlex/ppdet/core/config/schema.py +0 -248
paddlex/ppdet/core/config/yaml_helpers.py +0 -118
paddlex/ppdet/core/workspace.py +0 -279
paddlex/ppdet/data/__init__.py +0 -21
paddlex/ppdet/data/reader.py +0 -304
paddlex/ppdet/data/shm_utils.py +0 -67
paddlex/ppdet/data/source/__init__.py +0 -27
paddlex/ppdet/data/source/category.py +0 -823
paddlex/ppdet/data/source/coco.py +0 -243
paddlex/ppdet/data/source/dataset.py +0 -192
paddlex/ppdet/data/source/keypoint_coco.py +0 -656
paddlex/ppdet/data/source/mot.py +0 -360
paddlex/ppdet/data/source/voc.py +0 -204
paddlex/ppdet/data/source/widerface.py +0 -180
paddlex/ppdet/data/transform/__init__.py +0 -28
paddlex/ppdet/data/transform/autoaugment_utils.py +0 -1593
paddlex/ppdet/data/transform/batch_operators.py +0 -758
paddlex/ppdet/data/transform/gridmask_utils.py +0 -83
paddlex/ppdet/data/transform/keypoint_operators.py +0 -665
paddlex/ppdet/data/transform/mot_operators.py +0 -636
paddlex/ppdet/data/transform/op_helper.py +0 -468
paddlex/ppdet/data/transform/operators.py +0 -2103
paddlex/ppdet/engine/__init__.py +0 -29
paddlex/ppdet/engine/callbacks.py +0 -262
paddlex/ppdet/engine/env.py +0 -47
paddlex/ppdet/engine/export_utils.py +0 -118
paddlex/ppdet/engine/tracker.py +0 -425
paddlex/ppdet/engine/trainer.py +0 -535
paddlex/ppdet/metrics/__init__.py +0 -23
paddlex/ppdet/metrics/coco_utils.py +0 -184
paddlex/ppdet/metrics/json_results.py +0 -151
paddlex/ppdet/metrics/keypoint_metrics.py +0 -202
paddlex/ppdet/metrics/map_utils.py +0 -396
paddlex/ppdet/metrics/metrics.py +0 -300
paddlex/ppdet/metrics/mot_eval_utils.py +0 -192
paddlex/ppdet/metrics/mot_metrics.py +0 -184
paddlex/ppdet/metrics/widerface_utils.py +0 -393
paddlex/ppdet/model_zoo/__init__.py +0 -18
paddlex/ppdet/model_zoo/model_zoo.py +0 -86
paddlex/ppdet/model_zoo/tests/__init__.py +0 -13
paddlex/ppdet/model_zoo/tests/test_get_model.py +0 -48
paddlex/ppdet/model_zoo/tests/test_list_model.py +0 -68
paddlex/ppdet/modeling/__init__.py +0 -41
paddlex/ppdet/modeling/architectures/__init__.py +0 -40
paddlex/ppdet/modeling/architectures/cascade_rcnn.py +0 -144
paddlex/ppdet/modeling/architectures/centernet.py +0 -103
paddlex/ppdet/modeling/architectures/deepsort.py +0 -111
paddlex/ppdet/modeling/architectures/fairmot.py +0 -107
paddlex/ppdet/modeling/architectures/faster_rcnn.py +0 -106
paddlex/ppdet/modeling/architectures/fcos.py +0 -105
paddlex/ppdet/modeling/architectures/jde.py +0 -125
paddlex/ppdet/modeling/architectures/keypoint_hrhrnet.py +0 -286
paddlex/ppdet/modeling/architectures/keypoint_hrnet.py +0 -203
paddlex/ppdet/modeling/architectures/mask_rcnn.py +0 -135
paddlex/ppdet/modeling/architectures/meta_arch.py +0 -45
paddlex/ppdet/modeling/architectures/s2anet.py +0 -103
paddlex/ppdet/modeling/architectures/solov2.py +0 -110
paddlex/ppdet/modeling/architectures/ssd.py +0 -84
paddlex/ppdet/modeling/architectures/ttfnet.py +0 -98
paddlex/ppdet/modeling/architectures/yolo.py +0 -104
paddlex/ppdet/modeling/backbones/__init__.py +0 -37
paddlex/ppdet/modeling/backbones/blazenet.py +0 -322
paddlex/ppdet/modeling/backbones/darknet.py +0 -341
paddlex/ppdet/modeling/backbones/dla.py +0 -244
paddlex/ppdet/modeling/backbones/ghostnet.py +0 -476
paddlex/ppdet/modeling/backbones/hrnet.py +0 -724
paddlex/ppdet/modeling/backbones/mobilenet_v1.py +0 -410
paddlex/ppdet/modeling/backbones/mobilenet_v3.py +0 -497
paddlex/ppdet/modeling/backbones/name_adapter.py +0 -69
paddlex/ppdet/modeling/backbones/res2net.py +0 -358
paddlex/ppdet/modeling/backbones/resnet.py +0 -606
paddlex/ppdet/modeling/backbones/senet.py +0 -140
paddlex/ppdet/modeling/backbones/vgg.py +0 -216
paddlex/ppdet/modeling/bbox_utils.py +0 -464
paddlex/ppdet/modeling/heads/__init__.py +0 -41
paddlex/ppdet/modeling/heads/bbox_head.py +0 -379
paddlex/ppdet/modeling/heads/cascade_head.py +0 -285
paddlex/ppdet/modeling/heads/centernet_head.py +0 -194
paddlex/ppdet/modeling/heads/face_head.py +0 -113
paddlex/ppdet/modeling/heads/fcos_head.py +0 -270
paddlex/ppdet/modeling/heads/keypoint_hrhrnet_head.py +0 -108
paddlex/ppdet/modeling/heads/mask_head.py +0 -253
paddlex/ppdet/modeling/heads/roi_extractor.py +0 -111
paddlex/ppdet/modeling/heads/s2anet_head.py +0 -845
paddlex/ppdet/modeling/heads/solov2_head.py +0 -537
paddlex/ppdet/modeling/heads/ssd_head.py +0 -175
paddlex/ppdet/modeling/heads/ttf_head.py +0 -314
paddlex/ppdet/modeling/heads/yolo_head.py +0 -124
paddlex/ppdet/modeling/keypoint_utils.py +0 -302
paddlex/ppdet/modeling/layers.py +0 -1142
paddlex/ppdet/modeling/losses/__init__.py +0 -35
paddlex/ppdet/modeling/losses/ctfocal_loss.py +0 -67
paddlex/ppdet/modeling/losses/fairmot_loss.py +0 -41
paddlex/ppdet/modeling/losses/fcos_loss.py +0 -225
paddlex/ppdet/modeling/losses/iou_aware_loss.py +0 -48
paddlex/ppdet/modeling/losses/iou_loss.py +0 -210
paddlex/ppdet/modeling/losses/jde_loss.py +0 -182
paddlex/ppdet/modeling/losses/keypoint_loss.py +0 -228
paddlex/ppdet/modeling/losses/solov2_loss.py +0 -101
paddlex/ppdet/modeling/losses/ssd_loss.py +0 -163
paddlex/ppdet/modeling/losses/yolo_loss.py +0 -212
paddlex/ppdet/modeling/mot/__init__.py +0 -25
paddlex/ppdet/modeling/mot/matching/__init__.py +0 -19
paddlex/ppdet/modeling/mot/matching/deepsort_matching.py +0 -382
paddlex/ppdet/modeling/mot/matching/jde_matching.py +0 -145
paddlex/ppdet/modeling/mot/motion/__init__.py +0 -17
paddlex/ppdet/modeling/mot/motion/kalman_filter.py +0 -270
paddlex/ppdet/modeling/mot/tracker/__init__.py +0 -23
paddlex/ppdet/modeling/mot/tracker/base_jde_tracker.py +0 -267
paddlex/ppdet/modeling/mot/tracker/base_sde_tracker.py +0 -145
paddlex/ppdet/modeling/mot/tracker/deepsort_tracker.py +0 -165
paddlex/ppdet/modeling/mot/tracker/jde_tracker.py +0 -262
paddlex/ppdet/modeling/mot/utils.py +0 -181
paddlex/ppdet/modeling/mot/visualization.py +0 -130
paddlex/ppdet/modeling/necks/__init__.py +0 -25
paddlex/ppdet/modeling/necks/centernet_fpn.py +0 -185
paddlex/ppdet/modeling/necks/fpn.py +0 -233
paddlex/ppdet/modeling/necks/hrfpn.py +0 -131
paddlex/ppdet/modeling/necks/ttf_fpn.py +0 -243
paddlex/ppdet/modeling/necks/yolo_fpn.py +0 -1034
paddlex/ppdet/modeling/ops.py +0 -1599
paddlex/ppdet/modeling/post_process.py +0 -449
paddlex/ppdet/modeling/proposal_generator/__init__.py +0 -2
paddlex/ppdet/modeling/proposal_generator/anchor_generator.py +0 -135
paddlex/ppdet/modeling/proposal_generator/proposal_generator.py +0 -81
paddlex/ppdet/modeling/proposal_generator/rpn_head.py +0 -269
paddlex/ppdet/modeling/proposal_generator/target.py +0 -671
paddlex/ppdet/modeling/proposal_generator/target_layer.py +0 -476
paddlex/ppdet/modeling/reid/__init__.py +0 -23
paddlex/ppdet/modeling/reid/fairmot_embedding_head.py +0 -117
paddlex/ppdet/modeling/reid/jde_embedding_head.py +0 -189
paddlex/ppdet/modeling/reid/pyramidal_embedding.py +0 -151
paddlex/ppdet/modeling/reid/resnet.py +0 -320
paddlex/ppdet/modeling/shape_spec.py +0 -33
paddlex/ppdet/modeling/tests/__init__.py +0 -13
paddlex/ppdet/modeling/tests/test_architectures.py +0 -59
paddlex/ppdet/modeling/tests/test_base.py +0 -75
paddlex/ppdet/modeling/tests/test_ops.py +0 -839
paddlex/ppdet/modeling/tests/test_yolov3_loss.py +0 -420
paddlex/ppdet/optimizer.py +0 -285
paddlex/ppdet/slim/__init__.py +0 -62
paddlex/ppdet/slim/distill.py +0 -111
paddlex/ppdet/slim/prune.py +0 -85
paddlex/ppdet/slim/quant.py +0 -52
paddlex/ppdet/utils/__init__.py +0 -13
paddlex/ppdet/utils/check.py +0 -93
paddlex/ppdet/utils/checkpoint.py +0 -216
paddlex/ppdet/utils/cli.py +0 -151
paddlex/ppdet/utils/colormap.py +0 -56
paddlex/ppdet/utils/download.py +0 -477
paddlex/ppdet/utils/logger.py +0 -71
paddlex/ppdet/utils/stats.py +0 -95
paddlex/ppdet/utils/visualizer.py +0 -292
paddlex/ppdet/utils/voc_utils.py +0 -87
paddlex/seg.py +0 -38
paddlex/tools/__init__.py +0 -16
paddlex/tools/convert.py +0 -52
paddlex/tools/dataset_conversion/__init__.py +0 -24
paddlex/tools/dataset_conversion/x2coco.py +0 -379
paddlex/tools/dataset_conversion/x2imagenet.py +0 -82
paddlex/tools/dataset_conversion/x2seg.py +0 -343
paddlex/tools/dataset_conversion/x2voc.py +0 -230
paddlex/tools/dataset_split/__init__.py +0 -23
paddlex/tools/dataset_split/coco_split.py +0 -69
paddlex/tools/dataset_split/imagenet_split.py +0 -75
paddlex/tools/dataset_split/seg_split.py +0 -96
paddlex/tools/dataset_split/utils.py +0 -75
paddlex/tools/dataset_split/voc_split.py +0 -91
paddlex/tools/split.py +0 -41
paddlex/utils/checkpoint.py +0 -439
paddlex/utils/env.py +0 -71
paddlex/utils/shm.py +0 -67
paddlex/utils/stats.py +0 -68
paddlex/utils/utils.py +0 -140
paddlex-2.0.0rc4.dist-info/LICENSE +0 -201
paddlex-2.0.0rc4.dist-info/METADATA +0 -29
paddlex-2.0.0rc4.dist-info/RECORD +0 -445
paddlex-2.0.0rc4.dist-info/WHEEL +0 -5
paddlex-2.0.0rc4.dist-info/entry_points.txt +0 -3
paddlex-2.0.0rc4.dist-info/top_level.txt +0 -2

paddlex/ppdet/data/transform/operators.py DELETED Viewed

@@ -1,2103 +0,0 @@
-# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# function:
-#    operators to process sample,
-#    eg: decode/resize/crop image
-from __future__ import absolute_import
-from __future__ import print_function
-from __future__ import division
-try:
-    from collections.abc import Sequence
-except Exception:
-    from collections import Sequence
-from numbers import Number, Integral
-import uuid
-import random
-import math
-import numpy as np
-import os
-import copy
-import cv2
-from PIL import Image, ImageEnhance, ImageDraw
-from paddlex.ppdet.core.workspace import serializable
-from paddlex.ppdet.modeling.layers import AnchorGrid
-from paddlex.ppdet.modeling import bbox_utils
-from .op_helper import (
-    satisfy_sample_constraint, filter_and_process, generate_sample_bbox,
-    clip_bbox, data_anchor_sampling, satisfy_sample_constraint_coverage,
-    crop_image_sampling, generate_sample_bbox_square, bbox_area_sampling,
-    is_poly, gaussian_radius, draw_gaussian)
-from paddlex.ppdet.utils.logger import setup_logger
-logger = setup_logger(__name__)
-registered_ops = []
-def register_op(cls):
-    registered_ops.append(cls.__name__)
-    if not hasattr(BaseOperator, cls.__name__):
-        setattr(BaseOperator, cls.__name__, cls)
-    else:
-        raise KeyError("The {} class has been registered.".format(
-            cls.__name__))
-    return serializable(cls)
-class BboxError(ValueError):
-    pass
-class ImageError(ValueError):
-    pass
-class BaseOperator(object):
-    def __init__(self, name=None):
-        if name is None:
-            name = self.__class__.__name__
-        self._id = name + '_' + str(uuid.uuid4())[-6:]
-    def apply(self, sample, context=None):
-        """ Process a sample.
-        Args:
-            sample (dict): a dict of sample, eg: {'image':xx, 'label': xxx}
-            context (dict): info about this sample processing
-        Returns:
-            result (dict): a processed sample
-        """
-        return sample
-    def __call__(self, sample, context=None):
-        """ Process a sample.
-        Args:
-            sample (dict): a dict of sample, eg: {'image':xx, 'label': xxx}
-            context (dict): info about this sample processing
-        Returns:
-            result (dict): a processed sample
-        """
-        if isinstance(sample, Sequence):
-            for i in range(len(sample)):
-                sample[i] = self.apply(sample[i], context)
-        else:
-            sample = self.apply(sample, context)
-        return sample
-    def __str__(self):
-        return str(self._id)
-@register_op
-class Decode(BaseOperator):
-    def __init__(self):
-        """ Transform the image data to numpy format following the rgb format
-        """
-        super(Decode, self).__init__()
-    def apply(self, sample, context=None):
-        """ load image if 'im_file' field is not empty but 'image' is"""
-        if 'image' not in sample:
-            with open(sample['im_file'], 'rb') as f:
-                sample['image'] = f.read()
-            sample.pop('im_file')
-        im = sample['image']
-        data = np.frombuffer(im, dtype='uint8')
-        im = cv2.imdecode(data, 1)  # BGR mode, but need RGB mode
-        if 'keep_ori_im' in sample and sample['keep_ori_im']:
-            sample['ori_image'] = im
-        im = cv2.cvtColor(im, cv2.COLOR_BGR2RGB)
-        sample['image'] = im
-        if 'h' not in sample:
-            sample['h'] = im.shape[0]
-        elif sample['h'] != im.shape[0]:
-            logger.warn(
-                "The actual image height: {} is not equal to the "
-                "height: {} in annotation, and update sample['h'] by actual "
-                "image height.".format(im.shape[0], sample['h']))
-            sample['h'] = im.shape[0]
-        if 'w' not in sample:
-            sample['w'] = im.shape[1]
-        elif sample['w'] != im.shape[1]:
-            logger.warn(
-                "The actual image width: {} is not equal to the "
-                "width: {} in annotation, and update sample['w'] by actual "
-                "image width.".format(im.shape[1], sample['w']))
-            sample['w'] = im.shape[1]
-        sample['im_shape'] = np.array(im.shape[:2], dtype=np.float32)
-        sample['scale_factor'] = np.array([1., 1.], dtype=np.float32)
-        return sample
-@register_op
-class Permute(BaseOperator):
-    def __init__(self):
-        """
-        Change the channel to be (C, H, W)
-        """
-        super(Permute, self).__init__()
-    def apply(self, sample, context=None):
-        im = sample['image']
-        im = im.transpose((2, 0, 1))
-        sample['image'] = im
-        return sample
-@register_op
-class Lighting(BaseOperator):
-    """
-    Lighting the image by eigenvalues and eigenvectors
-    Args:
-        eigval (list): eigenvalues
-        eigvec (list): eigenvectors
-        alphastd (float): random weight of lighting, 0.1 by default
-    """
-    def __init__(self, eigval, eigvec, alphastd=0.1):
-        super(Lighting, self).__init__()
-        self.alphastd = alphastd
-        self.eigval = np.array(eigval).astype('float32')
-        self.eigvec = np.array(eigvec).astype('float32')
-    def apply(self, sample, context=None):
-        alpha = np.random.normal(scale=self.alphastd, size=(3, ))
-        sample['image'] += np.dot(self.eigvec, self.eigval * alpha)
-        return sample
-@register_op
-class RandomErasingImage(BaseOperator):
-    def __init__(self, prob=0.5, lower=0.02, higher=0.4, aspect_ratio=0.3):
-        """
-        Random Erasing Data Augmentation, see https://arxiv.org/abs/1708.04896
-        Args:
-            prob (float): probability to carry out random erasing
-            lower (float): lower limit of the erasing area ratio
-            heigher (float): upper limit of the erasing area ratio
-            aspect_ratio (float): aspect ratio of the erasing region
-        """
-        super(RandomErasingImage, self).__init__()
-        self.prob = prob
-        self.lower = lower
-        self.heigher = heigher
-        self.aspect_ratio = aspect_ratio
-    def apply(self, sample):
-        gt_bbox = sample['gt_bbox']
-        im = sample['image']
-        if not isinstance(im, np.ndarray):
-            raise TypeError("{}: image is not a numpy array.".format(self))
-        if len(im.shape) != 3:
-            raise ImageError("{}: image is not 3-dimensional.".format(self))
-        for idx in range(gt_bbox.shape[0]):
-            if self.prob <= np.random.rand():
-                continue
-            x1, y1, x2, y2 = gt_bbox[idx, :]
-            w_bbox = x2 - x1
-            h_bbox = y2 - y1
-            area = w_bbox * h_bbox
-            target_area = random.uniform(self.lower, self.higher) * area
-            aspect_ratio = random.uniform(self.aspect_ratio,
-                                          1 / self.aspect_ratio)
-            h = int(round(math.sqrt(target_area * aspect_ratio)))
-            w = int(round(math.sqrt(target_area / aspect_ratio)))
-            if w < w_bbox and h < h_bbox:
-                off_y1 = random.randint(0, int(h_bbox - h))
-                off_x1 = random.randint(0, int(w_bbox - w))
-                im[int(y1 + off_y1):int(y1 + off_y1 + h), int(x1 + off_x1):int(
-                    x1 + off_x1 + w), :] = 0
-        sample['image'] = im
-        return sample
-@register_op
-class NormalizeImage(BaseOperator):
-    def __init__(self,
-                 mean=[0.485, 0.456, 0.406],
-                 std=[1, 1, 1],
-                 is_scale=True):
-        """
-        Args:
-            mean (list): the pixel mean
-            std (list): the pixel variance
-        """
-        super(NormalizeImage, self).__init__()
-        self.mean = mean
-        self.std = std
-        self.is_scale = is_scale
-        if not (isinstance(self.mean, list) and isinstance(self.std, list) and
-                isinstance(self.is_scale, bool)):
-            raise TypeError("{}: input type is invalid.".format(self))
-        from functools import reduce
-        if reduce(lambda x, y: x * y, self.std) == 0:
-            raise ValueError('{}: std is invalid!'.format(self))
-    def apply(self, sample, context=None):
-        """Normalize the image.
-        Operators:
-            1.(optional) Scale the image to [0,1]
-            2. Each pixel minus mean and is divided by std
-        """
-        im = sample['image']
-        im = im.astype(np.float32, copy=False)
-        mean = np.array(self.mean)[np.newaxis, np.newaxis, :]
-        std = np.array(self.std)[np.newaxis, np.newaxis, :]
-        if self.is_scale:
-            im = im / 255.0
-        im -= mean
-        im /= std
-        sample['image'] = im
-        return sample
-@register_op
-class GridMask(BaseOperator):
-    def __init__(self,
-                 use_h=True,
-                 use_w=True,
-                 rotate=1,
-                 offset=False,
-                 ratio=0.5,
-                 mode=1,
-                 prob=0.7,
-                 upper_iter=360000):
-        """
-        GridMask Data Augmentation, see https://arxiv.org/abs/2001.04086
-        Args:
-            use_h (bool): whether to mask vertically
-            use_w (boo;): whether to mask horizontally
-            rotate (float): angle for the mask to rotate
-            offset (float): mask offset
-            ratio (float): mask ratio
-            mode (int): gridmask mode
-            prob (float): max probability to carry out gridmask
-            upper_iter (int): suggested to be equal to global max_iter
-        """
-        super(GridMask, self).__init__()
-        self.use_h = use_h
-        self.use_w = use_w
-        self.rotate = rotate
-        self.offset = offset
-        self.ratio = ratio
-        self.mode = mode
-        self.prob = prob
-        self.upper_iter = upper_iter
-        from .gridmask_utils import Gridmask
-        self.gridmask_op = Gridmask(
-            use_h,
-            use_w,
-            rotate=rotate,
-            offset=offset,
-            ratio=ratio,
-            mode=mode,
-            prob=prob,
-            upper_iter=upper_iter)
-    def apply(self, sample, context=None):
-        sample['image'] = self.gridmask_op(sample['image'],
-                                           sample['curr_iter'])
-        return sample
-@register_op
-class RandomDistort(BaseOperator):
-    """Random color distortion.
-    Args:
-        hue (list): hue settings. in [lower, upper, probability] format.
-        saturation (list): saturation settings. in [lower, upper, probability] format.
-        contrast (list): contrast settings. in [lower, upper, probability] format.
-        brightness (list): brightness settings. in [lower, upper, probability] format.
-        random_apply (bool): whether to apply in random (yolo) or fixed (SSD)
-            order.
-        count (int): the number of distortions to apply when random_apply
-            is True
-        random_channel (bool): whether to swap channels randomly; only
-            consulted on the fixed-order path (random_apply=False)
-    NOTE(review): in every apply_* method the image is returned unchanged
-    when the uniform draw is *below* the probability entry, so that entry
-    acts as the chance of skipping the distortion - confirm this is intended.
-    """
-    def __init__(self,
-                 hue=[-18, 18, 0.5],
-                 saturation=[0.5, 1.5, 0.5],
-                 contrast=[0.5, 1.5, 0.5],
-                 brightness=[0.5, 1.5, 0.5],
-                 random_apply=True,
-                 count=4,
-                 random_channel=False):
-        super(RandomDistort, self).__init__()
-        self.hue = hue
-        self.saturation = saturation
-        self.contrast = contrast
-        self.brightness = brightness
-        self.random_apply = random_apply
-        self.count = count
-        self.random_channel = random_channel
-    def apply_hue(self, img):
-        """Rotate the chroma of img by a random amount; returns float32 data unless skipped."""
-        low, high, prob = self.hue
-        # Skipped (image returned as is) when the draw is below prob.
-        if np.random.uniform(0., 1.) < prob:
-            return img
-        img = img.astype(np.float32)
-        # it works, but result differ from HSV version
-        delta = np.random.uniform(low, high)
-        # NOTE(review): delta is multiplied by pi directly; with the default
-        # range of [-18, 18] this looks like degrees used as multiples of pi
-        # - confirm the intended unit.
-        u = np.cos(delta * np.pi)
-        w = np.sin(delta * np.pi)
-        # bt rotates the two chroma rows; tyiq / ityiq presumably convert
-        # RGB to YIQ and back.
-        bt = np.array([[1.0, 0.0, 0.0], [0.0, u, -w], [0.0, w, u]])
-        tyiq = np.array([[0.299, 0.587, 0.114], [0.596, -0.274, -0.321],
-                         [0.211, -0.523, 0.311]])
-        ityiq = np.array([[1.0, 0.956, 0.621], [1.0, -0.272, -0.647],
-                          [1.0, -1.107, 1.705]])
-        # Combined matrix, transposed so it can right-multiply the pixels.
-        t = np.dot(np.dot(ityiq, bt), tyiq).T
-        img = np.dot(img, t)
-        return img
-    def apply_saturation(self, img):
-        """Blend img with its weighted gray value: img * delta + gray * (1 - delta)."""
-        low, high, prob = self.saturation
-        # Skipped (image returned as is) when the draw is below prob.
-        if np.random.uniform(0., 1.) < prob:
-            return img
-        delta = np.random.uniform(low, high)
-        img = img.astype(np.float32)
-        # it works, but result differ from HSV version
-        gray = img * np.array([[[0.299, 0.587, 0.114]]], dtype=np.float32)
-        gray = gray.sum(axis=2, keepdims=True)
-        gray *= (1.0 - delta)
-        img *= delta
-        img += gray
-        return img
-    def apply_contrast(self, img):
-        """Multiply img by a random factor drawn from [low, high]."""
-        low, high, prob = self.contrast
-        # Skipped (image returned as is) when the draw is below prob.
-        if np.random.uniform(0., 1.) < prob:
-            return img
-        delta = np.random.uniform(low, high)
-        img = img.astype(np.float32)
-        img *= delta
-        return img
-    def apply_brightness(self, img):
-        """Add a random offset drawn from [low, high] to img."""
-        low, high, prob = self.brightness
-        # Skipped (image returned as is) when the draw is below prob.
-        if np.random.uniform(0., 1.) < prob:
-            return img
-        delta = np.random.uniform(low, high)
-        img = img.astype(np.float32)
-        img += delta
-        return img
-    def apply(self, sample, context=None):
-        """Distort sample['image'] in random or fixed order and store the result."""
-        img = sample['image']
-        if self.random_apply:
-            functions = [
-                self.apply_brightness, self.apply_contrast,
-                self.apply_saturation, self.apply_hue
-            ]
-            # Shuffle the four steps and keep the first `count` of them.
-            distortions = np.random.permutation(functions)[:self.count]
-            for func in distortions:
-                img = func(img)
-            sample['image'] = img
-            # Early return: random_channel is not consulted on this path.
-            return sample
-        # Fixed order: brightness first, contrast either before or after
-        # saturation and hue depending on a coin flip.
-        img = self.apply_brightness(img)
-        mode = np.random.randint(0, 2)
-        if mode:
-            img = self.apply_contrast(img)
-        img = self.apply_saturation(img)
-        img = self.apply_hue(img)
-        if not mode:
-            img = self.apply_contrast(img)
-        if self.random_channel:
-            # With a 50% chance, shuffle the three channels.
-            if np.random.randint(0, 2):
-                img = img[..., np.random.permutation(3)]
-        sample['image'] = img
-        return sample
-@register_op
-class AutoAugment(BaseOperator):
-    def __init__(self, autoaug_type="v1"):
-        """
-        Args:
-            autoaug_type (str): autoaug type, support v0, v1, v2, v3, test
-        """
-        super(AutoAugment, self).__init__()
-        self.autoaug_type = autoaug_type
-    def apply(self, sample, context=None):
-        """
-        Learning Data Augmentation Strategies for Object Detection, see https://arxiv.org/abs/1906.11172
-        """
-        im = sample['image']
-        gt_bbox = sample['gt_bbox']
-        if not isinstance(im, np.ndarray):
-            raise TypeError("{}: image is not a numpy array.".format(self))
-        if len(im.shape) != 3:
-            raise ImageError("{}: image is not 3-dimensional.".format(self))
-        if len(gt_bbox) == 0:
-            return sample
-        height, width, _ = im.shape
-        norm_gt_bbox = np.ones_like(gt_bbox, dtype=np.float32)
-        norm_gt_bbox[:, 0] = gt_bbox[:, 1] / float(height)
-        norm_gt_bbox[:, 1] = gt_bbox[:, 0] / float(width)
-        norm_gt_bbox[:, 2] = gt_bbox[:, 3] / float(height)
-        norm_gt_bbox[:, 3] = gt_bbox[:, 2] / float(width)
-        from .autoaugment_utils import distort_image_with_autoaugment
-        im, norm_gt_bbox = distort_image_with_autoaugment(im, norm_gt_bbox,
-                                                          self.autoaug_type)
-        gt_bbox[:, 0] = norm_gt_bbox[:, 1] * float(width)
-        gt_bbox[:, 1] = norm_gt_bbox[:, 0] * float(height)
-        gt_bbox[:, 2] = norm_gt_bbox[:, 3] * float(width)
-        gt_bbox[:, 3] = norm_gt_bbox[:, 2] * float(height)
-        sample['image'] = im
-        sample['gt_bbox'] = gt_bbox
-        return sample
-@register_op
-class RandomFlip(BaseOperator):
-    def __init__(self, prob=0.5):
-        """
-        Args:
-            prob (float): the probability of flipping image
-        """
-        super(RandomFlip, self).__init__()
-        self.prob = prob
-        if not (isinstance(self.prob, float)):
-            raise TypeError("{}: input type is invalid.".format(self))
-    def apply_segm(self, segms, height, width):
-        def _flip_poly(poly, width):
-            flipped_poly = np.array(poly)
-            flipped_poly[0::2] = width - np.array(poly[0::2])
-            return flipped_poly.tolist()
-        def _flip_rle(rle, height, width):
-            if 'counts' in rle and type(rle['counts']) == list:
-                rle = mask_util.frPyObjects(rle, height, width)
-            mask = mask_util.decode(rle)
-            mask = mask[:, ::-1]
-            rle = mask_util.encode(np.array(mask, order='F', dtype=np.uint8))
-            return rle
-        flipped_segms = []
-        for segm in segms:
-            if is_poly(segm):
-                # Polygon format
-                flipped_segms.append(
-                    [_flip_poly(poly, width) for poly in segm])
-            else:
-                # RLE format
-                import pycocotools.mask as mask_util
-                flipped_segms.append(_flip_rle(segm, height, width))
-        return flipped_segms
-    def apply_keypoint(self, gt_keypoint, width):
-        for i in range(gt_keypoint.shape[1]):
-            if i % 2 == 0:
-                old_x = gt_keypoint[:, i].copy()
-                gt_keypoint[:, i] = width - old_x
-        return gt_keypoint
-    def apply_image(self, image):
-        return image[:, ::-1, :]
-    def apply_bbox(self, bbox, width):
-        oldx1 = bbox[:, 0].copy()
-        oldx2 = bbox[:, 2].copy()
-        bbox[:, 0] = width - oldx2
-        bbox[:, 2] = width - oldx1
-        return bbox
-    def apply_rbox(self, bbox, width):
-        oldx1 = bbox[:, 0].copy()
-        oldx2 = bbox[:, 2].copy()
-        oldx3 = bbox[:, 4].copy()
-        oldx4 = bbox[:, 6].copy()
-        bbox[:, 0] = width - oldx1
-        bbox[:, 2] = width - oldx2
-        bbox[:, 4] = width - oldx3
-        bbox[:, 6] = width - oldx4
-        bbox = [bbox_utils.get_best_begin_point_single(e) for e in bbox]
-        return bbox
-    def apply(self, sample, context=None):
-        """Filp the image and bounding box.
-        Operators:
-            1. Flip the image numpy.
-            2. Transform the bboxes' x coordinates.
-              (Must judge whether the coordinates are normalized!)
-            3. Transform the segmentations' x coordinates.
-              (Must judge whether the coordinates are normalized!)
-        Output:
-            sample: the image, bounding box and segmentation part
-                    in sample are flipped.
-        """
-        if np.random.uniform(0, 1) < self.prob:
-            im = sample['image']
-            height, width = im.shape[:2]
-            im = self.apply_image(im)
-            if 'gt_bbox' in sample and len(sample['gt_bbox']) > 0:
-                sample['gt_bbox'] = self.apply_bbox(sample['gt_bbox'], width)
-            if 'gt_poly' in sample and len(sample['gt_poly']) > 0:
-                sample['gt_poly'] = self.apply_segm(sample['gt_poly'], height,
-                                                    width)
-            if 'gt_keypoint' in sample and len(sample['gt_keypoint']) > 0:
-                sample['gt_keypoint'] = self.apply_keypoint(
-                    sample['gt_keypoint'], width)
-            if 'semantic' in sample and sample['semantic']:
-                sample['semantic'] = sample['semantic'][:, ::-1]
-            if 'gt_segm' in sample and sample['gt_segm'].any():
-                sample['gt_segm'] = sample['gt_segm'][:, :, ::-1]
-            if 'gt_rbox2poly' in sample and sample['gt_rbox2poly'].any():
-                sample['gt_rbox2poly'] = self.apply_rbox(
-                    sample['gt_rbox2poly'], width)
-            sample['flipped'] = True
-            sample['image'] = im
-        return sample
-@register_op
-class Resize(BaseOperator):
-    def __init__(self, target_size, keep_ratio, interp=cv2.INTER_LINEAR):
-        """
-        Resize image to target size. if keep_ratio is True,
-        resize the image's long side to the maximum of target_size
-        if keep_ratio is False, resize the image to target size(h, w)
-        Args:
-            target_size (int|list): image target size
-            keep_ratio (bool): whether keep_ratio or not, default true
-            interp (int): the interpolation method
-        """
-        super(Resize, self).__init__()
-        self.keep_ratio = keep_ratio
-        self.interp = interp
-        if not isinstance(target_size, (Integral, Sequence)):
-            raise TypeError(
-                "Type of target_size is invalid. Must be Integer or List or Tuple, now is {}".
-                format(type(target_size)))
-        if isinstance(target_size, Integral):
-            target_size = [target_size, target_size]
-        self.target_size = target_size
-    def apply_image(self, image, scale):
-        im_scale_x, im_scale_y = scale
-        return cv2.resize(
-            image,
-            None,
-            None,
-            fx=im_scale_x,
-            fy=im_scale_y,
-            interpolation=self.interp)
-    def apply_bbox(self, bbox, scale, size):
-        im_scale_x, im_scale_y = scale
-        resize_w, resize_h = size
-        bbox[:, 0::2] *= im_scale_x
-        bbox[:, 1::2] *= im_scale_y
-        bbox[:, 0::2] = np.clip(bbox[:, 0::2], 0, resize_w)
-        bbox[:, 1::2] = np.clip(bbox[:, 1::2], 0, resize_h)
-        return bbox
-    def apply_segm(self, segms, im_size, scale):
-        def _resize_poly(poly, im_scale_x, im_scale_y):
-            resized_poly = np.array(poly).astype('float32')
-            resized_poly[0::2] *= im_scale_x
-            resized_poly[1::2] *= im_scale_y
-            return resized_poly.tolist()
-        def _resize_rle(rle, im_h, im_w, im_scale_x, im_scale_y):
-            if 'counts' in rle and type(rle['counts']) == list:
-                rle = mask_util.frPyObjects(rle, im_h, im_w)
-            mask = mask_util.decode(rle)
-            mask = cv2.resize(
-                image,
-                None,
-                None,
-                fx=im_scale_x,
-                fy=im_scale_y,
-                interpolation=self.interp)
-            rle = mask_util.encode(np.array(mask, order='F', dtype=np.uint8))
-            return rle
-        im_h, im_w = im_size
-        im_scale_x, im_scale_y = scale
-        resized_segms = []
-        for segm in segms:
-            if is_poly(segm):
-                # Polygon format
-                resized_segms.append([
-                    _resize_poly(poly, im_scale_x, im_scale_y) for poly in segm
-                ])
-            else:
-                # RLE format
-                import pycocotools.mask as mask_util
-                resized_segms.append(
-                    _resize_rle(segm, im_h, im_w, im_scale_x, im_scale_y))
-        return resized_segms
-    def apply(self, sample, context=None):
-        """ Resize the image numpy.
-        """
-        im = sample['image']
-        if not isinstance(im, np.ndarray):
-            raise TypeError("{}: image type is not numpy.".format(self))
-        if len(im.shape) != 3:
-            raise ImageError('{}: image is not 3-dimensional.'.format(self))
-        # apply image
-        im_shape = im.shape
-        if self.keep_ratio:
-            im_size_min = np.min(im_shape[0:2])
-            im_size_max = np.max(im_shape[0:2])
-            target_size_min = np.min(self.target_size)
-            target_size_max = np.max(self.target_size)
-            im_scale = min(target_size_min / im_size_min,
-                           target_size_max / im_size_max)
-            resize_h = im_scale * float(im_shape[0])
-            resize_w = im_scale * float(im_shape[1])
-            im_scale_x = im_scale
-            im_scale_y = im_scale
-        else:
-            resize_h, resize_w = self.target_size
-            im_scale_y = resize_h / im_shape[0]
-            im_scale_x = resize_w / im_shape[1]
-        im = self.apply_image(sample['image'], [im_scale_x, im_scale_y])
-        sample['image'] = im
-        sample['im_shape'] = np.asarray([resize_h, resize_w], dtype=np.float32)
-        if 'scale_factor' in sample:
-            scale_factor = sample['scale_factor']
-            sample['scale_factor'] = np.asarray(
-                [scale_factor[0] * im_scale_y, scale_factor[1] * im_scale_x],
-                dtype=np.float32)
-        else:
-            sample['scale_factor'] = np.asarray(
-                [im_scale_y, im_scale_x], dtype=np.float32)
-        # apply bbox
-        if 'gt_bbox' in sample and len(sample['gt_bbox']) > 0:
-            sample['gt_bbox'] = self.apply_bbox(sample['gt_bbox'],
-                                                [im_scale_x, im_scale_y],
-                                                [resize_w, resize_h])
-        # apply rbox
-        if 'gt_rbox2poly' in sample:
-            if np.array(sample['gt_rbox2poly']).shape[1] != 8:
-                logger.warn(
-                    "gt_rbox2poly's length shoule be 8, but actually is {}".
-                    format(len(sample['gt_rbox2poly'])))
-            sample['gt_rbox2poly'] = self.apply_bbox(sample['gt_rbox2poly'],
-                                                     [im_scale_x, im_scale_y],
-                                                     [resize_w, resize_h])
-        # apply polygon
-        if 'gt_poly' in sample and len(sample['gt_poly']) > 0:
-            sample['gt_poly'] = self.apply_segm(
-                sample['gt_poly'], im_shape[:2], [im_scale_x, im_scale_y])
-        # apply semantic
-        if 'semantic' in sample and sample['semantic']:
-            semantic = sample['semantic']
-            semantic = cv2.resize(
-                semantic.astype('float32'),
-                None,
-                None,
-                fx=im_scale_x,
-                fy=im_scale_y,
-                interpolation=self.interp)
-            semantic = np.asarray(semantic).astype('int32')
-            semantic = np.expand_dims(semantic, 0)
-            sample['semantic'] = semantic
-        # apply gt_segm
-        if 'gt_segm' in sample and len(sample['gt_segm']) > 0:
-            masks = [
-                cv2.resize(
-                    gt_segm,
-                    None,
-                    None,
-                    fx=im_scale_x,
-                    fy=im_scale_y,
-                    interpolation=cv2.INTER_NEAREST)
-                for gt_segm in sample['gt_segm']
-            ]
-            sample['gt_segm'] = np.asarray(masks).astype(np.uint8)
-        return sample
-@register_op
-class MultiscaleTestResize(BaseOperator):
-    def __init__(self,
-                 origin_target_size=[800, 1333],
-                 target_size=[],
-                 interp=cv2.INTER_LINEAR,
-                 use_flip=True):
-        """
-        Rescale image to the each size in target size, and capped at max_size.
-        Args:
-            origin_target_size (list): origin target size of image
-            target_size (list): A list of target sizes of image.
-            interp (int): the interpolation method.
-            use_flip (bool): whether use flip augmentation.
-        """
-        super(MultiscaleTestResize, self).__init__()
-        self.interp = interp
-        self.use_flip = use_flip
-        if not isinstance(target_size, Sequence):
-            raise TypeError(
-                "Type of target_size is invalid. Must be List or Tuple, now is {}".
-                format(type(target_size)))
-        self.target_size = target_size
-        if not isinstance(origin_target_size, Sequence):
-            raise TypeError(
-                "Type of origin_target_size is invalid. Must be List or Tuple, now is {}".
-                format(type(origin_target_size)))
-        self.origin_target_size = origin_target_size
-    def apply(self, sample, context=None):
-        """ Resize the image numpy for multi-scale test.
-        """
-        samples = []
-        resizer = Resize(
-            self.origin_target_size, keep_ratio=True, interp=self.interp)
-        samples.append(resizer(sample.copy(), context))
-        if self.use_flip:
-            flipper = RandomFlip(1.1)
-            samples.append(flipper(sample.copy(), context=context))
-        for size in self.target_size:
-            resizer = Resize(size, keep_ratio=True, interp=self.interp)
-            samples.append(resizer(sample.copy(), context))
-        return samples
-@register_op
-class RandomResize(BaseOperator):
-    def __init__(self,
-                 target_size,
-                 keep_ratio=True,
-                 interp=cv2.INTER_LINEAR,
-                 random_size=True,
-                 random_interp=False):
-        """
-        Resize image to target size randomly. random target_size and interpolation method
-        Args:
-            target_size (int, list, tuple): image target size, if random size is True, must be list or tuple
-            keep_ratio (bool): whether keep_raio or not, default true
-            interp (int): the interpolation method
-            random_size (bool): whether random select target size of image
-            random_interp (bool): whether random select interpolation method
-        """
-        super(RandomResize, self).__init__()
-        self.keep_ratio = keep_ratio
-        self.interp = interp
-        self.interps = [
-            cv2.INTER_NEAREST,
-            cv2.INTER_LINEAR,
-            cv2.INTER_AREA,
-            cv2.INTER_CUBIC,
-            cv2.INTER_LANCZOS4,
-        ]
-        assert isinstance(target_size, (
-            Integral, Sequence)), "target_size must be Integer, List or Tuple"
-        if random_size and not isinstance(target_size, Sequence):
-            raise TypeError(
-                "Type of target_size is invalid when random_size is True. Must be List or Tuple, now is {}".
-                format(type(target_size)))
-        self.target_size = target_size
-        self.random_size = random_size
-        self.random_interp = random_interp
-    def apply(self, sample, context=None):
-        """ Resize the image numpy.
-        """
-        if self.random_size:
-            target_size = random.choice(self.target_size)
-        else:
-            target_size = self.target_size
-        if self.random_interp:
-            interp = random.choice(self.interps)
-        else:
-            interp = self.interp
-        resizer = Resize(target_size, self.keep_ratio, interp)
-        return resizer(sample, context=context)
-@register_op
-class RandomExpand(BaseOperator):
-    """Random expand the canvas.
-    Args:
-        ratio (float): maximum expansion ratio.
-        prob (float): probability to expand.
-        fill_value (list): color value used to fill the canvas. in RGB order.
-    """
-    def __init__(self, ratio=4., prob=0.5, fill_value=(127.5, 127.5, 127.5)):
-        super(RandomExpand, self).__init__()
-        assert ratio > 1.01, "expand ratio must be larger than 1.01"
-        self.ratio = ratio
-        self.prob = prob
-        assert isinstance(fill_value, (Number, Sequence)), \
-            "fill value must be either float or sequence"
-        if isinstance(fill_value, Number):
-            fill_value = (fill_value, ) * 3
-        if not isinstance(fill_value, tuple):
-            fill_value = tuple(fill_value)
-        self.fill_value = fill_value
-    def apply(self, sample, context=None):
-        if np.random.uniform(0., 1.) < self.prob:
-            return sample
-        im = sample['image']
-        height, width = im.shape[:2]
-        ratio = np.random.uniform(1., self.ratio)
-        h = int(height * ratio)
-        w = int(width * ratio)
-        if not h > height or not w > width:
-            return sample
-        y = np.random.randint(0, h - height)
-        x = np.random.randint(0, w - width)
-        offsets, size = [x, y], [h, w]
-        pad = Pad(size,
-                  pad_mode=-1,
-                  offsets=offsets,
-                  fill_value=self.fill_value)
-        return pad(sample, context=context)
-@register_op
-class CropWithSampling(BaseOperator):
-    def __init__(self, batch_sampler, satisfy_all=False, avoid_no_bbox=True):
-        """
-        Args:
-            batch_sampler (list): Multiple sets of different
-                                  parameters for cropping.
-            satisfy_all (bool): whether all boxes must satisfy.
-            e.g.[[1, 1, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0],
-                 [1, 50, 0.3, 1.0, 0.5, 2.0, 0.1, 1.0],
-                 [1, 50, 0.3, 1.0, 0.5, 2.0, 0.3, 1.0],
-                 [1, 50, 0.3, 1.0, 0.5, 2.0, 0.5, 1.0],
-                 [1, 50, 0.3, 1.0, 0.5, 2.0, 0.7, 1.0],
-                 [1, 50, 0.3, 1.0, 0.5, 2.0, 0.9, 1.0],
-                 [1, 50, 0.3, 1.0, 0.5, 2.0, 0.0, 1.0]]
-           [max sample, max trial, min scale, max scale,
-            min aspect ratio, max aspect ratio,
-            min overlap, max overlap]
-            avoid_no_bbox (bool): whether to to avoid the
-                                  situation where the box does not appear.
-        """
-        super(CropWithSampling, self).__init__()
-        self.batch_sampler = batch_sampler
-        self.satisfy_all = satisfy_all
-        self.avoid_no_bbox = avoid_no_bbox
-    def apply(self, sample, context):
-        """
-        Crop the image and modify bounding box.
-        Operators:
-            1. Scale the image width and height.
-            2. Crop the image according to a radom sample.
-            3. Rescale the bounding box.
-            4. Determine if the new bbox is satisfied in the new image.
-        Returns:
-            sample: the image, bounding box are replaced.
-        """
-        assert 'image' in sample, "image data not found"
-        im = sample['image']
-        gt_bbox = sample['gt_bbox']
-        gt_class = sample['gt_class']
-        im_height, im_width = im.shape[:2]
-        gt_score = None
-        if 'gt_score' in sample:
-            gt_score = sample['gt_score']
-        sampled_bbox = []
-        gt_bbox = gt_bbox.tolist()
-        for sampler in self.batch_sampler:
-            found = 0
-            for i in range(sampler[1]):
-                if found >= sampler[0]:
-                    break
-                sample_bbox = generate_sample_bbox(sampler)
-                if satisfy_sample_constraint(sampler, sample_bbox, gt_bbox,
-                                             self.satisfy_all):
-                    sampled_bbox.append(sample_bbox)
-                    found = found + 1
-        im = np.array(im)
-        while sampled_bbox:
-            idx = int(np.random.uniform(0, len(sampled_bbox)))
-            sample_bbox = sampled_bbox.pop(idx)
-            sample_bbox = clip_bbox(sample_bbox)
-            crop_bbox, crop_class, crop_score = \
-                filter_and_process(sample_bbox, gt_bbox, gt_class, scores=gt_score)
-            if self.avoid_no_bbox:
-                if len(crop_bbox) < 1:
-                    continue
-            xmin = int(sample_bbox[0] * im_width)
-            xmax = int(sample_bbox[2] * im_width)
-            ymin = int(sample_bbox[1] * im_height)
-            ymax = int(sample_bbox[3] * im_height)
-            im = im[ymin:ymax, xmin:xmax]
-            sample['image'] = im
-            sample['gt_bbox'] = crop_bbox
-            sample['gt_class'] = crop_class
-            sample['gt_score'] = crop_score
-            return sample
-        return sample
-@register_op
-class CropWithDataAchorSampling(BaseOperator):
-    def __init__(self,
-                 batch_sampler,
-                 anchor_sampler=None,
-                 target_size=None,
-                 das_anchor_scales=[16, 32, 64, 128],
-                 sampling_prob=0.5,
-                 min_size=8.,
-                 avoid_no_bbox=True):
-        """
-        Args:
-            anchor_sampler (list): anchor_sampling sets of different
-                                  parameters for cropping.
-            batch_sampler (list): Multiple sets of different
-                                  parameters for cropping.
-              e.g.[[1, 10, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.2, 0.0]]
-                  [[1, 50, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0],
-                   [1, 50, 0.3, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0],
-                   [1, 50, 0.3, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0],
-                   [1, 50, 0.3, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0],
-                   [1, 50, 0.3, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0]]
-              [max sample, max trial, min scale, max scale,
-               min aspect ratio, max aspect ratio,
-               min overlap, max overlap, min coverage, max coverage]
-            target_size (int): target image size.
-            das_anchor_scales (list[float]): a list of anchor scales in data
-                anchor smapling.
-            min_size (float): minimum size of sampled bbox.
-            avoid_no_bbox (bool): whether to to avoid the
-                                  situation where the box does not appear.
-        """
-        super(CropWithDataAchorSampling, self).__init__()
-        self.anchor_sampler = anchor_sampler
-        self.batch_sampler = batch_sampler
-        self.target_size = target_size
-        self.sampling_prob = sampling_prob
-        self.min_size = min_size
-        self.avoid_no_bbox = avoid_no_bbox
-        self.das_anchor_scales = np.array(das_anchor_scales)
-    def apply(self, sample, context):
-        """
-        Crop the image and modify bounding box.
-        Operators:
-            1. Scale the image width and height.
-            2. Crop the image according to a radom sample.
-            3. Rescale the bounding box.
-            4. Determine if the new bbox is satisfied in the new image.
-        Returns:
-            sample: the image, bounding box are replaced.
-        """
-        assert 'image' in sample, "image data not found"
-        im = sample['image']
-        gt_bbox = sample['gt_bbox']
-        gt_class = sample['gt_class']
-        image_height, image_width = im.shape[:2]
-        gt_bbox[:, 0] /= image_width
-        gt_bbox[:, 1] /= image_height
-        gt_bbox[:, 2] /= image_width
-        gt_bbox[:, 3] /= image_height
-        gt_score = None
-        if 'gt_score' in sample:
-            gt_score = sample['gt_score']
-        sampled_bbox = []
-        gt_bbox = gt_bbox.tolist()
-        prob = np.random.uniform(0., 1.)
-        if prob > self.sampling_prob:  # anchor sampling
-            assert self.anchor_sampler
-            for sampler in self.anchor_sampler:
-                found = 0
-                for i in range(sampler[1]):
-                    if found >= sampler[0]:
-                        break
-                    sample_bbox = data_anchor_sampling(
-                        gt_bbox, image_width, image_height,
-                        self.das_anchor_scales, self.target_size)
-                    if sample_bbox == 0:
-                        break
-                    if satisfy_sample_constraint_coverage(sampler, sample_bbox,
-                                                          gt_bbox):
-                        sampled_bbox.append(sample_bbox)
-                        found = found + 1
-            im = np.array(im)
-            while sampled_bbox:
-                idx = int(np.random.uniform(0, len(sampled_bbox)))
-                sample_bbox = sampled_bbox.pop(idx)
-                if 'gt_keypoint' in sample.keys():
-                    keypoints = (sample['gt_keypoint'],
-                                 sample['keypoint_ignore'])
-                    crop_bbox, crop_class, crop_score, gt_keypoints = \
-                        filter_and_process(sample_bbox, gt_bbox, gt_class,
-                                scores=gt_score,
-                                keypoints=keypoints)
-                else:
-                    crop_bbox, crop_class, crop_score = filter_and_process(
-                        sample_bbox, gt_bbox, gt_class, scores=gt_score)
-                crop_bbox, crop_class, crop_score = bbox_area_sampling(
-                    crop_bbox, crop_class, crop_score, self.target_size,
-                    self.min_size)
-                if self.avoid_no_bbox:
-                    if len(crop_bbox) < 1:
-                        continue
-                im = crop_image_sampling(im, sample_bbox, image_width,
-                                         image_height, self.target_size)
-                height, width = im.shape[:2]
-                crop_bbox[:, 0] *= width
-                crop_bbox[:, 1] *= height
-                crop_bbox[:, 2] *= width
-                crop_bbox[:, 3] *= height
-                sample['image'] = im
-                sample['gt_bbox'] = crop_bbox
-                sample['gt_class'] = crop_class
-                if 'gt_score' in sample:
-                    sample['gt_score'] = crop_score
-                if 'gt_keypoint' in sample.keys():
-                    sample['gt_keypoint'] = gt_keypoints[0]
-                    sample['keypoint_ignore'] = gt_keypoints[1]
-                return sample
-            return sample
-        else:
-            for sampler in self.batch_sampler:
-                found = 0
-                for i in range(sampler[1]):
-                    if found >= sampler[0]:
-                        break
-                    sample_bbox = generate_sample_bbox_square(
-                        sampler, image_width, image_height)
-                    if satisfy_sample_constraint_coverage(sampler, sample_bbox,
-                                                          gt_bbox):
-                        sampled_bbox.append(sample_bbox)
-                        found = found + 1
-            im = np.array(im)
-            while sampled_bbox:
-                idx = int(np.random.uniform(0, len(sampled_bbox)))
-                sample_bbox = sampled_bbox.pop(idx)
-                sample_bbox = clip_bbox(sample_bbox)
-                if 'gt_keypoint' in sample.keys():
-                    keypoints = (sample['gt_keypoint'],
-                                 sample['keypoint_ignore'])
-                    crop_bbox, crop_class, crop_score, gt_keypoints = \
-                        filter_and_process(sample_bbox, gt_bbox, gt_class,
-                                scores=gt_score,
-                                keypoints=keypoints)
-                else:
-                    crop_bbox, crop_class, crop_score = filter_and_process(
-                        sample_bbox, gt_bbox, gt_class, scores=gt_score)
-                # sampling bbox according the bbox area
-                crop_bbox, crop_class, crop_score = bbox_area_sampling(
-                    crop_bbox, crop_class, crop_score, self.target_size,
-                    self.min_size)
-                if self.avoid_no_bbox:
-                    if len(crop_bbox) < 1:
-                        continue
-                xmin = int(sample_bbox[0] * image_width)
-                xmax = int(sample_bbox[2] * image_width)
-                ymin = int(sample_bbox[1] * image_height)
-                ymax = int(sample_bbox[3] * image_height)
-                im = im[ymin:ymax, xmin:xmax]
-                height, width = im.shape[:2]
-                crop_bbox[:, 0] *= width
-                crop_bbox[:, 1] *= height
-                crop_bbox[:, 2] *= width
-                crop_bbox[:, 3] *= height
-                sample['image'] = im
-                sample['gt_bbox'] = crop_bbox
-                sample['gt_class'] = crop_class
-                if 'gt_score' in sample:
-                    sample['gt_score'] = crop_score
-                if 'gt_keypoint' in sample.keys():
-                    sample['gt_keypoint'] = gt_keypoints[0]
-                    sample['keypoint_ignore'] = gt_keypoints[1]
-                return sample
-            return sample
-@register_op
-class RandomCrop(BaseOperator):
-    """Random crop image and bboxes.
-    Args:
-        aspect_ratio (list): aspect ratio of cropped region.
-            in [min, max] format.
-        thresholds (list): iou thresholds for decide a valid bbox crop.
-        scaling (list): ratio between a cropped region and the original image.
-             in [min, max] format.
-        num_attempts (int): number of tries before giving up.
-        allow_no_crop (bool): allow return without actually cropping them.
-        cover_all_box (bool): ensure all bboxes are covered in the final crop.
-        is_mask_crop(bool): whether crop the segmentation.
-    """
-    def __init__(self,
-                 aspect_ratio=[.5, 2.],
-                 thresholds=[.0, .1, .3, .5, .7, .9],
-                 scaling=[.3, 1.],
-                 num_attempts=50,
-                 allow_no_crop=True,
-                 cover_all_box=False,
-                 is_mask_crop=False):
-        super(RandomCrop, self).__init__()
-        self.aspect_ratio = aspect_ratio
-        self.thresholds = thresholds
-        self.scaling = scaling
-        self.num_attempts = num_attempts
-        self.allow_no_crop = allow_no_crop
-        self.cover_all_box = cover_all_box
-        self.is_mask_crop = is_mask_crop
-    def crop_segms(self, segms, valid_ids, crop, height, width):
-        def _crop_poly(segm, crop):
-            xmin, ymin, xmax, ymax = crop
-            crop_coord = [xmin, ymin, xmin, ymax, xmax, ymax, xmax, ymin]
-            crop_p = np.array(crop_coord).reshape(4, 2)
-            crop_p = Polygon(crop_p)
-            crop_segm = list()
-            for poly in segm:
-                poly = np.array(poly).reshape(len(poly) // 2, 2)
-                polygon = Polygon(poly)
-                if not polygon.is_valid:
-                    exterior = polygon.exterior
-                    multi_lines = exterior.intersection(exterior)
-                    polygons = shapely.ops.polygonize(multi_lines)
-                    polygon = MultiPolygon(polygons)
-                multi_polygon = list()
-                if isinstance(polygon, MultiPolygon):
-                    multi_polygon = copy.deepcopy(polygon)
-                else:
-                    multi_polygon.append(copy.deepcopy(polygon))
-                for per_polygon in multi_polygon:
-                    inter = per_polygon.intersection(crop_p)
-                    if not inter:
-                        continue
-                    if isinstance(inter, (MultiPolygon, GeometryCollection)):
-                        for part in inter:
-                            if not isinstance(part, Polygon):
-                                continue
-                            part = np.squeeze(
-                                np.array(part.exterior.coords[:-1]).reshape(
-                                    1, -1))
-                            part[0::2] -= xmin
-                            part[1::2] -= ymin
-                            crop_segm.append(part.tolist())
-                    elif isinstance(inter, Polygon):
-                        crop_poly = np.squeeze(
-                            np.array(inter.exterior.coords[:-1]).reshape(1,
-                                                                         -1))
-                        crop_poly[0::2] -= xmin
-                        crop_poly[1::2] -= ymin
-                        crop_segm.append(crop_poly.tolist())
-                    else:
-                        continue
-            return crop_segm
-        def _crop_rle(rle, crop, height, width):
-            if 'counts' in rle and type(rle['counts']) == list:
-                rle = mask_util.frPyObjects(rle, height, width)
-            mask = mask_util.decode(rle)
-            mask = mask[crop[1]:crop[3], crop[0]:crop[2]]
-            rle = mask_util.encode(np.array(mask, order='F', dtype=np.uint8))
-            return rle
-        crop_segms = []
-        for id in valid_ids:
-            segm = segms[id]
-            if is_poly(segm):
-                import copy
-                import shapely.ops
-                from shapely.geometry import Polygon, MultiPolygon, GeometryCollection
-                logging.getLogger("shapely").setLevel(logging.WARNING)
-                # Polygon format
-                crop_segms.append(_crop_poly(segm, crop))
-            else:
-                # RLE format
-                import pycocotools.mask as mask_util
-                crop_segms.append(_crop_rle(segm, crop, height, width))
-        return crop_segms
-    def apply(self, sample, context=None):
-        if 'gt_bbox' in sample and len(sample['gt_bbox']) == 0:
-            return sample
-        h, w = sample['image'].shape[:2]
-        gt_bbox = sample['gt_bbox']
-        # NOTE Original method attempts to generate one candidate for each
-        # threshold then randomly sample one from the resulting list.
-        # Here a short circuit approach is taken, i.e., randomly choose a
-        # threshold and attempt to find a valid crop, and simply return the
-        # first one found.
-        # The probability is not exactly the same, kinda resembling the
-        # "Monty Hall" problem. Actually carrying out the attempts will affect
-        # observability (just like opening doors in the "Monty Hall" game).
-        thresholds = list(self.thresholds)
-        if self.allow_no_crop:
-            thresholds.append('no_crop')
-        np.random.shuffle(thresholds)
-        for thresh in thresholds:
-            if thresh == 'no_crop':
-                return sample
-            found = False
-            for i in range(self.num_attempts):
-                scale = np.random.uniform(*self.scaling)
-                if self.aspect_ratio is not None:
-                    min_ar, max_ar = self.aspect_ratio
-                    aspect_ratio = np.random.uniform(
-                        max(min_ar, scale**2), min(max_ar, scale**-2))
-                    h_scale = scale / np.sqrt(aspect_ratio)
-                    w_scale = scale * np.sqrt(aspect_ratio)
-                else:
-                    h_scale = np.random.uniform(*self.scaling)
-                    w_scale = np.random.uniform(*self.scaling)
-                crop_h = h * h_scale
-                crop_w = w * w_scale
-                if self.aspect_ratio is None:
-                    if crop_h / crop_w < 0.5 or crop_h / crop_w > 2.0:
-                        continue
-                crop_h = int(crop_h)
-                crop_w = int(crop_w)
-                crop_y = np.random.randint(0, h - crop_h)
-                crop_x = np.random.randint(0, w - crop_w)
-                crop_box = [crop_x, crop_y, crop_x + crop_w, crop_y + crop_h]
-                iou = self._iou_matrix(
-                    gt_bbox, np.array(
-                        [crop_box], dtype=np.float32))
-                if iou.max() < thresh:
-                    continue
-                if self.cover_all_box and iou.min() < thresh:
-                    continue
-                cropped_box, valid_ids = self._crop_box_with_center_constraint(
-                    gt_bbox, np.array(
-                        crop_box, dtype=np.float32))
-                if valid_ids.size > 0:
-                    found = True
-                    break
-            if found:
-                if self.is_mask_crop and 'gt_poly' in sample and len(sample[
-                        'gt_poly']) > 0:
-                    crop_polys = self.crop_segms(
-                        sample['gt_poly'],
-                        valid_ids,
-                        np.array(
-                            crop_box, dtype=np.int64),
-                        h,
-                        w)
-                    if [] in crop_polys:
-                        delete_id = list()
-                        valid_polys = list()
-                        for id, crop_poly in enumerate(crop_polys):
-                            if crop_poly == []:
-                                delete_id.append(id)
-                            else:
-                                valid_polys.append(crop_poly)
-                        valid_ids = np.delete(valid_ids, delete_id)
-                        if len(valid_polys) == 0:
-                            return sample
-                        sample['gt_poly'] = valid_polys
-                    else:
-                        sample['gt_poly'] = crop_polys
-                if 'gt_segm' in sample:
-                    sample['gt_segm'] = self._crop_segm(sample['gt_segm'],
-                                                        crop_box)
-                    sample['gt_segm'] = np.take(
-                        sample['gt_segm'], valid_ids, axis=0)
-                sample['image'] = self._crop_image(sample['image'], crop_box)
-                sample['gt_bbox'] = np.take(cropped_box, valid_ids, axis=0)
-                sample['gt_class'] = np.take(
-                    sample['gt_class'], valid_ids, axis=0)
-                if 'gt_score' in sample:
-                    sample['gt_score'] = np.take(
-                        sample['gt_score'], valid_ids, axis=0)
-                if 'is_crowd' in sample:
-                    sample['is_crowd'] = np.take(
-                        sample['is_crowd'], valid_ids, axis=0)
-                return sample
-        return sample
-    def _iou_matrix(self, a, b):
-        tl_i = np.maximum(a[:, np.newaxis, :2], b[:, :2])
-        br_i = np.minimum(a[:, np.newaxis, 2:], b[:, 2:])
-        area_i = np.prod(br_i - tl_i, axis=2) * (tl_i < br_i).all(axis=2)
-        area_a = np.prod(a[:, 2:] - a[:, :2], axis=1)
-        area_b = np.prod(b[:, 2:] - b[:, :2], axis=1)
-        area_o = (area_a[:, np.newaxis] + area_b - area_i)
-        return area_i / (area_o + 1e-10)
-    def _crop_box_with_center_constraint(self, box, crop):
-        cropped_box = box.copy()
-        cropped_box[:, :2] = np.maximum(box[:, :2], crop[:2])
-        cropped_box[:, 2:] = np.minimum(box[:, 2:], crop[2:])
-        cropped_box[:, :2] -= crop[:2]
-        cropped_box[:, 2:] -= crop[:2]
-        centers = (box[:, :2] + box[:, 2:]) / 2
-        valid = np.logical_and(crop[:2] <= centers,
-                               centers < crop[2:]).all(axis=1)
-        valid = np.logical_and(
-            valid, (cropped_box[:, :2] < cropped_box[:, 2:]).all(axis=1))
-        return cropped_box, np.where(valid)[0]
-    def _crop_image(self, img, crop):
-        x1, y1, x2, y2 = crop
-        return img[y1:y2, x1:x2, :]
-    def _crop_segm(self, segm, crop):
-        x1, y1, x2, y2 = crop
-        return segm[:, y1:y2, x1:x2]
-@register_op
-class RandomScaledCrop(BaseOperator):
-    """Resize image and bbox based on long side (with optional random scaling),
-       then crop or pad image to target size.
-    Args:
-        target_dim (int): target size.
-        scale_range (list): random scale range.
-        interp (int): interpolation method, default to `cv2.INTER_LINEAR`.
-    """
-    def __init__(self,
-                 target_dim=512,
-                 scale_range=[.1, 2.],
-                 interp=cv2.INTER_LINEAR):
-        super(RandomScaledCrop, self).__init__()
-        self.target_dim = target_dim
-        self.scale_range = scale_range
-        self.interp = interp
-    def apply(self, sample, context=None):
-        img = sample['image']
-        h, w = img.shape[:2]
-        random_scale = np.random.uniform(*self.scale_range)
-        dim = self.target_dim
-        random_dim = int(dim * random_scale)
-        dim_max = max(h, w)
-        scale = random_dim / dim_max
-        resize_w = w * scale
-        resize_h = h * scale
-        offset_x = int(max(0, np.random.uniform(0., resize_w - dim)))
-        offset_y = int(max(0, np.random.uniform(0., resize_h - dim)))
-        img = cv2.resize(img, (resize_w, resize_h), interpolation=self.interp)
-        img = np.array(img)
-        canvas = np.zeros((dim, dim, 3), dtype=img.dtype)
-        canvas[:min(dim, resize_h), :min(dim, resize_w), :] = img[
-            offset_y:offset_y + dim, offset_x:offset_x + dim, :]
-        sample['image'] = canvas
-        sample['im_shape'] = np.asarray([resize_h, resize_w], dtype=np.float32)
-        scale_factor = sample['sacle_factor']
-        sample['scale_factor'] = np.asarray(
-            [scale_factor[0] * scale, scale_factor[1] * scale],
-            dtype=np.float32)
-        if 'gt_bbox' in sample and len(sample['gt_bbox']) > 0:
-            scale_array = np.array([scale, scale] * 2, dtype=np.float32)
-            shift_array = np.array([offset_x, offset_y] * 2, dtype=np.float32)
-            boxes = sample['gt_bbox'] * scale_array - shift_array
-            boxes = np.clip(boxes, 0, dim - 1)
-            # filter boxes with no area
-            area = np.prod(boxes[..., 2:] - boxes[..., :2], axis=1)
-            valid = (area > 1.).nonzero()[0]
-            sample['gt_bbox'] = boxes[valid]
-            sample['gt_class'] = sample['gt_class'][valid]
-        return sample
-@register_op
-class Cutmix(BaseOperator):
-    def __init__(self, alpha=1.5, beta=1.5):
-        """
-        CutMix: Regularization Strategy to Train Strong Classifiers with Localizable Features, see https://arxiv.org/abs/1905.04899
-        Cutmix image and gt_bbbox/gt_score
-        Args:
-             alpha (float): alpha parameter of beta distribute
-             beta (float): beta parameter of beta distribute
-        """
-        super(Cutmix, self).__init__()
-        self.alpha = alpha
-        self.beta = beta
-        if self.alpha <= 0.0:
-            raise ValueError("alpha shold be positive in {}".format(self))
-        if self.beta <= 0.0:
-            raise ValueError("beta shold be positive in {}".format(self))
-    def apply_image(self, img1, img2, factor):
-        """ _rand_bbox """
-        h = max(img1.shape[0], img2.shape[0])
-        w = max(img1.shape[1], img2.shape[1])
-        cut_rat = np.sqrt(1. - factor)
-        cut_w = np.int(w * cut_rat)
-        cut_h = np.int(h * cut_rat)
-        # uniform
-        cx = np.random.randint(w)
-        cy = np.random.randint(h)
-        bbx1 = np.clip(cx - cut_w // 2, 0, w - 1)
-        bby1 = np.clip(cy - cut_h // 2, 0, h - 1)
-        bbx2 = np.clip(cx + cut_w // 2, 0, w - 1)
-        bby2 = np.clip(cy + cut_h // 2, 0, h - 1)
-        img_1_pad = np.zeros((h, w, img1.shape[2]), 'float32')
-        img_1_pad[:img1.shape[0], :img1.shape[1], :] = \
-            img1.astype('float32')
-        img_2_pad = np.zeros((h, w, img2.shape[2]), 'float32')
-        img_2_pad[:img2.shape[0], :img2.shape[1], :] = \
-            img2.astype('float32')
-        img_1_pad[bby1:bby2, bbx1:bbx2, :] = img_2_pad[bby1:bby2, bbx1:bbx2, :]
-        return img_1_pad
-    def __call__(self, sample, context=None):
-        if not isinstance(sample, Sequence):
-            return sample
-        assert len(sample) == 2, 'cutmix need two samples'
-        factor = np.random.beta(self.alpha, self.beta)
-        factor = max(0.0, min(1.0, factor))
-        if factor >= 1.0:
-            return sample[0]
-        if factor <= 0.0:
-            return sample[1]
-        img1 = sample[0]['image']
-        img2 = sample[1]['image']
-        img = self.apply_image(img1, img2, factor)
-        gt_bbox1 = sample[0]['gt_bbox']
-        gt_bbox2 = sample[1]['gt_bbox']
-        gt_bbox = np.concatenate((gt_bbox1, gt_bbox2), axis=0)
-        gt_class1 = sample[0]['gt_class']
-        gt_class2 = sample[1]['gt_class']
-        gt_class = np.concatenate((gt_class1, gt_class2), axis=0)
-        gt_score1 = np.ones_like(sample[0]['gt_class'])
-        gt_score2 = np.ones_like(sample[1]['gt_class'])
-        gt_score = np.concatenate(
-            (gt_score1 * factor, gt_score2 * (1. - factor)), axis=0)
-        result = copy.deepcopy(sample[0])
-        result['image'] = img
-        result['gt_bbox'] = gt_bbox
-        result['gt_score'] = gt_score
-        result['gt_class'] = gt_class
-        if 'is_crowd' in sample[0]:
-            is_crowd1 = sample[0]['is_crowd']
-            is_crowd2 = sample[1]['is_crowd']
-            is_crowd = np.concatenate((is_crowd1, is_crowd2), axis=0)
-            result['is_crowd'] = is_crowd
-        if 'difficult' in sample[0]:
-            is_difficult1 = sample[0]['difficult']
-            is_difficult2 = sample[1]['difficult']
-            is_difficult = np.concatenate(
-                (is_difficult1, is_difficult2), axis=0)
-            result['difficult'] = is_difficult
-        return result
-@register_op
-class Mixup(BaseOperator):
-    def __init__(self, alpha=1.5, beta=1.5):
-        """ Mixup image and gt_bbbox/gt_score
-        Args:
-            alpha (float): alpha parameter of beta distribute
-            beta (float): beta parameter of beta distribute
-        """
-        super(Mixup, self).__init__()
-        self.alpha = alpha
-        self.beta = beta
-        if self.alpha <= 0.0:
-            raise ValueError("alpha shold be positive in {}".format(self))
-        if self.beta <= 0.0:
-            raise ValueError("beta shold be positive in {}".format(self))
-    def apply_image(self, img1, img2, factor):
-        h = max(img1.shape[0], img2.shape[0])
-        w = max(img1.shape[1], img2.shape[1])
-        img = np.zeros((h, w, img1.shape[2]), 'float32')
-        img[:img1.shape[0], :img1.shape[1], :] = \
-            img1.astype('float32') * factor
-        img[:img2.shape[0], :img2.shape[1], :] += \
-            img2.astype('float32') * (1.0 - factor)
-        return img.astype('uint8')
-    def __call__(self, sample, context=None):
-        if not isinstance(sample, Sequence):
-            return sample
-        assert len(sample) == 2, 'mixup need two samples'
-        factor = np.random.beta(self.alpha, self.beta)
-        factor = max(0.0, min(1.0, factor))
-        if factor >= 1.0:
-            return sample[0]
-        if factor <= 0.0:
-            return sample[1]
-        im = self.apply_image(sample[0]['image'], sample[1]['image'], factor)
-        result = copy.deepcopy(sample[0])
-        result['image'] = im
-        # apply bbox and score
-        if 'gt_bbox' in sample[0]:
-            gt_bbox1 = sample[0]['gt_bbox']
-            gt_bbox2 = sample[1]['gt_bbox']
-            gt_bbox = np.concatenate((gt_bbox1, gt_bbox2), axis=0)
-            result['gt_bbox'] = gt_bbox
-        if 'gt_class' in sample[0]:
-            gt_class1 = sample[0]['gt_class']
-            gt_class2 = sample[1]['gt_class']
-            gt_class = np.concatenate((gt_class1, gt_class2), axis=0)
-            result['gt_class'] = gt_class
-            gt_score1 = np.ones_like(sample[0]['gt_class'])
-            gt_score2 = np.ones_like(sample[1]['gt_class'])
-            gt_score = np.concatenate(
-                (gt_score1 * factor, gt_score2 * (1. - factor)), axis=0)
-            result['gt_score'] = gt_score
-        if 'is_crowd' in sample[0]:
-            is_crowd1 = sample[0]['is_crowd']
-            is_crowd2 = sample[1]['is_crowd']
-            is_crowd = np.concatenate((is_crowd1, is_crowd2), axis=0)
-            result['is_crowd'] = is_crowd
-        if 'difficult' in sample[0]:
-            is_difficult1 = sample[0]['difficult']
-            is_difficult2 = sample[1]['difficult']
-            is_difficult = np.concatenate(
-                (is_difficult1, is_difficult2), axis=0)
-            result['difficult'] = is_difficult
-        if 'gt_ide' in sample[0]:
-            gt_ide1 = sample[0]['gt_ide']
-            gt_ide2 = sample[1]['gt_ide']
-            gt_ide = np.concatenate((gt_ide1, gt_ide2), axis=0)
-            result['gt_ide'] = gt_ide
-        return result
-@register_op
-class NormalizeBox(BaseOperator):
-    """Transform the bounding box's coornidates to [0,1]."""
-    def __init__(self):
-        super(NormalizeBox, self).__init__()
-    def apply(self, sample, context):
-        im = sample['image']
-        gt_bbox = sample['gt_bbox']
-        height, width, _ = im.shape
-        for i in range(gt_bbox.shape[0]):
-            gt_bbox[i][0] = gt_bbox[i][0] / width
-            gt_bbox[i][1] = gt_bbox[i][1] / height
-            gt_bbox[i][2] = gt_bbox[i][2] / width
-            gt_bbox[i][3] = gt_bbox[i][3] / height
-        sample['gt_bbox'] = gt_bbox
-        if 'gt_keypoint' in sample.keys():
-            gt_keypoint = sample['gt_keypoint']
-            for i in range(gt_keypoint.shape[1]):
-                if i % 2:
-                    gt_keypoint[:, i] = gt_keypoint[:, i] / height
-                else:
-                    gt_keypoint[:, i] = gt_keypoint[:, i] / width
-            sample['gt_keypoint'] = gt_keypoint
-        return sample
-@register_op
-class BboxXYXY2XYWH(BaseOperator):
-    """
-    Convert bbox XYXY format to XYWH format.
-    """
-    def __init__(self):
-        super(BboxXYXY2XYWH, self).__init__()
-    def apply(self, sample, context=None):
-        assert 'gt_bbox' in sample
-        bbox = sample['gt_bbox']
-        bbox[:, 2:4] = bbox[:, 2:4] - bbox[:, :2]
-        bbox[:, :2] = bbox[:, :2] + bbox[:, 2:4] / 2.
-        sample['gt_bbox'] = bbox
-        return sample
-@register_op
-class PadBox(BaseOperator):
-    def __init__(self, num_max_boxes=50):
-        """
-        Pad zeros to bboxes if number of bboxes is less than num_max_boxes.
-        Args:
-            num_max_boxes (int): the max number of bboxes
-        """
-        self.num_max_boxes = num_max_boxes
-        super(PadBox, self).__init__()
-    def apply(self, sample, context=None):
-        assert 'gt_bbox' in sample
-        bbox = sample['gt_bbox']
-        gt_num = min(self.num_max_boxes, len(bbox))
-        num_max = self.num_max_boxes
-        # fields = context['fields'] if context else []
-        pad_bbox = np.zeros((num_max, 4), dtype=np.float32)
-        if gt_num > 0:
-            pad_bbox[:gt_num, :] = bbox[:gt_num, :]
-        sample['gt_bbox'] = pad_bbox
-        if 'gt_class' in sample:
-            pad_class = np.zeros((num_max, ), dtype=np.int32)
-            if gt_num > 0:
-                pad_class[:gt_num] = sample['gt_class'][:gt_num, 0]
-            sample['gt_class'] = pad_class
-        if 'gt_score' in sample:
-            pad_score = np.zeros((num_max, ), dtype=np.float32)
-            if gt_num > 0:
-                pad_score[:gt_num] = sample['gt_score'][:gt_num, 0]
-            sample['gt_score'] = pad_score
-        # in training, for example in op ExpandImage,
-        # the bbox and gt_class is expandded, but the difficult is not,
-        # so, judging by it's length
-        if 'difficult' in sample:
-            pad_diff = np.zeros((num_max, ), dtype=np.int32)
-            if gt_num > 0:
-                pad_diff[:gt_num] = sample['difficult'][:gt_num, 0]
-            sample['difficult'] = pad_diff
-        if 'is_crowd' in sample:
-            pad_crowd = np.zeros((num_max, ), dtype=np.int32)
-            if gt_num > 0:
-                pad_crowd[:gt_num] = sample['is_crowd'][:gt_num, 0]
-            sample['is_crowd'] = pad_crowd
-        if 'gt_ide' in sample:
-            pad_ide = np.zeros((num_max, ), dtype=np.int32)
-            if gt_num > 0:
-                pad_ide[:gt_num] = sample['gt_ide'][:gt_num, 0]
-            sample['gt_ide'] = pad_ide
-        return sample
-@register_op
-class DebugVisibleImage(BaseOperator):
-    """
-    In debug mode, visualize images according to `gt_box`.
-    (Currently only supported when not cropping and flipping image.)
-    """
-    def __init__(self, output_dir='output/debug', is_normalized=False):
-        super(DebugVisibleImage, self).__init__()
-        self.is_normalized = is_normalized
-        self.output_dir = output_dir
-        if not os.path.isdir(output_dir):
-            os.makedirs(output_dir)
-        if not isinstance(self.is_normalized, bool):
-            raise TypeError("{}: input type is invalid.".format(self))
-    def apply(self, sample, context=None):
-        image = Image.open(sample['im_file']).convert('RGB')
-        out_file_name = sample['im_file'].split('/')[-1]
-        width = sample['w']
-        height = sample['h']
-        gt_bbox = sample['gt_bbox']
-        gt_class = sample['gt_class']
-        draw = ImageDraw.Draw(image)
-        for i in range(gt_bbox.shape[0]):
-            if self.is_normalized:
-                gt_bbox[i][0] = gt_bbox[i][0] * width
-                gt_bbox[i][1] = gt_bbox[i][1] * height
-                gt_bbox[i][2] = gt_bbox[i][2] * width
-                gt_bbox[i][3] = gt_bbox[i][3] * height
-            xmin, ymin, xmax, ymax = gt_bbox[i]
-            draw.line(
-                [(xmin, ymin), (xmin, ymax), (xmax, ymax), (xmax, ymin),
-                 (xmin, ymin)],
-                width=2,
-                fill='green')
-            # draw label
-            text = str(gt_class[i][0])
-            tw, th = draw.textsize(text)
-            draw.rectangle(
-                [(xmin + 1, ymin - th), (xmin + tw + 1, ymin)], fill='green')
-            draw.text((xmin + 1, ymin - th), text, fill=(255, 255, 255))
-        if 'gt_keypoint' in sample.keys():
-            gt_keypoint = sample['gt_keypoint']
-            if self.is_normalized:
-                for i in range(gt_keypoint.shape[1]):
-                    if i % 2:
-                        gt_keypoint[:, i] = gt_keypoint[:, i] * height
-                    else:
-                        gt_keypoint[:, i] = gt_keypoint[:, i] * width
-            for i in range(gt_keypoint.shape[0]):
-                keypoint = gt_keypoint[i]
-                for j in range(int(keypoint.shape[0] / 2)):
-                    x1 = round(keypoint[2 * j]).astype(np.int32)
-                    y1 = round(keypoint[2 * j + 1]).astype(np.int32)
-                    draw.ellipse(
-                        (x1, y1, x1 + 5, y1 + 5),
-                        fill='green',
-                        outline='green')
-        save_path = os.path.join(self.output_dir, out_file_name)
-        image.save(save_path, quality=95)
-        return sample
-@register_op
-class Pad(BaseOperator):
-    def __init__(self,
-                 size=None,
-                 size_divisor=32,
-                 pad_mode=0,
-                 offsets=None,
-                 fill_value=(127.5, 127.5, 127.5)):
-        """
-        Pad image to a specified size or multiple of size_divisor.
-        Args:
-            size (int, Sequence): image target size, if None, pad to multiple of size_divisor, default None
-            size_divisor (int): size divisor, default 32
-            pad_mode (int): pad mode, currently only supports four modes [-1, 0, 1, 2]. if -1, use specified offsets
-                if 0, only pad to right and bottom. if 1, pad according to center. if 2, only pad left and top
-            offsets (list): [offset_x, offset_y], specify offset while padding, only supported pad_mode=-1
-            fill_value (bool): rgb value of pad area, default (127.5, 127.5, 127.5)
-        """
-        super(Pad, self).__init__()
-        if not isinstance(size, (int, Sequence)):
-            raise TypeError(
-                "Type of target_size is invalid when random_size is True. \
-                            Must be List, now is {}".format(type(size)))
-        if isinstance(size, int):
-            size = [size, size]
-        assert pad_mode in [
-            -1, 0, 1, 2
-        ], 'currently only supports four modes [-1, 0, 1, 2]'
-        assert pad_mode == -1 and offsets, 'if pad_mode is -1, offsets should not be None'
-        self.size = size
-        self.size_divisor = size_divisor
-        self.pad_mode = pad_mode
-        self.fill_value = fill_value
-        self.offsets = offsets
-    def apply_segm(self, segms, offsets, im_size, size):
-        def _expand_poly(poly, x, y):
-            expanded_poly = np.array(poly)
-            expanded_poly[0::2] += x
-            expanded_poly[1::2] += y
-            return expanded_poly.tolist()
-        def _expand_rle(rle, x, y, height, width, h, w):
-            if 'counts' in rle and type(rle['counts']) == list:
-                rle = mask_util.frPyObjects(rle, height, width)
-            mask = mask_util.decode(rle)
-            expanded_mask = np.full((h, w), 0).astype(mask.dtype)
-            expanded_mask[y:y + height, x:x + width] = mask
-            rle = mask_util.encode(
-                np.array(
-                    expanded_mask, order='F', dtype=np.uint8))
-            return rle
-        x, y = offsets
-        height, width = im_size
-        h, w = size
-        expanded_segms = []
-        for segm in segms:
-            if is_poly(segm):
-                # Polygon format
-                expanded_segms.append(
-                    [_expand_poly(poly, x, y) for poly in segm])
-            else:
-                # RLE format
-                import pycocotools.mask as mask_util
-                expanded_segms.append(
-                    _expand_rle(segm, x, y, height, width, h, w))
-        return expanded_segms
-    def apply_bbox(self, bbox, offsets):
-        return bbox + np.array(offsets * 2, dtype=np.float32)
-    def apply_keypoint(self, keypoints, offsets):
-        n = len(keypoints[0]) // 2
-        return keypoints + np.array(offsets * n, dtype=np.float32)
-    def apply_image(self, image, offsets, im_size, size):
-        x, y = offsets
-        im_h, im_w = im_size
-        h, w = size
-        canvas = np.ones((h, w, 3), dtype=np.float32)
-        canvas *= np.array(self.fill_value, dtype=np.float32)
-        canvas[y:y + im_h, x:x + im_w, :] = image.astype(np.float32)
-        return canvas
-    def apply(self, sample, context=None):
-        im = sample['image']
-        im_h, im_w = im.shape[:2]
-        if self.size:
-            h, w = self.size
-            assert (
-                im_h < h and im_w < w
-            ), '(h, w) of target size should be greater than (im_h, im_w)'
-        else:
-            h = np.ceil(im_h // self.size_divisor) * self.size_divisor
-            w = np.ceil(im_w / self.size_divisor) * self.size_divisor
-        if h == im_h and w == im_w:
-            return sample
-        if self.pad_mode == -1:
-            offset_x, offset_y = self.offsets
-        elif self.pad_mode == 0:
-            offset_y, offset_x = 0, 0
-        elif self.pad_mode == 1:
-            offset_y, offset_x = (h - im_h) // 2, (w - im_w) // 2
-        else:
-            offset_y, offset_x = h - im_h, w - im_w
-        offsets, im_size, size = [offset_x, offset_y], [im_h, im_w], [h, w]
-        sample['image'] = self.apply_image(im, offsets, im_size, size)
-        if self.pad_mode == 0:
-            return sample
-        if 'gt_bbox' in sample and len(sample['gt_bbox']) > 0:
-            sample['gt_bbox'] = self.apply_bbox(sample['gt_bbox'], offsets)
-        if 'gt_poly' in sample and len(sample['gt_poly']) > 0:
-            sample['gt_poly'] = self.apply_segm(sample['gt_poly'], offsets,
-                                                im_size, size)
-        if 'gt_keypoint' in sample and len(sample['gt_keypoint']) > 0:
-            sample['gt_keypoint'] = self.apply_keypoint(sample['gt_keypoint'],
-                                                        offsets)
-        return sample
-@register_op
-class Poly2Mask(BaseOperator):
-    """
-    gt poly to mask annotations
-    """
-    def __init__(self):
-        super(Poly2Mask, self).__init__()
-        import pycocotools.mask as maskUtils
-        self.maskutils = maskUtils
-    def _poly2mask(self, mask_ann, img_h, img_w):
-        if isinstance(mask_ann, list):
-            # polygon -- a single object might consist of multiple parts
-            # we merge all parts into one mask rle code
-            rles = self.maskutils.frPyObjects(mask_ann, img_h, img_w)
-            rle = self.maskutils.merge(rles)
-        elif isinstance(mask_ann['counts'], list):
-            # uncompressed RLE
-            rle = self.maskutils.frPyObjects(mask_ann, img_h, img_w)
-        else:
-            # rle
-            rle = mask_ann
-        mask = self.maskutils.decode(rle)
-        return mask
-    def apply(self, sample, context=None):
-        assert 'gt_poly' in sample
-        im_h = sample['h']
-        im_w = sample['w']
-        masks = [
-            self._poly2mask(gt_poly, im_h, im_w)
-            for gt_poly in sample['gt_poly']
-        ]
-        sample['gt_segm'] = np.asarray(masks).astype(np.uint8)
-        return sample
-@register_op
-class Rbox2Poly(BaseOperator):
-    """
-    Convert rbbox format to poly format.
-    """
-    def __init__(self):
-        super(Rbox2Poly, self).__init__()
-    def apply(self, sample, context=None):
-        assert 'gt_rbox' in sample
-        assert sample['gt_rbox'].shape[1] == 5
-        rrects = sample['gt_rbox']
-        x_ctr = rrects[:, 0]
-        y_ctr = rrects[:, 1]
-        width = rrects[:, 2]
-        height = rrects[:, 3]
-        x1 = x_ctr - width / 2.0
-        y1 = y_ctr - height / 2.0
-        x2 = x_ctr + width / 2.0
-        y2 = y_ctr + height / 2.0
-        sample['gt_bbox'] = np.stack([x1, y1, x2, y2], axis=1)
-        polys = bbox_utils.rbox2poly_np(rrects)
-        sample['gt_rbox2poly'] = polys
-        return sample
-@register_op
-class AugmentHSV(BaseOperator):
-    def __init__(self, fraction=0.50, is_bgr=False):
-        """
-        Augment the SV channel of image data.
-        Args:
-            fraction (float): the fraction for augment
-            is_bgr (bool): whether the image is BGR mode
-        """
-        super(AugmentHSV, self).__init__()
-        self.fraction = fraction
-        self.is_bgr = is_bgr
-    def apply(self, sample, context=None):
-        img = sample['image']
-        if self.is_bgr:
-            img_hsv = cv2.cvtColor(img, cv2.COLOR_BGR2HSV)
-        else:
-            img_hsv = cv2.cvtColor(img, cv2.COLOR_RGB2HSV)
-        S = img_hsv[:, :, 1].astype(np.float32)
-        V = img_hsv[:, :, 2].astype(np.float32)
-        a = (random.random() * 2 - 1) * self.fraction + 1
-        S *= a
-        if a > 1:
-            np.clip(S, a_min=0, a_max=255, out=S)
-        a = (random.random() * 2 - 1) * self.fraction + 1
-        V *= a
-        if a > 1:
-            np.clip(V, a_min=0, a_max=255, out=V)
-        img_hsv[:, :, 1] = S.astype(np.uint8)
-        img_hsv[:, :, 2] = V.astype(np.uint8)
-        if self.is_bgr:
-            cv2.cvtColor(img_hsv, cv2.COLOR_HSV2BGR, dst=img)
-        else:
-            cv2.cvtColor(img_hsv, cv2.COLOR_HSV2RGB, dst=img)
-        sample['image'] = img
-        return sample
-@register_op
-class Norm2PixelBbox(BaseOperator):
-    """
-    Transform the bounding box's coornidates which is in [0,1] to pixels.
-    """
-    def __init__(self):
-        super(Norm2PixelBbox, self).__init__()
-    def apply(self, sample, context=None):
-        assert 'gt_bbox' in sample
-        bbox = sample['gt_bbox']
-        height, width = sample['image'].shape[:2]
-        bbox[:, 0::2] = bbox[:, 0::2] * width
-        bbox[:, 1::2] = bbox[:, 1::2] * height
-        sample['gt_bbox'] = bbox
-        return sample
-@register_op
-class BboxCXCYWH2XYXY(BaseOperator):
-    """
-    Convert bbox CXCYWH format to XYXY format.
-    [center_x, center_y, width, height] -> [x0, y0, x1, y1]
-    """
-    def __init__(self):
-        super(BboxCXCYWH2XYXY, self).__init__()
-    def apply(self, sample, context=None):
-        assert 'gt_bbox' in sample
-        bbox0 = sample['gt_bbox']
-        bbox = bbox0.copy()
-        bbox[:, :2] = bbox0[:, :2] - bbox0[:, 2:4] / 2.
-        bbox[:, 2:4] = bbox0[:, :2] + bbox0[:, 2:4] / 2.
-        sample['gt_bbox'] = bbox
-        return sample

paddlex 2.0.0rc4__py3-none-any.whl → 3.0.0b2__py3-none-any.whl

paddlex 2.0.0rc4py3-none-any.whl → 3.0.0b2py3-none-any.whl