PyPI - paddlex - Versions diffs - 2.1.0__py3-none-any.whl → 3.0.0rc0__py3-none-any.whl - Mend

paddlex 2.1.0-py3-none-any.whl → 3.0.0rc0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (1708) hide show

paddlex/.version +1 -0
paddlex/__init__.py +52 -19
paddlex/__main__.py +39 -0
paddlex/configs/modules/3d_bev_detection/BEVFusion.yaml +38 -0
paddlex/configs/modules/doc_text_orientation/PP-LCNet_x1_0_doc_ori.yaml +41 -0
paddlex/configs/modules/face_detection/BlazeFace-FPN-SSH.yaml +40 -0
paddlex/configs/modules/face_detection/BlazeFace.yaml +40 -0
paddlex/configs/modules/face_detection/PP-YOLOE_plus-S_face.yaml +40 -0
paddlex/configs/modules/face_detection/PicoDet_LCNet_x2_5_face.yaml +40 -0
paddlex/configs/modules/face_feature/MobileFaceNet.yaml +41 -0
paddlex/configs/modules/face_feature/ResNet50_face.yaml +41 -0
paddlex/configs/modules/formula_recognition/LaTeX_OCR_rec.yaml +40 -0
paddlex/configs/modules/formula_recognition/PP-FormulaNet-L.yaml +40 -0
paddlex/configs/modules/formula_recognition/PP-FormulaNet-S.yaml +40 -0
paddlex/configs/modules/formula_recognition/UniMERNet.yaml +40 -0
paddlex/configs/modules/human_detection/PP-YOLOE-L_human.yaml +42 -0
paddlex/configs/modules/human_detection/PP-YOLOE-S_human.yaml +42 -0
paddlex/configs/modules/image_anomaly_detection/STFPM.yaml +41 -0
paddlex/configs/modules/image_classification/CLIP_vit_base_patch16_224.yaml +41 -0
paddlex/configs/modules/image_classification/CLIP_vit_large_patch14_224.yaml +41 -0
paddlex/configs/modules/image_classification/ConvNeXt_base_224.yaml +41 -0
paddlex/configs/modules/image_classification/ConvNeXt_base_384.yaml +41 -0
paddlex/configs/modules/image_classification/ConvNeXt_large_224.yaml +41 -0
paddlex/configs/modules/image_classification/ConvNeXt_large_384.yaml +41 -0
paddlex/configs/modules/image_classification/ConvNeXt_small.yaml +41 -0
paddlex/configs/modules/image_classification/ConvNeXt_tiny.yaml +41 -0
paddlex/configs/modules/image_classification/FasterNet-L.yaml +40 -0
paddlex/configs/modules/image_classification/FasterNet-M.yaml +40 -0
paddlex/configs/modules/image_classification/FasterNet-S.yaml +40 -0
paddlex/configs/modules/image_classification/FasterNet-T0.yaml +40 -0
paddlex/configs/modules/image_classification/FasterNet-T1.yaml +40 -0
paddlex/configs/modules/image_classification/FasterNet-T2.yaml +40 -0
paddlex/configs/modules/image_classification/MobileNetV1_x0_25.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV1_x0_5.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV1_x0_75.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV1_x1_0.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV2_x0_25.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV2_x0_5.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV2_x1_0.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV2_x1_5.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV2_x2_0.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_large_x0_35.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_large_x0_5.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_large_x0_75.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_large_x1_0.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_large_x1_25.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_small_x0_35.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_small_x0_5.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_small_x0_75.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_small_x1_0.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV3_small_x1_25.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV4_conv_large.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV4_conv_medium.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV4_conv_small.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV4_hybrid_large.yaml +41 -0
paddlex/configs/modules/image_classification/MobileNetV4_hybrid_medium.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNetV2-B0.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNetV2-B1.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNetV2-B2.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNetV2-B3.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNetV2-B4.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNetV2-B5.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNetV2-B6.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNet_base.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNet_small.yaml +41 -0
paddlex/configs/modules/image_classification/PP-HGNet_tiny.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNetV2_base.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNetV2_large.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNetV2_small.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x0_25.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x0_35.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x0_5.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x0_75.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x1_0.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x1_5.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x2_0.yaml +41 -0
paddlex/configs/modules/image_classification/PP-LCNet_x2_5.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet101.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet101_vd.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet152.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet152_vd.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet18.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet18_vd.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet200_vd.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet34.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet34_vd.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet50.yaml +41 -0
paddlex/configs/modules/image_classification/ResNet50_vd.yaml +41 -0
paddlex/configs/modules/image_classification/StarNet-S1.yaml +41 -0
paddlex/configs/modules/image_classification/StarNet-S2.yaml +41 -0
paddlex/configs/modules/image_classification/StarNet-S3.yaml +41 -0
paddlex/configs/modules/image_classification/StarNet-S4.yaml +41 -0
paddlex/configs/modules/image_classification/SwinTransformer_base_patch4_window12_384.yaml +41 -0
paddlex/configs/modules/image_classification/SwinTransformer_base_patch4_window7_224.yaml +41 -0
paddlex/configs/modules/image_classification/SwinTransformer_large_patch4_window12_384.yaml +41 -0
paddlex/configs/modules/image_classification/SwinTransformer_large_patch4_window7_224.yaml +41 -0
paddlex/configs/modules/image_classification/SwinTransformer_small_patch4_window7_224.yaml +41 -0
paddlex/configs/modules/image_classification/SwinTransformer_tiny_patch4_window7_224.yaml +41 -0
paddlex/configs/modules/image_feature/PP-ShiTuV2_rec.yaml +42 -0
paddlex/configs/modules/image_feature/PP-ShiTuV2_rec_CLIP_vit_base.yaml +42 -0
paddlex/configs/modules/image_feature/PP-ShiTuV2_rec_CLIP_vit_large.yaml +41 -0
paddlex/configs/modules/image_multilabel_classification/CLIP_vit_base_patch16_448_ML.yaml +41 -0
paddlex/configs/modules/image_multilabel_classification/PP-HGNetV2-B0_ML.yaml +41 -0
paddlex/configs/modules/image_multilabel_classification/PP-HGNetV2-B4_ML.yaml +41 -0
paddlex/configs/modules/image_multilabel_classification/PP-HGNetV2-B6_ML.yaml +41 -0
paddlex/configs/modules/image_multilabel_classification/PP-LCNet_x1_0_ML.yaml +41 -0
paddlex/configs/modules/image_multilabel_classification/ResNet50_ML.yaml +41 -0
paddlex/configs/modules/image_unwarping/UVDoc.yaml +12 -0
paddlex/configs/modules/instance_segmentation/Cascade-MaskRCNN-ResNet50-FPN.yaml +40 -0
paddlex/configs/modules/instance_segmentation/Cascade-MaskRCNN-ResNet50-vd-SSLDv2-FPN.yaml +40 -0
paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-H.yaml +40 -0
paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-L.yaml +40 -0
paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-M.yaml +40 -0
paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-S.yaml +40 -0
paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-X.yaml +40 -0
paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNeXt101-vd-FPN.yaml +39 -0
paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet101-FPN.yaml +40 -0
paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet101-vd-FPN.yaml +40 -0
paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet50-FPN.yaml +40 -0
paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet50-vd-FPN.yaml +40 -0
paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet50.yaml +40 -0
paddlex/configs/modules/instance_segmentation/PP-YOLOE_seg-S.yaml +40 -0
paddlex/configs/modules/instance_segmentation/SOLOv2.yaml +40 -0
paddlex/configs/modules/keypoint_detection/PP-TinyPose_128x96.yaml +40 -0
paddlex/configs/modules/keypoint_detection/PP-TinyPose_256x192.yaml +40 -0
paddlex/configs/modules/layout_detection/PP-DocLayout-L.yaml +40 -0
paddlex/configs/modules/layout_detection/PP-DocLayout-M.yaml +40 -0
paddlex/configs/modules/layout_detection/PP-DocLayout-S.yaml +40 -0
paddlex/configs/modules/layout_detection/PicoDet-L_layout_17cls.yaml +40 -0
paddlex/configs/modules/layout_detection/PicoDet-L_layout_3cls.yaml +40 -0
paddlex/configs/modules/layout_detection/PicoDet-S_layout_17cls.yaml +40 -0
paddlex/configs/modules/layout_detection/PicoDet-S_layout_3cls.yaml +40 -0
paddlex/configs/modules/layout_detection/PicoDet_layout_1x.yaml +40 -0
paddlex/configs/modules/layout_detection/PicoDet_layout_1x_table.yaml +40 -0
paddlex/configs/modules/layout_detection/RT-DETR-H_layout_17cls.yaml +40 -0
paddlex/configs/modules/layout_detection/RT-DETR-H_layout_3cls.yaml +40 -0
paddlex/configs/modules/mainbody_detection/PP-ShiTuV2_det.yaml +41 -0
paddlex/configs/modules/multilingual_speech_recognition/whisper_base.yaml +12 -0
paddlex/configs/modules/multilingual_speech_recognition/whisper_large.yaml +12 -0
paddlex/configs/modules/multilingual_speech_recognition/whisper_medium.yaml +12 -0
paddlex/configs/modules/multilingual_speech_recognition/whisper_small.yaml +12 -0
paddlex/configs/modules/multilingual_speech_recognition/whisper_tiny.yaml +12 -0
paddlex/configs/modules/object_detection/Cascade-FasterRCNN-ResNet50-FPN.yaml +41 -0
paddlex/configs/modules/object_detection/Cascade-FasterRCNN-ResNet50-vd-SSLDv2-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/CenterNet-DLA-34.yaml +41 -0
paddlex/configs/modules/object_detection/CenterNet-ResNet50.yaml +41 -0
paddlex/configs/modules/object_detection/Co-DINO-R50.yaml +40 -0
paddlex/configs/modules/object_detection/Co-DINO-Swin-L.yaml +40 -0
paddlex/configs/modules/object_detection/Co-Deformable-DETR-R50.yaml +40 -0
paddlex/configs/modules/object_detection/Co-Deformable-DETR-Swin-T.yaml +40 -0
paddlex/configs/modules/object_detection/DETR-R50.yaml +42 -0
paddlex/configs/modules/object_detection/FCOS-ResNet50.yaml +41 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNeXt101-vd-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNet101-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNet101.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNet34-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNet50-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNet50-vd-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNet50-vd-SSLDv2-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-ResNet50.yaml +42 -0
paddlex/configs/modules/object_detection/FasterRCNN-Swin-Tiny-FPN.yaml +42 -0
paddlex/configs/modules/object_detection/PP-YOLOE_plus-L.yaml +40 -0
paddlex/configs/modules/object_detection/PP-YOLOE_plus-M.yaml +40 -0
paddlex/configs/modules/object_detection/PP-YOLOE_plus-S.yaml +40 -0
paddlex/configs/modules/object_detection/PP-YOLOE_plus-X.yaml +40 -0
paddlex/configs/modules/object_detection/PicoDet-L.yaml +40 -0
paddlex/configs/modules/object_detection/PicoDet-M.yaml +42 -0
paddlex/configs/modules/object_detection/PicoDet-S.yaml +40 -0
paddlex/configs/modules/object_detection/PicoDet-XS.yaml +42 -0
paddlex/configs/modules/object_detection/RT-DETR-H.yaml +40 -0
paddlex/configs/modules/object_detection/RT-DETR-L.yaml +40 -0
paddlex/configs/modules/object_detection/RT-DETR-R18.yaml +40 -0
paddlex/configs/modules/object_detection/RT-DETR-R50.yaml +40 -0
paddlex/configs/modules/object_detection/RT-DETR-X.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOX-L.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOX-M.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOX-N.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOX-S.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOX-T.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOX-X.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOv3-DarkNet53.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOv3-MobileNetV3.yaml +40 -0
paddlex/configs/modules/object_detection/YOLOv3-ResNet50_vd_DCN.yaml +40 -0
paddlex/configs/modules/open_vocabulary_detection/GroundingDINO-T.yaml +13 -0
paddlex/configs/modules/open_vocabulary_segmentation/SAM-H_box.yaml +17 -0
paddlex/configs/modules/open_vocabulary_segmentation/SAM-H_point.yaml +15 -0
paddlex/configs/modules/pedestrian_attribute_recognition/PP-LCNet_x1_0_pedestrian_attribute.yaml +41 -0
paddlex/configs/modules/rotated_object_detection/PP-YOLOE-R-L.yaml +40 -0
paddlex/configs/modules/seal_text_detection/PP-OCRv4_mobile_seal_det.yaml +40 -0
paddlex/configs/modules/seal_text_detection/PP-OCRv4_server_seal_det.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/Deeplabv3-R101.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/Deeplabv3-R50.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/Deeplabv3_Plus-R101.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/Deeplabv3_Plus-R50.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/MaskFormer_small.yaml +42 -0
paddlex/configs/modules/semantic_segmentation/MaskFormer_tiny.yaml +42 -0
paddlex/configs/modules/semantic_segmentation/OCRNet_HRNet-W18.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/OCRNet_HRNet-W48.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/PP-LiteSeg-B.yaml +41 -0
paddlex/configs/modules/semantic_segmentation/PP-LiteSeg-T.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SeaFormer_base.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SeaFormer_large.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SeaFormer_small.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SeaFormer_tiny.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SegFormer-B0.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SegFormer-B1.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SegFormer-B2.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SegFormer-B3.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SegFormer-B4.yaml +40 -0
paddlex/configs/modules/semantic_segmentation/SegFormer-B5.yaml +40 -0
paddlex/configs/modules/small_object_detection/PP-YOLOE_plus_SOD-L.yaml +42 -0
paddlex/configs/modules/small_object_detection/PP-YOLOE_plus_SOD-S.yaml +42 -0
paddlex/configs/modules/small_object_detection/PP-YOLOE_plus_SOD-largesize-L.yaml +42 -0
paddlex/configs/modules/table_cells_detection/RT-DETR-L_wired_table_cell_det.yaml +40 -0
paddlex/configs/modules/table_cells_detection/RT-DETR-L_wireless_table_cell_det.yaml +40 -0
paddlex/configs/modules/table_classification/PP-LCNet_x1_0_table_cls.yaml +41 -0
paddlex/configs/modules/table_structure_recognition/SLANeXt_wired.yaml +39 -0
paddlex/configs/modules/table_structure_recognition/SLANeXt_wireless.yaml +39 -0
paddlex/configs/modules/table_structure_recognition/SLANet.yaml +39 -0
paddlex/configs/modules/table_structure_recognition/SLANet_plus.yaml +39 -0
paddlex/configs/modules/text_detection/PP-OCRv3_mobile_det.yaml +40 -0
paddlex/configs/modules/text_detection/PP-OCRv3_server_det.yaml +40 -0
paddlex/configs/modules/text_detection/PP-OCRv4_mobile_det.yaml +40 -0
paddlex/configs/modules/text_detection/PP-OCRv4_server_det.yaml +40 -0
paddlex/configs/modules/text_recognition/PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/PP-OCRv4_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/PP-OCRv4_server_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/PP-OCRv4_server_rec_doc.yaml +39 -0
paddlex/configs/modules/text_recognition/arabic_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/ch_RepSVTR_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/ch_SVTRv2_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/chinese_cht_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/cyrillic_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/devanagari_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/en_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/en_PP-OCRv4_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/japan_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/ka_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/korean_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/latin_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/ta_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/text_recognition/te_PP-OCRv3_mobile_rec.yaml +39 -0
paddlex/configs/modules/textline_orientation/PP-LCNet_x0_25_textline_ori.yaml +41 -0
paddlex/configs/modules/ts_anomaly_detection/AutoEncoder_ad.yaml +37 -0
paddlex/configs/modules/ts_anomaly_detection/DLinear_ad.yaml +37 -0
paddlex/configs/modules/ts_anomaly_detection/Nonstationary_ad.yaml +37 -0
paddlex/configs/modules/ts_anomaly_detection/PatchTST_ad.yaml +37 -0
paddlex/configs/modules/ts_anomaly_detection/TimesNet_ad.yaml +37 -0
paddlex/configs/modules/ts_classification/TimesNet_cls.yaml +37 -0
paddlex/configs/modules/ts_forecast/DLinear.yaml +38 -0
paddlex/configs/modules/ts_forecast/NLinear.yaml +38 -0
paddlex/configs/modules/ts_forecast/Nonstationary.yaml +38 -0
paddlex/configs/modules/ts_forecast/PatchTST.yaml +38 -0
paddlex/configs/modules/ts_forecast/RLinear.yaml +38 -0
paddlex/configs/modules/ts_forecast/TiDE.yaml +38 -0
paddlex/configs/modules/ts_forecast/TimesNet.yaml +38 -0
paddlex/configs/modules/vehicle_attribute_recognition/PP-LCNet_x1_0_vehicle_attribute.yaml +41 -0
paddlex/configs/modules/vehicle_detection/PP-YOLOE-L_vehicle.yaml +41 -0
paddlex/configs/modules/vehicle_detection/PP-YOLOE-S_vehicle.yaml +42 -0
paddlex/configs/modules/video_classification/PP-TSM-R50_8frames_uniform.yaml +42 -0
paddlex/configs/modules/video_classification/PP-TSMv2-LCNetV2_16frames_uniform.yaml +42 -0
paddlex/configs/modules/video_classification/PP-TSMv2-LCNetV2_8frames_uniform.yaml +42 -0
paddlex/configs/modules/video_detection/YOWO.yaml +40 -0
paddlex/configs/pipelines/3d_bev_detection.yaml +9 -0
paddlex/configs/pipelines/OCR.yaml +44 -0
paddlex/configs/pipelines/PP-ChatOCRv3-doc.yaml +149 -0
paddlex/configs/pipelines/PP-ChatOCRv4-doc.yaml +184 -0
paddlex/configs/pipelines/PP-ShiTuV2.yaml +18 -0
paddlex/configs/pipelines/PP-StructureV3.yaml +226 -0
paddlex/configs/pipelines/anomaly_detection.yaml +8 -0
paddlex/configs/pipelines/doc_preprocessor.yaml +15 -0
paddlex/configs/pipelines/face_recognition.yaml +18 -0
paddlex/configs/pipelines/formula_recognition.yaml +39 -0
paddlex/configs/pipelines/human_keypoint_detection.yaml +17 -0
paddlex/configs/pipelines/image_classification.yaml +10 -0
paddlex/configs/pipelines/image_multilabel_classification.yaml +9 -0
paddlex/configs/pipelines/instance_segmentation.yaml +10 -0
paddlex/configs/pipelines/layout_parsing.yaml +101 -0
paddlex/configs/pipelines/multilingual_speech_recognition.yaml +9 -0
paddlex/configs/pipelines/object_detection.yaml +10 -0
paddlex/configs/pipelines/open_vocabulary_detection.yaml +12 -0
paddlex/configs/pipelines/open_vocabulary_segmentation.yaml +13 -0
paddlex/configs/pipelines/pedestrian_attribute_recognition.yaml +15 -0
paddlex/configs/pipelines/rotated_object_detection.yaml +10 -0
paddlex/configs/pipelines/seal_recognition.yaml +51 -0
paddlex/configs/pipelines/semantic_segmentation.yaml +10 -0
paddlex/configs/pipelines/small_object_detection.yaml +10 -0
paddlex/configs/pipelines/table_recognition.yaml +56 -0
paddlex/configs/pipelines/table_recognition_v2.yaml +76 -0
paddlex/configs/pipelines/ts_anomaly_detection.yaml +8 -0
paddlex/configs/pipelines/ts_classification.yaml +8 -0
paddlex/configs/pipelines/ts_forecast.yaml +8 -0
paddlex/configs/pipelines/vehicle_attribute_recognition.yaml +15 -0
paddlex/configs/pipelines/video_classification.yaml +9 -0
paddlex/configs/pipelines/video_detection.yaml +10 -0
paddlex/engine.py +54 -0
paddlex/hpip_links.html +19 -0
paddlex/inference/__init__.py +19 -0
paddlex/inference/common/__init__.py +13 -0
paddlex/inference/common/batch_sampler/__init__.py +20 -0
paddlex/inference/common/batch_sampler/audio_batch_sampler.py +84 -0
paddlex/inference/common/batch_sampler/base_batch_sampler.py +90 -0
paddlex/inference/common/batch_sampler/det_3d_batch_sampler.py +147 -0
paddlex/inference/common/batch_sampler/image_batch_sampler.py +136 -0
paddlex/inference/common/batch_sampler/ts_batch_sampler.py +110 -0
paddlex/inference/common/batch_sampler/video_batch_sampler.py +94 -0
paddlex/inference/common/reader/__init__.py +19 -0
paddlex/inference/common/reader/audio_reader.py +46 -0
paddlex/inference/common/reader/det_3d_reader.py +239 -0
paddlex/inference/common/reader/image_reader.py +69 -0
paddlex/inference/common/reader/ts_reader.py +45 -0
paddlex/inference/common/reader/video_reader.py +42 -0
paddlex/inference/common/result/__init__.py +29 -0
paddlex/inference/common/result/base_cv_result.py +31 -0
paddlex/inference/common/result/base_result.py +70 -0
paddlex/inference/common/result/base_ts_result.py +42 -0
paddlex/inference/common/result/base_video_result.py +36 -0
paddlex/inference/common/result/mixin.py +703 -0
paddlex/inference/models/3d_bev_detection/__init__.py +15 -0
paddlex/inference/models/3d_bev_detection/predictor.py +314 -0
paddlex/inference/models/3d_bev_detection/processors.py +978 -0
paddlex/inference/models/3d_bev_detection/result.py +65 -0
paddlex/inference/models/3d_bev_detection/visualizer_3d.py +131 -0
paddlex/inference/models/__init__.py +130 -0
paddlex/inference/models/anomaly_detection/__init__.py +15 -0
paddlex/inference/models/anomaly_detection/predictor.py +145 -0
paddlex/inference/models/anomaly_detection/processors.py +46 -0
paddlex/inference/models/anomaly_detection/result.py +70 -0
paddlex/inference/models/base/__init__.py +15 -0
paddlex/inference/models/base/predictor/__init__.py +16 -0
paddlex/inference/models/base/predictor/base_predictor.py +175 -0
paddlex/inference/models/base/predictor/basic_predictor.py +139 -0
paddlex/inference/models/common/__init__.py +35 -0
paddlex/inference/models/common/static_infer.py +329 -0
paddlex/inference/models/common/tokenizer/__init__.py +17 -0
paddlex/inference/models/common/tokenizer/bert_tokenizer.py +655 -0
paddlex/inference/models/common/tokenizer/gpt_tokenizer.py +451 -0
paddlex/inference/models/common/tokenizer/tokenizer_utils.py +2141 -0
paddlex/inference/models/common/tokenizer/tokenizer_utils_base.py +3504 -0
paddlex/inference/models/common/tokenizer/utils.py +66 -0
paddlex/inference/models/common/tokenizer/vocab.py +647 -0
paddlex/inference/models/common/ts/__init__.py +15 -0
paddlex/inference/models/common/ts/funcs.py +533 -0
paddlex/inference/models/common/ts/processors.py +313 -0
paddlex/inference/models/common/vision/__init__.py +23 -0
paddlex/inference/models/common/vision/funcs.py +93 -0
paddlex/inference/models/common/vision/processors.py +270 -0
paddlex/inference/models/face_feature/__init__.py +15 -0
paddlex/inference/models/face_feature/predictor.py +65 -0
paddlex/inference/models/formula_recognition/__init__.py +15 -0
paddlex/inference/models/formula_recognition/predictor.py +203 -0
paddlex/inference/models/formula_recognition/processors.py +986 -0
paddlex/inference/models/formula_recognition/result.py +403 -0
paddlex/inference/models/image_classification/__init__.py +15 -0
paddlex/inference/models/image_classification/predictor.py +182 -0
paddlex/inference/models/image_classification/processors.py +87 -0
paddlex/inference/models/image_classification/result.py +92 -0
paddlex/inference/models/image_feature/__init__.py +15 -0
paddlex/inference/models/image_feature/predictor.py +156 -0
paddlex/inference/models/image_feature/processors.py +29 -0
paddlex/inference/models/image_feature/result.py +33 -0
paddlex/inference/models/image_multilabel_classification/__init__.py +15 -0
paddlex/inference/models/image_multilabel_classification/predictor.py +94 -0
paddlex/inference/models/image_multilabel_classification/processors.py +85 -0
paddlex/inference/models/image_multilabel_classification/result.py +95 -0
paddlex/inference/models/image_unwarping/__init__.py +15 -0
paddlex/inference/models/image_unwarping/predictor.py +105 -0
paddlex/inference/models/image_unwarping/processors.py +88 -0
paddlex/inference/models/image_unwarping/result.py +45 -0
paddlex/inference/models/instance_segmentation/__init__.py +15 -0
paddlex/inference/models/instance_segmentation/predictor.py +210 -0
paddlex/inference/models/instance_segmentation/processors.py +105 -0
paddlex/inference/models/instance_segmentation/result.py +161 -0
paddlex/inference/models/keypoint_detection/__init__.py +15 -0
paddlex/inference/models/keypoint_detection/predictor.py +188 -0
paddlex/inference/models/keypoint_detection/processors.py +359 -0
paddlex/inference/models/keypoint_detection/result.py +192 -0
paddlex/inference/models/multilingual_speech_recognition/__init__.py +15 -0
paddlex/inference/models/multilingual_speech_recognition/predictor.py +141 -0
paddlex/inference/models/multilingual_speech_recognition/processors.py +1941 -0
paddlex/inference/models/multilingual_speech_recognition/result.py +21 -0
paddlex/inference/models/object_detection/__init__.py +15 -0
paddlex/inference/models/object_detection/predictor.py +348 -0
paddlex/inference/models/object_detection/processors.py +855 -0
paddlex/inference/models/object_detection/result.py +113 -0
paddlex/inference/models/object_detection/utils.py +68 -0
paddlex/inference/models/open_vocabulary_detection/__init__.py +15 -0
paddlex/inference/models/open_vocabulary_detection/predictor.py +155 -0
paddlex/inference/models/open_vocabulary_detection/processors/__init__.py +15 -0
paddlex/inference/models/open_vocabulary_detection/processors/groundingdino_processors.py +485 -0
paddlex/inference/models/open_vocabulary_segmentation/__init__.py +15 -0
paddlex/inference/models/open_vocabulary_segmentation/predictor.py +120 -0
paddlex/inference/models/open_vocabulary_segmentation/processors/__init__.py +15 -0
paddlex/inference/models/open_vocabulary_segmentation/processors/sam_processer.py +249 -0
paddlex/inference/models/open_vocabulary_segmentation/results/__init__.py +15 -0
paddlex/inference/models/open_vocabulary_segmentation/results/sam_result.py +147 -0
paddlex/inference/models/semantic_segmentation/__init__.py +15 -0
paddlex/inference/models/semantic_segmentation/predictor.py +167 -0
paddlex/inference/models/semantic_segmentation/processors.py +114 -0
paddlex/inference/models/semantic_segmentation/result.py +72 -0
paddlex/inference/models/table_structure_recognition/__init__.py +15 -0
paddlex/inference/models/table_structure_recognition/predictor.py +171 -0
paddlex/inference/models/table_structure_recognition/processors.py +235 -0
paddlex/inference/models/table_structure_recognition/result.py +70 -0
paddlex/inference/models/text_detection/__init__.py +15 -0
paddlex/inference/models/text_detection/predictor.py +191 -0
paddlex/inference/models/text_detection/processors.py +466 -0
paddlex/inference/models/text_detection/result.py +51 -0
paddlex/inference/models/text_recognition/__init__.py +15 -0
paddlex/inference/models/text_recognition/predictor.py +106 -0
paddlex/inference/models/text_recognition/processors.py +231 -0
paddlex/inference/models/text_recognition/result.py +75 -0
paddlex/inference/models/ts_anomaly_detection/__init__.py +15 -0
paddlex/inference/models/ts_anomaly_detection/predictor.py +146 -0
paddlex/inference/models/ts_anomaly_detection/processors.py +94 -0
paddlex/inference/models/ts_anomaly_detection/result.py +72 -0
paddlex/inference/models/ts_classification/__init__.py +15 -0
paddlex/inference/models/ts_classification/predictor.py +135 -0
paddlex/inference/models/ts_classification/processors.py +117 -0
paddlex/inference/models/ts_classification/result.py +78 -0
paddlex/inference/models/ts_forecasting/__init__.py +15 -0
paddlex/inference/models/ts_forecasting/predictor.py +159 -0
paddlex/inference/models/ts_forecasting/processors.py +149 -0
paddlex/inference/models/ts_forecasting/result.py +83 -0
paddlex/inference/models/video_classification/__init__.py +15 -0
paddlex/inference/models/video_classification/predictor.py +147 -0
paddlex/inference/models/video_classification/processors.py +409 -0
paddlex/inference/models/video_classification/result.py +92 -0
paddlex/inference/models/video_detection/__init__.py +15 -0
paddlex/inference/models/video_detection/predictor.py +136 -0
paddlex/inference/models/video_detection/processors.py +450 -0
paddlex/inference/models/video_detection/result.py +104 -0
paddlex/inference/pipelines/3d_bev_detection/__init__.py +15 -0
paddlex/inference/pipelines/3d_bev_detection/pipeline.py +67 -0
paddlex/inference/pipelines/__init__.py +228 -0
paddlex/inference/pipelines/anomaly_detection/__init__.py +15 -0
paddlex/inference/pipelines/anomaly_detection/pipeline.py +62 -0
paddlex/inference/pipelines/attribute_recognition/__init__.py +15 -0
paddlex/inference/pipelines/attribute_recognition/pipeline.py +105 -0
paddlex/inference/pipelines/attribute_recognition/result.py +100 -0
paddlex/inference/pipelines/base.py +132 -0
paddlex/inference/pipelines/components/__init__.py +23 -0
paddlex/inference/pipelines/components/chat_server/__init__.py +16 -0
paddlex/inference/pipelines/components/chat_server/base.py +39 -0
paddlex/inference/pipelines/components/chat_server/openai_bot_chat.py +236 -0
paddlex/inference/pipelines/components/common/__init__.py +18 -0
paddlex/inference/pipelines/components/common/base_operator.py +36 -0
paddlex/inference/pipelines/components/common/base_result.py +65 -0
paddlex/inference/pipelines/components/common/convert_points_and_boxes.py +46 -0
paddlex/inference/pipelines/components/common/crop_image_regions.py +550 -0
paddlex/inference/pipelines/components/common/seal_det_warp.py +941 -0
paddlex/inference/pipelines/components/common/sort_boxes.py +83 -0
paddlex/inference/pipelines/components/faisser.py +352 -0
paddlex/inference/pipelines/components/prompt_engineering/__init__.py +16 -0
paddlex/inference/pipelines/components/prompt_engineering/base.py +35 -0
paddlex/inference/pipelines/components/prompt_engineering/generate_ensemble_prompt.py +127 -0
paddlex/inference/pipelines/components/prompt_engineering/generate_kie_prompt.py +148 -0
paddlex/inference/pipelines/components/retriever/__init__.py +16 -0
paddlex/inference/pipelines/components/retriever/base.py +226 -0
paddlex/inference/pipelines/components/retriever/openai_bot_retriever.py +70 -0
paddlex/inference/pipelines/components/retriever/qianfan_bot_retriever.py +163 -0
paddlex/inference/pipelines/components/utils/__init__.py +13 -0
paddlex/inference/pipelines/components/utils/mixin.py +206 -0
paddlex/inference/pipelines/doc_preprocessor/__init__.py +15 -0
paddlex/inference/pipelines/doc_preprocessor/pipeline.py +190 -0
paddlex/inference/pipelines/doc_preprocessor/result.py +103 -0
paddlex/inference/pipelines/face_recognition/__init__.py +15 -0
paddlex/inference/pipelines/face_recognition/pipeline.py +61 -0
paddlex/inference/pipelines/face_recognition/result.py +43 -0
paddlex/inference/pipelines/formula_recognition/__init__.py +15 -0
paddlex/inference/pipelines/formula_recognition/pipeline.py +303 -0
paddlex/inference/pipelines/formula_recognition/result.py +291 -0
paddlex/inference/pipelines/image_classification/__init__.py +15 -0
paddlex/inference/pipelines/image_classification/pipeline.py +71 -0
paddlex/inference/pipelines/image_multilabel_classification/__init__.py +15 -0
paddlex/inference/pipelines/image_multilabel_classification/pipeline.py +78 -0
paddlex/inference/pipelines/instance_segmentation/__init__.py +15 -0
paddlex/inference/pipelines/instance_segmentation/pipeline.py +70 -0
paddlex/inference/pipelines/keypoint_detection/__init__.py +15 -0
paddlex/inference/pipelines/keypoint_detection/pipeline.py +137 -0
paddlex/inference/pipelines/layout_parsing/__init__.py +16 -0
paddlex/inference/pipelines/layout_parsing/pipeline.py +570 -0
paddlex/inference/pipelines/layout_parsing/pipeline_v2.py +739 -0
paddlex/inference/pipelines/layout_parsing/result.py +203 -0
paddlex/inference/pipelines/layout_parsing/result_v2.py +470 -0
paddlex/inference/pipelines/layout_parsing/utils.py +2385 -0
paddlex/inference/pipelines/multilingual_speech_recognition/__init__.py +15 -0
paddlex/inference/pipelines/multilingual_speech_recognition/pipeline.py +67 -0
paddlex/inference/pipelines/object_detection/__init__.py +15 -0
paddlex/inference/pipelines/object_detection/pipeline.py +95 -0
paddlex/inference/pipelines/ocr/__init__.py +15 -0
paddlex/inference/pipelines/ocr/pipeline.py +389 -0
paddlex/inference/pipelines/ocr/result.py +248 -0
paddlex/inference/pipelines/open_vocabulary_detection/__init__.py +15 -0
paddlex/inference/pipelines/open_vocabulary_detection/pipeline.py +75 -0
paddlex/inference/pipelines/open_vocabulary_segmentation/__init__.py +15 -0
paddlex/inference/pipelines/open_vocabulary_segmentation/pipeline.py +89 -0
paddlex/inference/pipelines/pp_chatocr/__init__.py +16 -0
paddlex/inference/pipelines/pp_chatocr/pipeline_base.py +102 -0
paddlex/inference/pipelines/pp_chatocr/pipeline_v3.py +773 -0
paddlex/inference/pipelines/pp_chatocr/pipeline_v4.py +977 -0
paddlex/inference/pipelines/pp_shitu_v2/__init__.py +15 -0
paddlex/inference/pipelines/pp_shitu_v2/pipeline.py +152 -0
paddlex/inference/pipelines/pp_shitu_v2/result.py +126 -0
paddlex/inference/pipelines/rotated_object_detection/__init__.py +15 -0
paddlex/inference/pipelines/rotated_object_detection/pipeline.py +74 -0
paddlex/inference/pipelines/seal_recognition/__init__.py +15 -0
paddlex/inference/pipelines/seal_recognition/pipeline.py +271 -0
paddlex/inference/pipelines/seal_recognition/result.py +87 -0
paddlex/inference/pipelines/semantic_segmentation/__init__.py +15 -0
paddlex/inference/pipelines/semantic_segmentation/pipeline.py +74 -0
paddlex/inference/pipelines/small_object_detection/__init__.py +15 -0
paddlex/inference/pipelines/small_object_detection/pipeline.py +74 -0
paddlex/inference/pipelines/table_recognition/__init__.py +16 -0
paddlex/inference/pipelines/table_recognition/pipeline.py +462 -0
paddlex/inference/pipelines/table_recognition/pipeline_v2.py +792 -0
paddlex/inference/pipelines/table_recognition/result.py +216 -0
paddlex/inference/pipelines/table_recognition/table_recognition_post_processing.py +362 -0
paddlex/inference/pipelines/table_recognition/table_recognition_post_processing_v2.py +470 -0
paddlex/inference/pipelines/table_recognition/utils.py +44 -0
paddlex/inference/pipelines/ts_anomaly_detection/__init__.py +15 -0
paddlex/inference/pipelines/ts_anomaly_detection/pipeline.py +62 -0
paddlex/inference/pipelines/ts_classification/__init__.py +15 -0
paddlex/inference/pipelines/ts_classification/pipeline.py +62 -0
paddlex/inference/pipelines/ts_forecasting/__init__.py +15 -0
paddlex/inference/pipelines/ts_forecasting/pipeline.py +62 -0
paddlex/inference/pipelines/video_classification/__init__.py +15 -0
paddlex/inference/pipelines/video_classification/pipeline.py +68 -0
paddlex/inference/pipelines/video_detection/__init__.py +15 -0
paddlex/inference/pipelines/video_detection/pipeline.py +73 -0
paddlex/inference/serving/__init__.py +13 -0
paddlex/inference/serving/basic_serving/__init__.py +18 -0
paddlex/inference/serving/basic_serving/_app.py +209 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/__init__.py +41 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/_common/__init__.py +13 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/_common/common.py +96 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/_common/image_recognition.py +36 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/_common/ocr.py +90 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/anomaly_detection.py +64 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/doc_preprocessor.py +97 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/face_recognition.py +223 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/formula_recognition.py +97 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/human_keypoint_detection.py +78 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/image_classification.py +66 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/image_multilabel_classification.py +70 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/instance_segmentation.py +81 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/layout_parsing.py +115 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/m_3d_bev_detection.py +76 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/multilingual_speech_recognition.py +89 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/object_detection.py +74 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/ocr.py +99 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/open_vocabulary_detection.py +78 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/open_vocabulary_segmentation.py +85 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/pedestrian_attribute_recognition.py +81 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/pp_chatocrv3_doc.py +191 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/pp_chatocrv4_doc.py +221 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/pp_shituv2.py +218 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/pp_structurev3.py +136 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/rotated_object_detection.py +78 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/seal_recognition.py +103 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/semantic_segmentation.py +64 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/small_object_detection.py +69 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/table_recognition.py +105 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/table_recognition_v2.py +107 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/ts_anomaly_detection.py +62 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/ts_classification.py +61 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/ts_forecast.py +62 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/vehicle_attribute_recognition.py +81 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/video_classification.py +73 -0
paddlex/inference/serving/basic_serving/_pipeline_apps/video_detection.py +89 -0
paddlex/inference/serving/basic_serving/_server.py +35 -0
paddlex/inference/serving/infra/__init__.py +13 -0
paddlex/inference/serving/infra/config.py +36 -0
paddlex/inference/serving/infra/models.py +72 -0
paddlex/inference/serving/infra/storage.py +175 -0
paddlex/inference/serving/infra/utils.py +259 -0
paddlex/inference/serving/schemas/__init__.py +13 -0
paddlex/inference/serving/schemas/anomaly_detection.py +39 -0
paddlex/inference/serving/schemas/doc_preprocessor.py +54 -0
paddlex/inference/serving/schemas/face_recognition.py +124 -0
paddlex/inference/serving/schemas/formula_recognition.py +56 -0
paddlex/inference/serving/schemas/human_keypoint_detection.py +55 -0
paddlex/inference/serving/schemas/image_classification.py +45 -0
paddlex/inference/serving/schemas/image_multilabel_classification.py +47 -0
paddlex/inference/serving/schemas/instance_segmentation.py +53 -0
paddlex/inference/serving/schemas/layout_parsing.py +72 -0
paddlex/inference/serving/schemas/m_3d_bev_detection.py +48 -0
paddlex/inference/serving/schemas/multilingual_speech_recognition.py +57 -0
paddlex/inference/serving/schemas/object_detection.py +52 -0
paddlex/inference/serving/schemas/ocr.py +60 -0
paddlex/inference/serving/schemas/open_vocabulary_detection.py +52 -0
paddlex/inference/serving/schemas/open_vocabulary_segmentation.py +52 -0
paddlex/inference/serving/schemas/pedestrian_attribute_recognition.py +61 -0
paddlex/inference/serving/schemas/pp_chatocrv3_doc.py +134 -0
paddlex/inference/serving/schemas/pp_chatocrv4_doc.py +151 -0
paddlex/inference/serving/schemas/pp_shituv2.py +124 -0
paddlex/inference/serving/schemas/pp_structurev3.py +84 -0
paddlex/inference/serving/schemas/rotated_object_detection.py +52 -0
paddlex/inference/serving/schemas/seal_recognition.py +62 -0
paddlex/inference/serving/schemas/semantic_segmentation.py +45 -0
paddlex/inference/serving/schemas/shared/__init__.py +13 -0
paddlex/inference/serving/schemas/shared/classification.py +23 -0
paddlex/inference/serving/schemas/shared/image_segmentation.py +28 -0
paddlex/inference/serving/schemas/shared/object_detection.py +24 -0
paddlex/inference/serving/schemas/shared/ocr.py +25 -0
paddlex/inference/serving/schemas/small_object_detection.py +52 -0
paddlex/inference/serving/schemas/table_recognition.py +64 -0
paddlex/inference/serving/schemas/table_recognition_v2.py +66 -0
paddlex/inference/serving/schemas/ts_anomaly_detection.py +37 -0
paddlex/inference/serving/schemas/ts_classification.py +38 -0
paddlex/inference/serving/schemas/ts_forecast.py +37 -0
paddlex/inference/serving/schemas/vehicle_attribute_recognition.py +61 -0
paddlex/inference/serving/schemas/video_classification.py +44 -0
paddlex/inference/serving/schemas/video_detection.py +56 -0
paddlex/inference/utils/__init__.py +13 -0
paddlex/inference/utils/benchmark.py +226 -0
paddlex/inference/utils/color_map.py +123 -0
paddlex/inference/utils/get_pipeline_path.py +27 -0
paddlex/inference/utils/io/__init__.py +36 -0
paddlex/inference/utils/io/readers.py +500 -0
paddlex/inference/utils/io/style.py +374 -0
paddlex/inference/utils/io/tablepyxl.py +149 -0
paddlex/inference/utils/io/writers.py +459 -0
paddlex/inference/utils/new_ir_blacklist.py +28 -0
paddlex/inference/utils/official_models.py +352 -0
paddlex/inference/utils/pp_option.py +256 -0
paddlex/model.py +113 -0
paddlex/modules/3d_bev_detection/__init__.py +18 -0
paddlex/modules/3d_bev_detection/dataset_checker/__init__.py +95 -0
paddlex/modules/3d_bev_detection/dataset_checker/dataset_src/__init__.py +17 -0
paddlex/modules/3d_bev_detection/dataset_checker/dataset_src/analyse_dataset.py +106 -0
paddlex/modules/3d_bev_detection/dataset_checker/dataset_src/check_dataset.py +102 -0
paddlex/modules/3d_bev_detection/evaluator.py +46 -0
paddlex/modules/3d_bev_detection/exportor.py +22 -0
paddlex/modules/3d_bev_detection/model_list.py +18 -0
paddlex/modules/3d_bev_detection/trainer.py +70 -0
paddlex/modules/__init__.py +138 -0
paddlex/modules/anomaly_detection/__init__.py +18 -0
paddlex/modules/anomaly_detection/dataset_checker/__init__.py +95 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/analyse_dataset.py +79 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/check_dataset.py +87 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/convert_dataset.py +230 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/split_dataset.py +87 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/anomaly_detection/dataset_checker/dataset_src/utils/visualizer.py +71 -0
paddlex/modules/anomaly_detection/evaluator.py +58 -0
paddlex/modules/anomaly_detection/exportor.py +22 -0
paddlex/modules/anomaly_detection/model_list.py +16 -0
paddlex/modules/anomaly_detection/trainer.py +71 -0
paddlex/modules/base/__init__.py +18 -0
paddlex/modules/base/build_model.py +34 -0
paddlex/modules/base/dataset_checker/__init__.py +16 -0
paddlex/modules/base/dataset_checker/dataset_checker.py +169 -0
paddlex/modules/base/dataset_checker/utils.py +110 -0
paddlex/modules/base/evaluator.py +170 -0
paddlex/modules/base/exportor.py +146 -0
paddlex/modules/base/trainer.py +134 -0
paddlex/modules/face_recognition/__init__.py +18 -0
paddlex/modules/face_recognition/dataset_checker/__init__.py +71 -0
paddlex/modules/face_recognition/dataset_checker/dataset_src/__init__.py +16 -0
paddlex/modules/face_recognition/dataset_checker/dataset_src/check_dataset.py +174 -0
paddlex/modules/face_recognition/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/face_recognition/dataset_checker/dataset_src/utils/visualizer.py +156 -0
paddlex/modules/face_recognition/evaluator.py +52 -0
paddlex/modules/face_recognition/exportor.py +22 -0
paddlex/modules/face_recognition/model_list.py +15 -0
paddlex/modules/face_recognition/trainer.py +75 -0
paddlex/modules/formula_recognition/__init__.py +18 -0
paddlex/modules/formula_recognition/dataset_checker/__init__.py +113 -0
paddlex/modules/formula_recognition/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/formula_recognition/dataset_checker/dataset_src/analyse_dataset.py +157 -0
paddlex/modules/formula_recognition/dataset_checker/dataset_src/check_dataset.py +80 -0
paddlex/modules/formula_recognition/dataset_checker/dataset_src/convert_dataset.py +94 -0
paddlex/modules/formula_recognition/dataset_checker/dataset_src/split_dataset.py +81 -0
paddlex/modules/formula_recognition/evaluator.py +77 -0
paddlex/modules/formula_recognition/exportor.py +22 -0
paddlex/modules/formula_recognition/model_list.py +20 -0
paddlex/modules/formula_recognition/trainer.py +121 -0
paddlex/modules/general_recognition/__init__.py +18 -0
paddlex/modules/general_recognition/dataset_checker/__init__.py +107 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/analyse_dataset.py +98 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/check_dataset.py +100 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/convert_dataset.py +99 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/split_dataset.py +82 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/general_recognition/dataset_checker/dataset_src/utils/visualizer.py +150 -0
paddlex/modules/general_recognition/evaluator.py +31 -0
paddlex/modules/general_recognition/exportor.py +22 -0
paddlex/modules/general_recognition/model_list.py +19 -0
paddlex/modules/general_recognition/trainer.py +52 -0
paddlex/modules/image_classification/__init__.py +18 -0
paddlex/modules/image_classification/dataset_checker/__init__.py +104 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/analyse_dataset.py +93 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/check_dataset.py +131 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/convert_dataset.py +51 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/split_dataset.py +81 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/image_classification/dataset_checker/dataset_src/utils/visualizer.py +156 -0
paddlex/modules/image_classification/evaluator.py +43 -0
paddlex/modules/image_classification/exportor.py +22 -0
paddlex/modules/image_classification/model_list.py +99 -0
paddlex/modules/image_classification/trainer.py +82 -0
paddlex/modules/image_unwarping/__init__.py +13 -0
paddlex/modules/image_unwarping/model_list.py +17 -0
paddlex/modules/instance_segmentation/__init__.py +18 -0
paddlex/modules/instance_segmentation/dataset_checker/__init__.py +108 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/analyse_dataset.py +78 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/check_dataset.py +92 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/convert_dataset.py +241 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/split_dataset.py +119 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/instance_segmentation/dataset_checker/dataset_src/utils/visualizer.py +221 -0
paddlex/modules/instance_segmentation/evaluator.py +32 -0
paddlex/modules/instance_segmentation/exportor.py +22 -0
paddlex/modules/instance_segmentation/model_list.py +33 -0
paddlex/modules/instance_segmentation/trainer.py +31 -0
paddlex/modules/keypoint_detection/__init__.py +18 -0
paddlex/modules/keypoint_detection/dataset_checker/__init__.py +56 -0
paddlex/modules/keypoint_detection/dataset_checker/dataset_src/__init__.py +15 -0
paddlex/modules/keypoint_detection/dataset_checker/dataset_src/check_dataset.py +86 -0
paddlex/modules/keypoint_detection/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/keypoint_detection/dataset_checker/dataset_src/utils/visualizer.py +119 -0
paddlex/modules/keypoint_detection/evaluator.py +41 -0
paddlex/modules/keypoint_detection/exportor.py +22 -0
paddlex/modules/keypoint_detection/model_list.py +16 -0
paddlex/modules/keypoint_detection/trainer.py +39 -0
paddlex/modules/multilabel_classification/__init__.py +18 -0
paddlex/modules/multilabel_classification/dataset_checker/__init__.py +106 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/analyse_dataset.py +95 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/check_dataset.py +131 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/convert_dataset.py +117 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/split_dataset.py +81 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/multilabel_classification/dataset_checker/dataset_src/utils/visualizer.py +153 -0
paddlex/modules/multilabel_classification/evaluator.py +43 -0
paddlex/modules/multilabel_classification/exportor.py +22 -0
paddlex/modules/multilabel_classification/model_list.py +24 -0
paddlex/modules/multilabel_classification/trainer.py +85 -0
paddlex/modules/multilingual_speech_recognition/__init__.py +18 -0
paddlex/modules/multilingual_speech_recognition/dataset_checker.py +27 -0
paddlex/modules/multilingual_speech_recognition/evaluator.py +27 -0
paddlex/modules/multilingual_speech_recognition/exportor.py +27 -0
paddlex/modules/multilingual_speech_recognition/model_list.py +22 -0
paddlex/modules/multilingual_speech_recognition/trainer.py +40 -0
paddlex/modules/object_detection/__init__.py +18 -0
paddlex/modules/object_detection/dataset_checker/__init__.py +115 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/analyse_dataset.py +80 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/check_dataset.py +86 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/convert_dataset.py +433 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/split_dataset.py +119 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/object_detection/dataset_checker/dataset_src/utils/visualizer.py +192 -0
paddlex/modules/object_detection/evaluator.py +52 -0
paddlex/modules/object_detection/exportor.py +22 -0
paddlex/modules/object_detection/model_list.py +84 -0
paddlex/modules/object_detection/trainer.py +99 -0
paddlex/modules/open_vocabulary_detection/__init__.py +18 -0
paddlex/modules/open_vocabulary_detection/dataset_checker.py +29 -0
paddlex/modules/open_vocabulary_detection/evaluator.py +29 -0
paddlex/modules/open_vocabulary_detection/exportor.py +29 -0
paddlex/modules/open_vocabulary_detection/model_list.py +18 -0
paddlex/modules/open_vocabulary_detection/trainer.py +42 -0
paddlex/modules/open_vocabulary_segmentation/__init__.py +18 -0
paddlex/modules/open_vocabulary_segmentation/dataset_checker.py +29 -0
paddlex/modules/open_vocabulary_segmentation/evaluator.py +29 -0
paddlex/modules/open_vocabulary_segmentation/exportor.py +29 -0
paddlex/modules/open_vocabulary_segmentation/model_list.py +19 -0
paddlex/modules/open_vocabulary_segmentation/trainer.py +42 -0
paddlex/modules/semantic_segmentation/__init__.py +18 -0
paddlex/modules/semantic_segmentation/dataset_checker/__init__.py +110 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/analyse_dataset.py +73 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/check_dataset.py +80 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/convert_dataset.py +162 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/split_dataset.py +87 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/utils/__init__.py +13 -0
paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/utils/visualizer.py +71 -0
paddlex/modules/semantic_segmentation/evaluator.py +58 -0
paddlex/modules/semantic_segmentation/exportor.py +31 -0
paddlex/modules/semantic_segmentation/model_list.py +37 -0
paddlex/modules/semantic_segmentation/trainer.py +73 -0
paddlex/modules/table_recognition/__init__.py +18 -0
paddlex/modules/table_recognition/dataset_checker/__init__.py +98 -0
paddlex/modules/table_recognition/dataset_checker/dataset_src/__init__.py +18 -0
paddlex/modules/table_recognition/dataset_checker/dataset_src/analyse_dataset.py +58 -0
paddlex/modules/table_recognition/dataset_checker/dataset_src/check_dataset.py +86 -0
paddlex/modules/table_recognition/dataset_checker/dataset_src/split_dataset.py +79 -0
paddlex/modules/table_recognition/evaluator.py +43 -0
paddlex/modules/table_recognition/exportor.py +22 -0
paddlex/modules/table_recognition/model_list.py +21 -0
paddlex/modules/table_recognition/trainer.py +70 -0
paddlex/modules/text_detection/__init__.py +18 -0
paddlex/modules/text_detection/dataset_checker/__init__.py +109 -0
paddlex/modules/text_detection/dataset_checker/dataset_src/__init__.py +18 -0
paddlex/modules/text_detection/dataset_checker/dataset_src/analyse_dataset.py +217 -0
paddlex/modules/text_detection/dataset_checker/dataset_src/check_dataset.py +106 -0
paddlex/modules/text_detection/dataset_checker/dataset_src/split_dataset.py +140 -0
paddlex/modules/text_detection/evaluator.py +41 -0
paddlex/modules/text_detection/exportor.py +22 -0
paddlex/modules/text_detection/model_list.py +24 -0
paddlex/modules/text_detection/trainer.py +68 -0
paddlex/modules/text_recognition/__init__.py +18 -0
paddlex/modules/text_recognition/dataset_checker/__init__.py +126 -0
paddlex/modules/text_recognition/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/text_recognition/dataset_checker/dataset_src/analyse_dataset.py +161 -0
paddlex/modules/text_recognition/dataset_checker/dataset_src/check_dataset.py +107 -0
paddlex/modules/text_recognition/dataset_checker/dataset_src/convert_dataset.py +94 -0
paddlex/modules/text_recognition/dataset_checker/dataset_src/split_dataset.py +81 -0
paddlex/modules/text_recognition/evaluator.py +64 -0
paddlex/modules/text_recognition/exportor.py +22 -0
paddlex/modules/text_recognition/model_list.py +34 -0
paddlex/modules/text_recognition/trainer.py +106 -0
paddlex/modules/ts_anomaly_detection/__init__.py +19 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/__init__.py +112 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/analyse_dataset.py +27 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/check_dataset.py +64 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/convert_dataset.py +78 -0
paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/split_dataset.py +63 -0
paddlex/modules/ts_anomaly_detection/evaluator.py +67 -0
paddlex/modules/ts_anomaly_detection/exportor.py +45 -0
paddlex/modules/ts_anomaly_detection/model_list.py +22 -0
paddlex/modules/ts_anomaly_detection/trainer.py +113 -0
paddlex/modules/ts_classification/__init__.py +19 -0
paddlex/modules/ts_classification/dataset_checker/__init__.py +112 -0
paddlex/modules/ts_classification/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/ts_classification/dataset_checker/dataset_src/analyse_dataset.py +74 -0
paddlex/modules/ts_classification/dataset_checker/dataset_src/check_dataset.py +64 -0
paddlex/modules/ts_classification/dataset_checker/dataset_src/convert_dataset.py +78 -0
paddlex/modules/ts_classification/dataset_checker/dataset_src/split_dataset.py +88 -0
paddlex/modules/ts_classification/evaluator.py +66 -0
paddlex/modules/ts_classification/exportor.py +45 -0
paddlex/modules/ts_classification/model_list.py +18 -0
paddlex/modules/ts_classification/trainer.py +108 -0
paddlex/modules/ts_forecast/__init__.py +19 -0
paddlex/modules/ts_forecast/dataset_checker/__init__.py +112 -0
paddlex/modules/ts_forecast/dataset_checker/dataset_src/__init__.py +19 -0
paddlex/modules/ts_forecast/dataset_checker/dataset_src/analyse_dataset.py +27 -0
paddlex/modules/ts_forecast/dataset_checker/dataset_src/check_dataset.py +64 -0
paddlex/modules/ts_forecast/dataset_checker/dataset_src/convert_dataset.py +77 -0
paddlex/modules/ts_forecast/dataset_checker/dataset_src/split_dataset.py +63 -0
paddlex/modules/ts_forecast/evaluator.py +66 -0
paddlex/modules/ts_forecast/exportor.py +45 -0
paddlex/modules/ts_forecast/model_list.py +24 -0
paddlex/modules/ts_forecast/trainer.py +108 -0
paddlex/modules/video_classification/__init__.py +18 -0
paddlex/modules/video_classification/dataset_checker/__init__.py +93 -0
paddlex/modules/video_classification/dataset_checker/dataset_src/__init__.py +18 -0
paddlex/modules/video_classification/dataset_checker/dataset_src/analyse_dataset.py +93 -0
paddlex/modules/video_classification/dataset_checker/dataset_src/check_dataset.py +121 -0
paddlex/modules/video_classification/dataset_checker/dataset_src/split_dataset.py +82 -0
paddlex/modules/video_classification/evaluator.py +44 -0
paddlex/modules/video_classification/exportor.py +22 -0
paddlex/modules/video_classification/model_list.py +19 -0
paddlex/modules/video_classification/trainer.py +88 -0
paddlex/modules/video_detection/__init__.py +18 -0
paddlex/modules/video_detection/dataset_checker/__init__.py +86 -0
paddlex/modules/video_detection/dataset_checker/dataset_src/__init__.py +17 -0
paddlex/modules/video_detection/dataset_checker/dataset_src/analyse_dataset.py +101 -0
paddlex/modules/video_detection/dataset_checker/dataset_src/check_dataset.py +134 -0
paddlex/modules/video_detection/evaluator.py +42 -0
paddlex/modules/video_detection/exportor.py +22 -0
paddlex/modules/video_detection/model_list.py +15 -0
paddlex/modules/video_detection/trainer.py +82 -0
paddlex/ops/__init__.py +149 -0
paddlex/ops/iou3d_nms/iou3d_cpu.cpp +264 -0
paddlex/ops/iou3d_nms/iou3d_cpu.h +27 -0
paddlex/ops/iou3d_nms/iou3d_nms.cpp +204 -0
paddlex/ops/iou3d_nms/iou3d_nms.h +33 -0
paddlex/ops/iou3d_nms/iou3d_nms_api.cpp +108 -0
paddlex/ops/iou3d_nms/iou3d_nms_kernel.cu +482 -0
paddlex/ops/setup.py +37 -0
paddlex/ops/voxel/voxelize_op.cc +191 -0
paddlex/ops/voxel/voxelize_op.cu +346 -0
paddlex/paddle2onnx_requirements.txt +1 -0
paddlex/paddlex_cli.py +464 -0
paddlex/repo_apis/Paddle3D_api/__init__.py +17 -0
paddlex/repo_apis/Paddle3D_api/bev_fusion/__init__.py +18 -0
paddlex/repo_apis/Paddle3D_api/bev_fusion/config.py +118 -0
paddlex/repo_apis/Paddle3D_api/bev_fusion/model.py +238 -0
paddlex/repo_apis/Paddle3D_api/bev_fusion/register.py +55 -0
paddlex/repo_apis/Paddle3D_api/bev_fusion/runner.py +104 -0
paddlex/repo_apis/Paddle3D_api/pp3d_config.py +144 -0
paddlex/repo_apis/PaddleClas_api/__init__.py +17 -0
paddlex/repo_apis/PaddleClas_api/cls/__init__.py +19 -0
paddlex/repo_apis/PaddleClas_api/cls/config.py +594 -0
paddlex/repo_apis/PaddleClas_api/cls/model.py +355 -0
paddlex/repo_apis/PaddleClas_api/cls/register.py +908 -0
paddlex/repo_apis/PaddleClas_api/cls/runner.py +219 -0
paddlex/repo_apis/PaddleClas_api/shitu_rec/__init__.py +18 -0
paddlex/repo_apis/PaddleClas_api/shitu_rec/config.py +141 -0
paddlex/repo_apis/PaddleClas_api/shitu_rec/model.py +23 -0
paddlex/repo_apis/PaddleClas_api/shitu_rec/register.py +68 -0
paddlex/repo_apis/PaddleClas_api/shitu_rec/runner.py +55 -0
paddlex/repo_apis/PaddleDetection_api/__init__.py +17 -0
paddlex/repo_apis/PaddleDetection_api/config_helper.py +280 -0
paddlex/repo_apis/PaddleDetection_api/instance_seg/__init__.py +18 -0
paddlex/repo_apis/PaddleDetection_api/instance_seg/config.py +458 -0
paddlex/repo_apis/PaddleDetection_api/instance_seg/model.py +403 -0
paddlex/repo_apis/PaddleDetection_api/instance_seg/register.py +263 -0
paddlex/repo_apis/PaddleDetection_api/instance_seg/runner.py +226 -0
paddlex/repo_apis/PaddleDetection_api/object_det/__init__.py +19 -0
paddlex/repo_apis/PaddleDetection_api/object_det/config.py +539 -0
paddlex/repo_apis/PaddleDetection_api/object_det/model.py +430 -0
paddlex/repo_apis/PaddleDetection_api/object_det/official_categories.py +220 -0
paddlex/repo_apis/PaddleDetection_api/object_det/register.py +1106 -0
paddlex/repo_apis/PaddleDetection_api/object_det/runner.py +226 -0
paddlex/repo_apis/PaddleNLP_api/__init__.py +13 -0
paddlex/repo_apis/PaddleOCR_api/__init__.py +21 -0
paddlex/repo_apis/PaddleOCR_api/config_utils.py +53 -0
paddlex/repo_apis/PaddleOCR_api/formula_rec/__init__.py +16 -0
paddlex/repo_apis/PaddleOCR_api/formula_rec/config.py +570 -0
paddlex/repo_apis/PaddleOCR_api/formula_rec/model.py +402 -0
paddlex/repo_apis/PaddleOCR_api/formula_rec/register.py +73 -0
paddlex/repo_apis/PaddleOCR_api/formula_rec/runner.py +240 -0
paddlex/repo_apis/PaddleOCR_api/table_rec/__init__.py +16 -0
paddlex/repo_apis/PaddleOCR_api/table_rec/config.py +64 -0
paddlex/repo_apis/PaddleOCR_api/table_rec/model.py +126 -0
paddlex/repo_apis/PaddleOCR_api/table_rec/register.py +71 -0
paddlex/repo_apis/PaddleOCR_api/table_rec/runner.py +51 -0
paddlex/repo_apis/PaddleOCR_api/text_det/__init__.py +16 -0
paddlex/repo_apis/PaddleOCR_api/text_det/config.py +62 -0
paddlex/repo_apis/PaddleOCR_api/text_det/model.py +72 -0
paddlex/repo_apis/PaddleOCR_api/text_det/register.py +90 -0
paddlex/repo_apis/PaddleOCR_api/text_det/runner.py +53 -0
paddlex/repo_apis/PaddleOCR_api/text_rec/__init__.py +16 -0
paddlex/repo_apis/PaddleOCR_api/text_rec/config.py +563 -0
paddlex/repo_apis/PaddleOCR_api/text_rec/model.py +402 -0
paddlex/repo_apis/PaddleOCR_api/text_rec/register.py +199 -0
paddlex/repo_apis/PaddleOCR_api/text_rec/runner.py +240 -0
paddlex/repo_apis/PaddleSeg_api/__init__.py +16 -0
paddlex/repo_apis/PaddleSeg_api/base_seg_config.py +134 -0
paddlex/repo_apis/PaddleSeg_api/seg/__init__.py +16 -0
paddlex/repo_apis/PaddleSeg_api/seg/config.py +186 -0
paddlex/repo_apis/PaddleSeg_api/seg/model.py +491 -0
paddlex/repo_apis/PaddleSeg_api/seg/register.py +273 -0
paddlex/repo_apis/PaddleSeg_api/seg/runner.py +262 -0
paddlex/repo_apis/PaddleTS_api/__init__.py +19 -0
paddlex/repo_apis/PaddleTS_api/ts_ad/__init__.py +16 -0
paddlex/repo_apis/PaddleTS_api/ts_ad/config.py +89 -0
paddlex/repo_apis/PaddleTS_api/ts_ad/register.py +146 -0
paddlex/repo_apis/PaddleTS_api/ts_ad/runner.py +158 -0
paddlex/repo_apis/PaddleTS_api/ts_base/__init__.py +13 -0
paddlex/repo_apis/PaddleTS_api/ts_base/config.py +246 -0
paddlex/repo_apis/PaddleTS_api/ts_base/model.py +276 -0
paddlex/repo_apis/PaddleTS_api/ts_base/runner.py +158 -0
paddlex/repo_apis/PaddleTS_api/ts_cls/__init__.py +16 -0
paddlex/repo_apis/PaddleTS_api/ts_cls/config.py +73 -0
paddlex/repo_apis/PaddleTS_api/ts_cls/register.py +59 -0
paddlex/repo_apis/PaddleTS_api/ts_cls/runner.py +158 -0
paddlex/repo_apis/PaddleTS_api/ts_fc/__init__.py +16 -0
paddlex/repo_apis/PaddleTS_api/ts_fc/config.py +137 -0
paddlex/repo_apis/PaddleTS_api/ts_fc/register.py +186 -0
paddlex/repo_apis/PaddleVideo_api/__init__.py +17 -0
paddlex/repo_apis/PaddleVideo_api/config_utils.py +51 -0
paddlex/repo_apis/PaddleVideo_api/video_cls/__init__.py +19 -0
paddlex/repo_apis/PaddleVideo_api/video_cls/config.py +547 -0
paddlex/repo_apis/PaddleVideo_api/video_cls/model.py +346 -0
paddlex/repo_apis/PaddleVideo_api/video_cls/register.py +71 -0
paddlex/repo_apis/PaddleVideo_api/video_cls/runner.py +205 -0
paddlex/repo_apis/PaddleVideo_api/video_det/__init__.py +19 -0
paddlex/repo_apis/PaddleVideo_api/video_det/config.py +548 -0
paddlex/repo_apis/PaddleVideo_api/video_det/model.py +298 -0
paddlex/repo_apis/PaddleVideo_api/video_det/register.py +45 -0
paddlex/repo_apis/PaddleVideo_api/video_det/runner.py +200 -0
paddlex/repo_apis/__init__.py +13 -0
paddlex/repo_apis/base/__init__.py +23 -0
paddlex/repo_apis/base/config.py +238 -0
paddlex/repo_apis/base/model.py +571 -0
paddlex/repo_apis/base/register.py +135 -0
paddlex/repo_apis/base/runner.py +391 -0
paddlex/repo_apis/base/utils/__init__.py +13 -0
paddlex/repo_apis/base/utils/arg.py +64 -0
paddlex/repo_apis/base/utils/subprocess.py +107 -0
paddlex/repo_manager/__init__.py +24 -0
paddlex/repo_manager/core.py +271 -0
paddlex/repo_manager/meta.py +170 -0
paddlex/repo_manager/repo.py +415 -0
paddlex/repo_manager/requirements.txt +21 -0
paddlex/repo_manager/utils.py +359 -0
paddlex/serving_requirements.txt +9 -0
paddlex/utils/__init__.py +1 -12
paddlex/utils/cache.py +148 -0
paddlex/utils/config.py +215 -0
paddlex/utils/custom_device_whitelist.py +457 -0
paddlex/utils/device.py +151 -0
paddlex/utils/download.py +168 -182
paddlex/utils/env.py +11 -50
paddlex/utils/errors/__init__.py +17 -0
paddlex/utils/errors/dataset_checker.py +78 -0
paddlex/utils/errors/others.py +152 -0
paddlex/utils/file_interface.py +212 -0
paddlex/utils/flags.py +65 -0
paddlex/utils/fonts/__init__.py +67 -0
paddlex/utils/func_register.py +41 -0
paddlex/utils/interactive_get_pipeline.py +55 -0
paddlex/utils/lazy_loader.py +68 -0
paddlex/utils/logging.py +131 -33
paddlex/utils/misc.py +201 -0
paddlex/utils/pipeline_arguments.py +711 -0
paddlex/utils/result_saver.py +59 -0
paddlex/utils/subclass_register.py +101 -0
paddlex/version.py +54 -0
paddlex-3.0.0rc0.dist-info/LICENSE +169 -0
paddlex-3.0.0rc0.dist-info/METADATA +1035 -0
paddlex-3.0.0rc0.dist-info/RECORD +1015 -0
paddlex-3.0.0rc0.dist-info/WHEEL +5 -0
paddlex-3.0.0rc0.dist-info/entry_points.txt +2 -0
paddlex-3.0.0rc0.dist-info/top_level.txt +1 -0
PaddleClas/__init__.py +0 -16
PaddleClas/deploy/__init__.py +0 -1
PaddleClas/deploy/paddleserving/__init__.py +0 -0
PaddleClas/deploy/paddleserving/classification_web_service.py +0 -74
PaddleClas/deploy/paddleserving/cpu_utilization.py +0 -4
PaddleClas/deploy/paddleserving/pipeline_http_client.py +0 -20
PaddleClas/deploy/paddleserving/pipeline_rpc_client.py +0 -33
PaddleClas/deploy/paddleserving/recognition/__init__.py +0 -0
PaddleClas/deploy/paddleserving/recognition/pipeline_http_client.py +0 -21
PaddleClas/deploy/paddleserving/recognition/pipeline_rpc_client.py +0 -34
PaddleClas/deploy/paddleserving/recognition/recognition_web_service.py +0 -209
PaddleClas/deploy/python/__init__.py +0 -0
PaddleClas/deploy/python/build_gallery.py +0 -214
PaddleClas/deploy/python/det_preprocess.py +0 -205
PaddleClas/deploy/python/postprocess.py +0 -161
PaddleClas/deploy/python/predict_cls.py +0 -142
PaddleClas/deploy/python/predict_det.py +0 -158
PaddleClas/deploy/python/predict_rec.py +0 -138
PaddleClas/deploy/python/predict_system.py +0 -144
PaddleClas/deploy/python/preprocess.py +0 -337
PaddleClas/deploy/utils/__init__.py +0 -5
PaddleClas/deploy/utils/config.py +0 -197
PaddleClas/deploy/utils/draw_bbox.py +0 -61
PaddleClas/deploy/utils/encode_decode.py +0 -31
PaddleClas/deploy/utils/get_image_list.py +0 -49
PaddleClas/deploy/utils/logger.py +0 -120
PaddleClas/deploy/utils/predictor.py +0 -71
PaddleClas/deploy/vector_search/__init__.py +0 -1
PaddleClas/deploy/vector_search/interface.py +0 -272
PaddleClas/deploy/vector_search/test.py +0 -34
PaddleClas/hubconf.py +0 -788
PaddleClas/paddleclas.py +0 -552
PaddleClas/ppcls/__init__.py +0 -20
PaddleClas/ppcls/arch/__init__.py +0 -127
PaddleClas/ppcls/arch/backbone/__init__.py +0 -80
PaddleClas/ppcls/arch/backbone/base/__init__.py +0 -0
PaddleClas/ppcls/arch/backbone/base/theseus_layer.py +0 -126
PaddleClas/ppcls/arch/backbone/legendary_models/__init__.py +0 -6
PaddleClas/ppcls/arch/backbone/legendary_models/esnet.py +0 -355
PaddleClas/ppcls/arch/backbone/legendary_models/hrnet.py +0 -744
PaddleClas/ppcls/arch/backbone/legendary_models/inception_v3.py +0 -539
PaddleClas/ppcls/arch/backbone/legendary_models/mobilenet_v1.py +0 -234
PaddleClas/ppcls/arch/backbone/legendary_models/mobilenet_v3.py +0 -561
PaddleClas/ppcls/arch/backbone/legendary_models/pp_lcnet.py +0 -399
PaddleClas/ppcls/arch/backbone/legendary_models/resnet.py +0 -534
PaddleClas/ppcls/arch/backbone/legendary_models/vgg.py +0 -231
PaddleClas/ppcls/arch/backbone/model_zoo/__init__.py +0 -0
PaddleClas/ppcls/arch/backbone/model_zoo/alexnet.py +0 -168
PaddleClas/ppcls/arch/backbone/model_zoo/cspnet.py +0 -376
PaddleClas/ppcls/arch/backbone/model_zoo/darknet.py +0 -197
PaddleClas/ppcls/arch/backbone/model_zoo/densenet.py +0 -344
PaddleClas/ppcls/arch/backbone/model_zoo/distilled_vision_transformer.py +0 -272
PaddleClas/ppcls/arch/backbone/model_zoo/dla.py +0 -528
PaddleClas/ppcls/arch/backbone/model_zoo/dpn.py +0 -451
PaddleClas/ppcls/arch/backbone/model_zoo/efficientnet.py +0 -976
PaddleClas/ppcls/arch/backbone/model_zoo/ghostnet.py +0 -363
PaddleClas/ppcls/arch/backbone/model_zoo/googlenet.py +0 -229
PaddleClas/ppcls/arch/backbone/model_zoo/gvt.py +0 -693
PaddleClas/ppcls/arch/backbone/model_zoo/hardnet.py +0 -293
PaddleClas/ppcls/arch/backbone/model_zoo/inception_v4.py +0 -477
PaddleClas/ppcls/arch/backbone/model_zoo/levit.py +0 -589
PaddleClas/ppcls/arch/backbone/model_zoo/mixnet.py +0 -815
PaddleClas/ppcls/arch/backbone/model_zoo/mobilenet_v2.py +0 -287
PaddleClas/ppcls/arch/backbone/model_zoo/rednet.py +0 -203
PaddleClas/ppcls/arch/backbone/model_zoo/regnet.py +0 -431
PaddleClas/ppcls/arch/backbone/model_zoo/repvgg.py +0 -422
PaddleClas/ppcls/arch/backbone/model_zoo/res2net.py +0 -264
PaddleClas/ppcls/arch/backbone/model_zoo/res2net_vd.py +0 -305
PaddleClas/ppcls/arch/backbone/model_zoo/resnest.py +0 -740
PaddleClas/ppcls/arch/backbone/model_zoo/resnet_vc.py +0 -309
PaddleClas/ppcls/arch/backbone/model_zoo/resnext.py +0 -298
PaddleClas/ppcls/arch/backbone/model_zoo/resnext101_wsl.py +0 -490
PaddleClas/ppcls/arch/backbone/model_zoo/resnext_vd.py +0 -317
PaddleClas/ppcls/arch/backbone/model_zoo/rexnet.py +0 -281
PaddleClas/ppcls/arch/backbone/model_zoo/se_resnet_vd.py +0 -390
PaddleClas/ppcls/arch/backbone/model_zoo/se_resnext.py +0 -364
PaddleClas/ppcls/arch/backbone/model_zoo/se_resnext_vd.py +0 -309
PaddleClas/ppcls/arch/backbone/model_zoo/shufflenet_v2.py +0 -362
PaddleClas/ppcls/arch/backbone/model_zoo/squeezenet.py +0 -194
PaddleClas/ppcls/arch/backbone/model_zoo/swin_transformer.py +0 -857
PaddleClas/ppcls/arch/backbone/model_zoo/tnt.py +0 -385
PaddleClas/ppcls/arch/backbone/model_zoo/vision_transformer.py +0 -495
PaddleClas/ppcls/arch/backbone/model_zoo/xception.py +0 -377
PaddleClas/ppcls/arch/backbone/model_zoo/xception_deeplab.py +0 -421
PaddleClas/ppcls/arch/backbone/variant_models/__init__.py +0 -3
PaddleClas/ppcls/arch/backbone/variant_models/pp_lcnet_variant.py +0 -29
PaddleClas/ppcls/arch/backbone/variant_models/resnet_variant.py +0 -23
PaddleClas/ppcls/arch/backbone/variant_models/vgg_variant.py +0 -28
PaddleClas/ppcls/arch/gears/__init__.py +0 -32
PaddleClas/ppcls/arch/gears/arcmargin.py +0 -72
PaddleClas/ppcls/arch/gears/circlemargin.py +0 -59
PaddleClas/ppcls/arch/gears/cosmargin.py +0 -55
PaddleClas/ppcls/arch/gears/fc.py +0 -35
PaddleClas/ppcls/arch/gears/identity_head.py +0 -9
PaddleClas/ppcls/arch/gears/vehicle_neck.py +0 -52
PaddleClas/ppcls/arch/utils.py +0 -53
PaddleClas/ppcls/data/__init__.py +0 -144
PaddleClas/ppcls/data/dataloader/DistributedRandomIdentitySampler.py +0 -90
PaddleClas/ppcls/data/dataloader/__init__.py +0 -9
PaddleClas/ppcls/data/dataloader/common_dataset.py +0 -84
PaddleClas/ppcls/data/dataloader/dali.py +0 -319
PaddleClas/ppcls/data/dataloader/icartoon_dataset.py +0 -36
PaddleClas/ppcls/data/dataloader/imagenet_dataset.py +0 -38
PaddleClas/ppcls/data/dataloader/logo_dataset.py +0 -46
PaddleClas/ppcls/data/dataloader/mix_dataset.py +0 -49
PaddleClas/ppcls/data/dataloader/mix_sampler.py +0 -79
PaddleClas/ppcls/data/dataloader/multilabel_dataset.py +0 -59
PaddleClas/ppcls/data/dataloader/pk_sampler.py +0 -105
PaddleClas/ppcls/data/dataloader/vehicle_dataset.py +0 -138
PaddleClas/ppcls/data/postprocess/__init__.py +0 -41
PaddleClas/ppcls/data/postprocess/topk.py +0 -85
PaddleClas/ppcls/data/preprocess/__init__.py +0 -100
PaddleClas/ppcls/data/preprocess/batch_ops/__init__.py +0 -1
PaddleClas/ppcls/data/preprocess/batch_ops/batch_operators.py +0 -231
PaddleClas/ppcls/data/preprocess/ops/__init__.py +0 -1
PaddleClas/ppcls/data/preprocess/ops/autoaugment.py +0 -264
PaddleClas/ppcls/data/preprocess/ops/cutout.py +0 -41
PaddleClas/ppcls/data/preprocess/ops/fmix.py +0 -217
PaddleClas/ppcls/data/preprocess/ops/functional.py +0 -138
PaddleClas/ppcls/data/preprocess/ops/grid.py +0 -89
PaddleClas/ppcls/data/preprocess/ops/hide_and_seek.py +0 -44
PaddleClas/ppcls/data/preprocess/ops/operators.py +0 -384
PaddleClas/ppcls/data/preprocess/ops/randaugment.py +0 -106
PaddleClas/ppcls/data/preprocess/ops/random_erasing.py +0 -90
PaddleClas/ppcls/data/preprocess/ops/timm_autoaugment.py +0 -877
PaddleClas/ppcls/data/utils/__init__.py +0 -13
PaddleClas/ppcls/data/utils/get_image_list.py +0 -49
PaddleClas/ppcls/engine/__init__.py +0 -0
PaddleClas/ppcls/engine/engine.py +0 -436
PaddleClas/ppcls/engine/evaluation/__init__.py +0 -16
PaddleClas/ppcls/engine/evaluation/classification.py +0 -143
PaddleClas/ppcls/engine/evaluation/retrieval.py +0 -169
PaddleClas/ppcls/engine/slim/__init__.py +0 -16
PaddleClas/ppcls/engine/slim/prune.py +0 -66
PaddleClas/ppcls/engine/slim/quant.py +0 -55
PaddleClas/ppcls/engine/train/__init__.py +0 -14
PaddleClas/ppcls/engine/train/train.py +0 -79
PaddleClas/ppcls/engine/train/utils.py +0 -72
PaddleClas/ppcls/loss/__init__.py +0 -65
PaddleClas/ppcls/loss/celoss.py +0 -67
PaddleClas/ppcls/loss/centerloss.py +0 -54
PaddleClas/ppcls/loss/comfunc.py +0 -45
PaddleClas/ppcls/loss/deephashloss.py +0 -92
PaddleClas/ppcls/loss/distanceloss.py +0 -43
PaddleClas/ppcls/loss/distillationloss.py +0 -141
PaddleClas/ppcls/loss/dmlloss.py +0 -46
PaddleClas/ppcls/loss/emlloss.py +0 -97
PaddleClas/ppcls/loss/googlenetloss.py +0 -41
PaddleClas/ppcls/loss/msmloss.py +0 -78
PaddleClas/ppcls/loss/multilabelloss.py +0 -43
PaddleClas/ppcls/loss/npairsloss.py +0 -38
PaddleClas/ppcls/loss/pairwisecosface.py +0 -55
PaddleClas/ppcls/loss/supconloss.py +0 -108
PaddleClas/ppcls/loss/trihardloss.py +0 -82
PaddleClas/ppcls/loss/triplet.py +0 -137
PaddleClas/ppcls/metric/__init__.py +0 -51
PaddleClas/ppcls/metric/metrics.py +0 -308
PaddleClas/ppcls/optimizer/__init__.py +0 -72
PaddleClas/ppcls/optimizer/learning_rate.py +0 -326
PaddleClas/ppcls/optimizer/optimizer.py +0 -207
PaddleClas/ppcls/utils/__init__.py +0 -27
PaddleClas/ppcls/utils/check.py +0 -151
PaddleClas/ppcls/utils/config.py +0 -210
PaddleClas/ppcls/utils/download.py +0 -319
PaddleClas/ppcls/utils/ema.py +0 -63
PaddleClas/ppcls/utils/logger.py +0 -137
PaddleClas/ppcls/utils/metrics.py +0 -107
PaddleClas/ppcls/utils/misc.py +0 -63
PaddleClas/ppcls/utils/model_zoo.py +0 -213
PaddleClas/ppcls/utils/profiler.py +0 -111
PaddleClas/ppcls/utils/save_load.py +0 -136
PaddleClas/setup.py +0 -58
PaddleClas/tools/__init__.py +0 -15
PaddleClas/tools/eval.py +0 -31
PaddleClas/tools/export_model.py +0 -34
PaddleClas/tools/infer.py +0 -31
PaddleClas/tools/train.py +0 -32
paddlex/cls.py +0 -82
paddlex/command.py +0 -215
paddlex/cv/__init__.py +0 -17
paddlex/cv/datasets/__init__.py +0 -18
paddlex/cv/datasets/coco.py +0 -208
paddlex/cv/datasets/imagenet.py +0 -88
paddlex/cv/datasets/seg_dataset.py +0 -91
paddlex/cv/datasets/voc.py +0 -445
paddlex/cv/models/__init__.py +0 -18
paddlex/cv/models/base.py +0 -631
paddlex/cv/models/classifier.py +0 -989
paddlex/cv/models/detector.py +0 -2292
paddlex/cv/models/load_model.py +0 -148
paddlex/cv/models/segmenter.py +0 -768
paddlex/cv/models/slim/__init__.py +0 -13
paddlex/cv/models/slim/prune.py +0 -55
paddlex/cv/models/utils/__init__.py +0 -13
paddlex/cv/models/utils/det_metrics/__init__.py +0 -15
paddlex/cv/models/utils/det_metrics/coco_utils.py +0 -476
paddlex/cv/models/utils/det_metrics/metrics.py +0 -220
paddlex/cv/models/utils/infer_nets.py +0 -45
paddlex/cv/models/utils/seg_metrics.py +0 -62
paddlex/cv/models/utils/visualize.py +0 -399
paddlex/cv/transforms/__init__.py +0 -46
paddlex/cv/transforms/batch_operators.py +0 -286
paddlex/cv/transforms/box_utils.py +0 -41
paddlex/cv/transforms/functions.py +0 -193
paddlex/cv/transforms/operators.py +0 -1402
paddlex/deploy.py +0 -268
paddlex/det.py +0 -49
paddlex/paddleseg/__init__.py +0 -17
paddlex/paddleseg/core/__init__.py +0 -20
paddlex/paddleseg/core/infer.py +0 -289
paddlex/paddleseg/core/predict.py +0 -145
paddlex/paddleseg/core/train.py +0 -258
paddlex/paddleseg/core/val.py +0 -172
paddlex/paddleseg/cvlibs/__init__.py +0 -17
paddlex/paddleseg/cvlibs/callbacks.py +0 -279
paddlex/paddleseg/cvlibs/config.py +0 -359
paddlex/paddleseg/cvlibs/manager.py +0 -142
paddlex/paddleseg/cvlibs/param_init.py +0 -91
paddlex/paddleseg/datasets/__init__.py +0 -21
paddlex/paddleseg/datasets/ade.py +0 -112
paddlex/paddleseg/datasets/cityscapes.py +0 -86
paddlex/paddleseg/datasets/cocostuff.py +0 -79
paddlex/paddleseg/datasets/dataset.py +0 -164
paddlex/paddleseg/datasets/mini_deep_globe_road_extraction.py +0 -95
paddlex/paddleseg/datasets/optic_disc_seg.py +0 -97
paddlex/paddleseg/datasets/pascal_context.py +0 -80
paddlex/paddleseg/datasets/voc.py +0 -113
paddlex/paddleseg/models/__init__.py +0 -39
paddlex/paddleseg/models/ann.py +0 -436
paddlex/paddleseg/models/attention_unet.py +0 -189
paddlex/paddleseg/models/backbones/__init__.py +0 -18
paddlex/paddleseg/models/backbones/hrnet.py +0 -815
paddlex/paddleseg/models/backbones/mobilenetv3.py +0 -365
paddlex/paddleseg/models/backbones/resnet_vd.py +0 -364
paddlex/paddleseg/models/backbones/xception_deeplab.py +0 -415
paddlex/paddleseg/models/bisenet.py +0 -311
paddlex/paddleseg/models/danet.py +0 -220
paddlex/paddleseg/models/decoupled_segnet.py +0 -233
paddlex/paddleseg/models/deeplab.py +0 -258
paddlex/paddleseg/models/dnlnet.py +0 -231
paddlex/paddleseg/models/emanet.py +0 -219
paddlex/paddleseg/models/fast_scnn.py +0 -318
paddlex/paddleseg/models/fcn.py +0 -135
paddlex/paddleseg/models/gcnet.py +0 -223
paddlex/paddleseg/models/gscnn.py +0 -357
paddlex/paddleseg/models/hardnet.py +0 -309
paddlex/paddleseg/models/isanet.py +0 -202
paddlex/paddleseg/models/layers/__init__.py +0 -19
paddlex/paddleseg/models/layers/activation.py +0 -73
paddlex/paddleseg/models/layers/attention.py +0 -146
paddlex/paddleseg/models/layers/layer_libs.py +0 -168
paddlex/paddleseg/models/layers/nonlocal2d.py +0 -155
paddlex/paddleseg/models/layers/pyramid_pool.py +0 -182
paddlex/paddleseg/models/losses/__init__.py +0 -27
paddlex/paddleseg/models/losses/binary_cross_entropy_loss.py +0 -174
paddlex/paddleseg/models/losses/bootstrapped_cross_entropy.py +0 -73
paddlex/paddleseg/models/losses/cross_entropy_loss.py +0 -94
paddlex/paddleseg/models/losses/decoupledsegnet_relax_boundary_loss.py +0 -129
paddlex/paddleseg/models/losses/dice_loss.py +0 -61
paddlex/paddleseg/models/losses/edge_attention_loss.py +0 -78
paddlex/paddleseg/models/losses/gscnn_dual_task_loss.py +0 -141
paddlex/paddleseg/models/losses/l1_loss.py +0 -76
paddlex/paddleseg/models/losses/lovasz_loss.py +0 -222
paddlex/paddleseg/models/losses/mean_square_error_loss.py +0 -65
paddlex/paddleseg/models/losses/mixed_loss.py +0 -58
paddlex/paddleseg/models/losses/ohem_cross_entropy_loss.py +0 -99
paddlex/paddleseg/models/losses/ohem_edge_attention_loss.py +0 -114
paddlex/paddleseg/models/ocrnet.py +0 -248
paddlex/paddleseg/models/pspnet.py +0 -147
paddlex/paddleseg/models/sfnet.py +0 -236
paddlex/paddleseg/models/shufflenet_slim.py +0 -268
paddlex/paddleseg/models/u2net.py +0 -574
paddlex/paddleseg/models/unet.py +0 -155
paddlex/paddleseg/models/unet_3plus.py +0 -316
paddlex/paddleseg/models/unet_plusplus.py +0 -237
paddlex/paddleseg/transforms/__init__.py +0 -16
paddlex/paddleseg/transforms/functional.py +0 -161
paddlex/paddleseg/transforms/transforms.py +0 -937
paddlex/paddleseg/utils/__init__.py +0 -22
paddlex/paddleseg/utils/config_check.py +0 -60
paddlex/paddleseg/utils/download.py +0 -163
paddlex/paddleseg/utils/env/__init__.py +0 -16
paddlex/paddleseg/utils/env/seg_env.py +0 -56
paddlex/paddleseg/utils/env/sys_env.py +0 -122
paddlex/paddleseg/utils/logger.py +0 -48
paddlex/paddleseg/utils/metrics.py +0 -146
paddlex/paddleseg/utils/progbar.py +0 -212
paddlex/paddleseg/utils/timer.py +0 -53
paddlex/paddleseg/utils/utils.py +0 -120
paddlex/paddleseg/utils/visualize.py +0 -90
paddlex/ppcls/__init__.py +0 -20
paddlex/ppcls/arch/__init__.py +0 -127
paddlex/ppcls/arch/backbone/__init__.py +0 -80
paddlex/ppcls/arch/backbone/base/__init__.py +0 -0
paddlex/ppcls/arch/backbone/base/theseus_layer.py +0 -130
paddlex/ppcls/arch/backbone/legendary_models/__init__.py +0 -6
paddlex/ppcls/arch/backbone/legendary_models/esnet.py +0 -355
paddlex/ppcls/arch/backbone/legendary_models/hrnet.py +0 -748
paddlex/ppcls/arch/backbone/legendary_models/inception_v3.py +0 -539
paddlex/ppcls/arch/backbone/legendary_models/mobilenet_v1.py +0 -234
paddlex/ppcls/arch/backbone/legendary_models/mobilenet_v3.py +0 -561
paddlex/ppcls/arch/backbone/legendary_models/pp_lcnet.py +0 -399
paddlex/ppcls/arch/backbone/legendary_models/resnet.py +0 -534
paddlex/ppcls/arch/backbone/legendary_models/vgg.py +0 -235
paddlex/ppcls/arch/backbone/model_zoo/__init__.py +0 -0
paddlex/ppcls/arch/backbone/model_zoo/alexnet.py +0 -168
paddlex/ppcls/arch/backbone/model_zoo/cspnet.py +0 -376
paddlex/ppcls/arch/backbone/model_zoo/darknet.py +0 -197
paddlex/ppcls/arch/backbone/model_zoo/densenet.py +0 -344
paddlex/ppcls/arch/backbone/model_zoo/distilled_vision_transformer.py +0 -272
paddlex/ppcls/arch/backbone/model_zoo/dla.py +0 -528
paddlex/ppcls/arch/backbone/model_zoo/dpn.py +0 -451
paddlex/ppcls/arch/backbone/model_zoo/efficientnet.py +0 -976
paddlex/ppcls/arch/backbone/model_zoo/ghostnet.py +0 -363
paddlex/ppcls/arch/backbone/model_zoo/googlenet.py +0 -229
paddlex/ppcls/arch/backbone/model_zoo/gvt.py +0 -693
paddlex/ppcls/arch/backbone/model_zoo/hardnet.py +0 -293
paddlex/ppcls/arch/backbone/model_zoo/inception_v4.py +0 -477
paddlex/ppcls/arch/backbone/model_zoo/levit.py +0 -589
paddlex/ppcls/arch/backbone/model_zoo/mixnet.py +0 -815
paddlex/ppcls/arch/backbone/model_zoo/mobilenet_v2.py +0 -287
paddlex/ppcls/arch/backbone/model_zoo/rednet.py +0 -203
paddlex/ppcls/arch/backbone/model_zoo/regnet.py +0 -431
paddlex/ppcls/arch/backbone/model_zoo/repvgg.py +0 -422
paddlex/ppcls/arch/backbone/model_zoo/res2net.py +0 -264
paddlex/ppcls/arch/backbone/model_zoo/res2net_vd.py +0 -305
paddlex/ppcls/arch/backbone/model_zoo/resnest.py +0 -740
paddlex/ppcls/arch/backbone/model_zoo/resnet_vc.py +0 -309
paddlex/ppcls/arch/backbone/model_zoo/resnext.py +0 -298
paddlex/ppcls/arch/backbone/model_zoo/resnext101_wsl.py +0 -490
paddlex/ppcls/arch/backbone/model_zoo/resnext_vd.py +0 -317
paddlex/ppcls/arch/backbone/model_zoo/rexnet.py +0 -281
paddlex/ppcls/arch/backbone/model_zoo/se_resnet_vd.py +0 -390
paddlex/ppcls/arch/backbone/model_zoo/se_resnext.py +0 -364
paddlex/ppcls/arch/backbone/model_zoo/se_resnext_vd.py +0 -309
paddlex/ppcls/arch/backbone/model_zoo/shufflenet_v2.py +0 -362
paddlex/ppcls/arch/backbone/model_zoo/squeezenet.py +0 -194
paddlex/ppcls/arch/backbone/model_zoo/swin_transformer.py +0 -857
paddlex/ppcls/arch/backbone/model_zoo/tnt.py +0 -385
paddlex/ppcls/arch/backbone/model_zoo/vision_transformer.py +0 -495
paddlex/ppcls/arch/backbone/model_zoo/xception.py +0 -377
paddlex/ppcls/arch/backbone/model_zoo/xception_deeplab.py +0 -421
paddlex/ppcls/arch/backbone/variant_models/__init__.py +0 -3
paddlex/ppcls/arch/backbone/variant_models/pp_lcnet_variant.py +0 -29
paddlex/ppcls/arch/backbone/variant_models/resnet_variant.py +0 -23
paddlex/ppcls/arch/backbone/variant_models/vgg_variant.py +0 -28
paddlex/ppcls/arch/gears/__init__.py +0 -32
paddlex/ppcls/arch/gears/arcmargin.py +0 -72
paddlex/ppcls/arch/gears/circlemargin.py +0 -59
paddlex/ppcls/arch/gears/cosmargin.py +0 -55
paddlex/ppcls/arch/gears/fc.py +0 -35
paddlex/ppcls/arch/gears/identity_head.py +0 -9
paddlex/ppcls/arch/gears/vehicle_neck.py +0 -52
paddlex/ppcls/arch/utils.py +0 -53
paddlex/ppcls/data/__init__.py +0 -144
paddlex/ppcls/data/dataloader/DistributedRandomIdentitySampler.py +0 -90
paddlex/ppcls/data/dataloader/__init__.py +0 -9
paddlex/ppcls/data/dataloader/common_dataset.py +0 -84
paddlex/ppcls/data/dataloader/dali.py +0 -319
paddlex/ppcls/data/dataloader/icartoon_dataset.py +0 -36
paddlex/ppcls/data/dataloader/imagenet_dataset.py +0 -38
paddlex/ppcls/data/dataloader/logo_dataset.py +0 -46
paddlex/ppcls/data/dataloader/mix_dataset.py +0 -49
paddlex/ppcls/data/dataloader/mix_sampler.py +0 -79
paddlex/ppcls/data/dataloader/multilabel_dataset.py +0 -59
paddlex/ppcls/data/dataloader/pk_sampler.py +0 -105
paddlex/ppcls/data/dataloader/vehicle_dataset.py +0 -138
paddlex/ppcls/data/postprocess/__init__.py +0 -41
paddlex/ppcls/data/postprocess/topk.py +0 -85
paddlex/ppcls/data/preprocess/__init__.py +0 -100
paddlex/ppcls/data/preprocess/batch_ops/__init__.py +0 -0
paddlex/ppcls/data/preprocess/batch_ops/batch_operators.py +0 -231
paddlex/ppcls/data/preprocess/ops/__init__.py +0 -0
paddlex/ppcls/data/preprocess/ops/autoaugment.py +0 -264
paddlex/ppcls/data/preprocess/ops/cutout.py +0 -41
paddlex/ppcls/data/preprocess/ops/fmix.py +0 -217
paddlex/ppcls/data/preprocess/ops/functional.py +0 -141
paddlex/ppcls/data/preprocess/ops/grid.py +0 -89
paddlex/ppcls/data/preprocess/ops/hide_and_seek.py +0 -44
paddlex/ppcls/data/preprocess/ops/operators.py +0 -384
paddlex/ppcls/data/preprocess/ops/randaugment.py +0 -106
paddlex/ppcls/data/preprocess/ops/random_erasing.py +0 -90
paddlex/ppcls/data/preprocess/ops/timm_autoaugment.py +0 -877
paddlex/ppcls/data/utils/__init__.py +0 -13
paddlex/ppcls/data/utils/get_image_list.py +0 -49
paddlex/ppcls/engine/__init__.py +0 -0
paddlex/ppcls/engine/engine.py +0 -436
paddlex/ppcls/engine/evaluation/__init__.py +0 -16
paddlex/ppcls/engine/evaluation/classification.py +0 -143
paddlex/ppcls/engine/evaluation/retrieval.py +0 -169
paddlex/ppcls/engine/slim/__init__.py +0 -16
paddlex/ppcls/engine/slim/prune.py +0 -66
paddlex/ppcls/engine/slim/quant.py +0 -55
paddlex/ppcls/engine/train/__init__.py +0 -14
paddlex/ppcls/engine/train/train.py +0 -79
paddlex/ppcls/engine/train/utils.py +0 -72
paddlex/ppcls/loss/__init__.py +0 -65
paddlex/ppcls/loss/celoss.py +0 -67
paddlex/ppcls/loss/centerloss.py +0 -54
paddlex/ppcls/loss/comfunc.py +0 -45
paddlex/ppcls/loss/deephashloss.py +0 -96
paddlex/ppcls/loss/distanceloss.py +0 -43
paddlex/ppcls/loss/distillationloss.py +0 -141
paddlex/ppcls/loss/dmlloss.py +0 -46
paddlex/ppcls/loss/emlloss.py +0 -97
paddlex/ppcls/loss/googlenetloss.py +0 -42
paddlex/ppcls/loss/msmloss.py +0 -78
paddlex/ppcls/loss/multilabelloss.py +0 -43
paddlex/ppcls/loss/npairsloss.py +0 -38
paddlex/ppcls/loss/pairwisecosface.py +0 -59
paddlex/ppcls/loss/supconloss.py +0 -108
paddlex/ppcls/loss/trihardloss.py +0 -82
paddlex/ppcls/loss/triplet.py +0 -137
paddlex/ppcls/metric/__init__.py +0 -51
paddlex/ppcls/metric/metrics.py +0 -308
paddlex/ppcls/optimizer/__init__.py +0 -72
paddlex/ppcls/optimizer/learning_rate.py +0 -326
paddlex/ppcls/optimizer/optimizer.py +0 -208
paddlex/ppcls/utils/__init__.py +0 -27
paddlex/ppcls/utils/check.py +0 -151
paddlex/ppcls/utils/config.py +0 -210
paddlex/ppcls/utils/download.py +0 -319
paddlex/ppcls/utils/ema.py +0 -63
paddlex/ppcls/utils/logger.py +0 -137
paddlex/ppcls/utils/metrics.py +0 -112
paddlex/ppcls/utils/misc.py +0 -63
paddlex/ppcls/utils/model_zoo.py +0 -213
paddlex/ppcls/utils/profiler.py +0 -111
paddlex/ppcls/utils/save_load.py +0 -136
paddlex/ppdet/__init__.py +0 -16
paddlex/ppdet/core/__init__.py +0 -15
paddlex/ppdet/core/config/__init__.py +0 -13
paddlex/ppdet/core/config/schema.py +0 -248
paddlex/ppdet/core/config/yaml_helpers.py +0 -118
paddlex/ppdet/core/workspace.py +0 -278
paddlex/ppdet/data/__init__.py +0 -21
paddlex/ppdet/data/crop_utils/__init__.py +0 -13
paddlex/ppdet/data/crop_utils/annotation_cropper.py +0 -585
paddlex/ppdet/data/crop_utils/chip_box_utils.py +0 -170
paddlex/ppdet/data/reader.py +0 -302
paddlex/ppdet/data/shm_utils.py +0 -67
paddlex/ppdet/data/source/__init__.py +0 -29
paddlex/ppdet/data/source/category.py +0 -904
paddlex/ppdet/data/source/coco.py +0 -251
paddlex/ppdet/data/source/dataset.py +0 -197
paddlex/ppdet/data/source/keypoint_coco.py +0 -669
paddlex/ppdet/data/source/mot.py +0 -636
paddlex/ppdet/data/source/sniper_coco.py +0 -191
paddlex/ppdet/data/source/voc.py +0 -231
paddlex/ppdet/data/source/widerface.py +0 -180
paddlex/ppdet/data/transform/__init__.py +0 -28
paddlex/ppdet/data/transform/atss_assigner.py +0 -270
paddlex/ppdet/data/transform/autoaugment_utils.py +0 -1591
paddlex/ppdet/data/transform/batch_operators.py +0 -1080
paddlex/ppdet/data/transform/gridmask_utils.py +0 -86
paddlex/ppdet/data/transform/keypoint_operators.py +0 -868
paddlex/ppdet/data/transform/mot_operators.py +0 -628
paddlex/ppdet/data/transform/op_helper.py +0 -498
paddlex/ppdet/data/transform/operators.py +0 -3025
paddlex/ppdet/engine/__init__.py +0 -30
paddlex/ppdet/engine/callbacks.py +0 -340
paddlex/ppdet/engine/env.py +0 -50
paddlex/ppdet/engine/export_utils.py +0 -177
paddlex/ppdet/engine/tracker.py +0 -538
paddlex/ppdet/engine/trainer.py +0 -723
paddlex/ppdet/metrics/__init__.py +0 -29
paddlex/ppdet/metrics/coco_utils.py +0 -184
paddlex/ppdet/metrics/json_results.py +0 -149
paddlex/ppdet/metrics/keypoint_metrics.py +0 -401
paddlex/ppdet/metrics/map_utils.py +0 -444
paddlex/ppdet/metrics/mcmot_metrics.py +0 -470
paddlex/ppdet/metrics/metrics.py +0 -434
paddlex/ppdet/metrics/mot_metrics.py +0 -1236
paddlex/ppdet/metrics/munkres.py +0 -428
paddlex/ppdet/metrics/widerface_utils.py +0 -393
paddlex/ppdet/model_zoo/__init__.py +0 -18
paddlex/ppdet/model_zoo/model_zoo.py +0 -84
paddlex/ppdet/modeling/__init__.py +0 -45
paddlex/ppdet/modeling/architectures/__init__.py +0 -51
paddlex/ppdet/modeling/architectures/blazeface.py +0 -91
paddlex/ppdet/modeling/architectures/cascade_rcnn.py +0 -144
paddlex/ppdet/modeling/architectures/centernet.py +0 -108
paddlex/ppdet/modeling/architectures/deepsort.py +0 -69
paddlex/ppdet/modeling/architectures/detr.py +0 -93
paddlex/ppdet/modeling/architectures/fairmot.py +0 -100
paddlex/ppdet/modeling/architectures/faster_rcnn.py +0 -106
paddlex/ppdet/modeling/architectures/fcos.py +0 -105
paddlex/ppdet/modeling/architectures/gfl.py +0 -87
paddlex/ppdet/modeling/architectures/jde.py +0 -111
paddlex/ppdet/modeling/architectures/keypoint_hrhrnet.py +0 -287
paddlex/ppdet/modeling/architectures/keypoint_hrnet.py +0 -267
paddlex/ppdet/modeling/architectures/mask_rcnn.py +0 -135
paddlex/ppdet/modeling/architectures/meta_arch.py +0 -128
paddlex/ppdet/modeling/architectures/picodet.py +0 -91
paddlex/ppdet/modeling/architectures/s2anet.py +0 -102
paddlex/ppdet/modeling/architectures/solov2.py +0 -110
paddlex/ppdet/modeling/architectures/sparse_rcnn.py +0 -99
paddlex/ppdet/modeling/architectures/ssd.py +0 -93
paddlex/ppdet/modeling/architectures/tood.py +0 -78
paddlex/ppdet/modeling/architectures/ttfnet.py +0 -98
paddlex/ppdet/modeling/architectures/yolo.py +0 -124
paddlex/ppdet/modeling/assigners/__init__.py +0 -23
paddlex/ppdet/modeling/assigners/atss_assigner.py +0 -211
paddlex/ppdet/modeling/assigners/simota_assigner.py +0 -262
paddlex/ppdet/modeling/assigners/task_aligned_assigner.py +0 -158
paddlex/ppdet/modeling/assigners/utils.py +0 -195
paddlex/ppdet/modeling/backbones/__init__.py +0 -49
paddlex/ppdet/modeling/backbones/blazenet.py +0 -323
paddlex/ppdet/modeling/backbones/darknet.py +0 -340
paddlex/ppdet/modeling/backbones/dla.py +0 -244
paddlex/ppdet/modeling/backbones/esnet.py +0 -290
paddlex/ppdet/modeling/backbones/ghostnet.py +0 -470
paddlex/ppdet/modeling/backbones/hardnet.py +0 -224
paddlex/ppdet/modeling/backbones/hrnet.py +0 -727
paddlex/ppdet/modeling/backbones/lcnet.py +0 -259
paddlex/ppdet/modeling/backbones/lite_hrnet.py +0 -886
paddlex/ppdet/modeling/backbones/mobilenet_v1.py +0 -418
paddlex/ppdet/modeling/backbones/mobilenet_v3.py +0 -483
paddlex/ppdet/modeling/backbones/name_adapter.py +0 -69
paddlex/ppdet/modeling/backbones/res2net.py +0 -358
paddlex/ppdet/modeling/backbones/resnet.py +0 -613
paddlex/ppdet/modeling/backbones/senet.py +0 -139
paddlex/ppdet/modeling/backbones/shufflenet_v2.py +0 -246
paddlex/ppdet/modeling/backbones/swin_transformer.py +0 -743
paddlex/ppdet/modeling/backbones/vgg.py +0 -210
paddlex/ppdet/modeling/bbox_utils.py +0 -778
paddlex/ppdet/modeling/heads/__init__.py +0 -53
paddlex/ppdet/modeling/heads/bbox_head.py +0 -377
paddlex/ppdet/modeling/heads/cascade_head.py +0 -284
paddlex/ppdet/modeling/heads/centernet_head.py +0 -292
paddlex/ppdet/modeling/heads/detr_head.py +0 -368
paddlex/ppdet/modeling/heads/face_head.py +0 -110
paddlex/ppdet/modeling/heads/fcos_head.py +0 -259
paddlex/ppdet/modeling/heads/gfl_head.py +0 -487
paddlex/ppdet/modeling/heads/keypoint_hrhrnet_head.py +0 -108
paddlex/ppdet/modeling/heads/mask_head.py +0 -250
paddlex/ppdet/modeling/heads/pico_head.py +0 -278
paddlex/ppdet/modeling/heads/roi_extractor.py +0 -111
paddlex/ppdet/modeling/heads/s2anet_head.py +0 -1056
paddlex/ppdet/modeling/heads/simota_head.py +0 -506
paddlex/ppdet/modeling/heads/solov2_head.py +0 -560
paddlex/ppdet/modeling/heads/sparsercnn_head.py +0 -375
paddlex/ppdet/modeling/heads/ssd_head.py +0 -215
paddlex/ppdet/modeling/heads/tood_head.py +0 -366
paddlex/ppdet/modeling/heads/ttf_head.py +0 -316
paddlex/ppdet/modeling/heads/yolo_head.py +0 -124
paddlex/ppdet/modeling/initializer.py +0 -317
paddlex/ppdet/modeling/keypoint_utils.py +0 -342
paddlex/ppdet/modeling/layers.py +0 -1430
paddlex/ppdet/modeling/losses/__init__.py +0 -43
paddlex/ppdet/modeling/losses/ctfocal_loss.py +0 -68
paddlex/ppdet/modeling/losses/detr_loss.py +0 -233
paddlex/ppdet/modeling/losses/fairmot_loss.py +0 -41
paddlex/ppdet/modeling/losses/fcos_loss.py +0 -225
paddlex/ppdet/modeling/losses/gfocal_loss.py +0 -217
paddlex/ppdet/modeling/losses/iou_aware_loss.py +0 -47
paddlex/ppdet/modeling/losses/iou_loss.py +0 -210
paddlex/ppdet/modeling/losses/jde_loss.py +0 -193
paddlex/ppdet/modeling/losses/keypoint_loss.py +0 -229
paddlex/ppdet/modeling/losses/solov2_loss.py +0 -101
paddlex/ppdet/modeling/losses/sparsercnn_loss.py +0 -425
paddlex/ppdet/modeling/losses/ssd_loss.py +0 -170
paddlex/ppdet/modeling/losses/varifocal_loss.py +0 -152
paddlex/ppdet/modeling/losses/yolo_loss.py +0 -212
paddlex/ppdet/modeling/mot/__init__.py +0 -25
paddlex/ppdet/modeling/mot/matching/__init__.py +0 -19
paddlex/ppdet/modeling/mot/matching/deepsort_matching.py +0 -382
paddlex/ppdet/modeling/mot/matching/jde_matching.py +0 -144
paddlex/ppdet/modeling/mot/motion/__init__.py +0 -17
paddlex/ppdet/modeling/mot/motion/kalman_filter.py +0 -270
paddlex/ppdet/modeling/mot/tracker/__init__.py +0 -23
paddlex/ppdet/modeling/mot/tracker/base_jde_tracker.py +0 -297
paddlex/ppdet/modeling/mot/tracker/base_sde_tracker.py +0 -156
paddlex/ppdet/modeling/mot/tracker/deepsort_tracker.py +0 -188
paddlex/ppdet/modeling/mot/tracker/jde_tracker.py +0 -277
paddlex/ppdet/modeling/mot/utils.py +0 -263
paddlex/ppdet/modeling/mot/visualization.py +0 -150
paddlex/ppdet/modeling/necks/__init__.py +0 -30
paddlex/ppdet/modeling/necks/bifpn.py +0 -302
paddlex/ppdet/modeling/necks/blazeface_fpn.py +0 -216
paddlex/ppdet/modeling/necks/centernet_fpn.py +0 -426
paddlex/ppdet/modeling/necks/csp_pan.py +0 -364
paddlex/ppdet/modeling/necks/fpn.py +0 -231
paddlex/ppdet/modeling/necks/hrfpn.py +0 -126
paddlex/ppdet/modeling/necks/ttf_fpn.py +0 -242
paddlex/ppdet/modeling/necks/yolo_fpn.py +0 -988
paddlex/ppdet/modeling/ops.py +0 -1611
paddlex/ppdet/modeling/post_process.py +0 -731
paddlex/ppdet/modeling/proposal_generator/__init__.py +0 -2
paddlex/ppdet/modeling/proposal_generator/anchor_generator.py +0 -135
paddlex/ppdet/modeling/proposal_generator/proposal_generator.py +0 -77
paddlex/ppdet/modeling/proposal_generator/rpn_head.py +0 -260
paddlex/ppdet/modeling/proposal_generator/target.py +0 -681
paddlex/ppdet/modeling/proposal_generator/target_layer.py +0 -491
paddlex/ppdet/modeling/reid/__init__.py +0 -25
paddlex/ppdet/modeling/reid/fairmot_embedding_head.py +0 -225
paddlex/ppdet/modeling/reid/jde_embedding_head.py +0 -214
paddlex/ppdet/modeling/reid/pplcnet_embedding.py +0 -282
paddlex/ppdet/modeling/reid/pyramidal_embedding.py +0 -144
paddlex/ppdet/modeling/reid/resnet.py +0 -310
paddlex/ppdet/modeling/shape_spec.py +0 -25
paddlex/ppdet/modeling/transformers/__init__.py +0 -25
paddlex/ppdet/modeling/transformers/deformable_transformer.py +0 -517
paddlex/ppdet/modeling/transformers/detr_transformer.py +0 -353
paddlex/ppdet/modeling/transformers/matchers.py +0 -127
paddlex/ppdet/modeling/transformers/position_encoding.py +0 -108
paddlex/ppdet/modeling/transformers/utils.py +0 -110
paddlex/ppdet/optimizer.py +0 -335
paddlex/ppdet/slim/__init__.py +0 -82
paddlex/ppdet/slim/distill.py +0 -110
paddlex/ppdet/slim/prune.py +0 -85
paddlex/ppdet/slim/quant.py +0 -84
paddlex/ppdet/slim/unstructured_prune.py +0 -66
paddlex/ppdet/utils/__init__.py +0 -13
paddlex/ppdet/utils/check.py +0 -112
paddlex/ppdet/utils/checkpoint.py +0 -226
paddlex/ppdet/utils/cli.py +0 -151
paddlex/ppdet/utils/colormap.py +0 -58
paddlex/ppdet/utils/download.py +0 -558
paddlex/ppdet/utils/logger.py +0 -70
paddlex/ppdet/utils/profiler.py +0 -111
paddlex/ppdet/utils/stats.py +0 -94
paddlex/ppdet/utils/visualizer.py +0 -321
paddlex/ppdet/utils/voc_utils.py +0 -86
paddlex/seg.py +0 -41
paddlex/tools/__init__.py +0 -17
paddlex/tools/anchor_clustering/__init__.py +0 -15
paddlex/tools/anchor_clustering/yolo_cluster.py +0 -178
paddlex/tools/convert.py +0 -52
paddlex/tools/dataset_conversion/__init__.py +0 -24
paddlex/tools/dataset_conversion/x2coco.py +0 -379
paddlex/tools/dataset_conversion/x2imagenet.py +0 -82
paddlex/tools/dataset_conversion/x2seg.py +0 -343
paddlex/tools/dataset_conversion/x2voc.py +0 -230
paddlex/tools/dataset_split/__init__.py +0 -23
paddlex/tools/dataset_split/coco_split.py +0 -69
paddlex/tools/dataset_split/imagenet_split.py +0 -75
paddlex/tools/dataset_split/seg_split.py +0 -96
paddlex/tools/dataset_split/utils.py +0 -75
paddlex/tools/dataset_split/voc_split.py +0 -91
paddlex/tools/split.py +0 -41
paddlex/utils/checkpoint.py +0 -492
paddlex/utils/shm.py +0 -67
paddlex/utils/stats.py +0 -68
paddlex/utils/utils.py +0 -229
paddlex-2.1.0.data/data/paddlex_restful/restful/templates/paddlex_restful_demo.html +0 -5205
paddlex-2.1.0.dist-info/LICENSE +0 -201
paddlex-2.1.0.dist-info/METADATA +0 -32
paddlex-2.1.0.dist-info/RECORD +0 -698
paddlex-2.1.0.dist-info/WHEEL +0 -5
paddlex-2.1.0.dist-info/entry_points.txt +0 -4
paddlex-2.1.0.dist-info/top_level.txt +0 -3
paddlex_restful/__init__.py +0 -15
paddlex_restful/command.py +0 -63
paddlex_restful/restful/__init__.py +0 -15
paddlex_restful/restful/app.py +0 -969
paddlex_restful/restful/dataset/__init__.py +0 -13
paddlex_restful/restful/dataset/cls_dataset.py +0 -159
paddlex_restful/restful/dataset/dataset.py +0 -266
paddlex_restful/restful/dataset/datasetbase.py +0 -86
paddlex_restful/restful/dataset/det_dataset.py +0 -190
paddlex_restful/restful/dataset/ins_seg_dataset.py +0 -312
paddlex_restful/restful/dataset/operate.py +0 -155
paddlex_restful/restful/dataset/seg_dataset.py +0 -222
paddlex_restful/restful/dataset/utils.py +0 -267
paddlex_restful/restful/demo.py +0 -202
paddlex_restful/restful/dir.py +0 -45
paddlex_restful/restful/model.py +0 -312
paddlex_restful/restful/project/__init__.py +0 -13
paddlex_restful/restful/project/evaluate/__init__.py +0 -13
paddlex_restful/restful/project/evaluate/classification.py +0 -126
paddlex_restful/restful/project/evaluate/detection.py +0 -789
paddlex_restful/restful/project/evaluate/draw_pred_result.py +0 -181
paddlex_restful/restful/project/evaluate/segmentation.py +0 -122
paddlex_restful/restful/project/operate.py +0 -931
paddlex_restful/restful/project/project.py +0 -143
paddlex_restful/restful/project/prune/__init__.py +0 -13
paddlex_restful/restful/project/prune/classification.py +0 -32
paddlex_restful/restful/project/prune/detection.py +0 -48
paddlex_restful/restful/project/prune/segmentation.py +0 -34
paddlex_restful/restful/project/task.py +0 -884
paddlex_restful/restful/project/train/__init__.py +0 -13
paddlex_restful/restful/project/train/classification.py +0 -141
paddlex_restful/restful/project/train/detection.py +0 -263
paddlex_restful/restful/project/train/params.py +0 -432
paddlex_restful/restful/project/train/params_v2.py +0 -326
paddlex_restful/restful/project/train/segmentation.py +0 -191
paddlex_restful/restful/project/visualize.py +0 -244
paddlex_restful/restful/system.py +0 -102
paddlex_restful/restful/templates/paddlex_restful_demo.html +0 -5205
paddlex_restful/restful/utils.py +0 -841
paddlex_restful/restful/workspace.py +0 -343
paddlex_restful/restful/workspace_pb2.py +0 -1411

paddlex/inference/models/multilingual_speech_recognition/processors.py ADDED Viewed

@@ -0,0 +1,1941 @@
+# copyright (c) 2024 PaddlePaddle Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# Modified from OpenAI Whisper 2022 (https://github.com/openai/whisper/whisper)
+import os
+import tqdm
+import zlib
+import soundfile
+import numpy as np
+import lazy_paddle as paddle
+from dataclasses import dataclass
+from dataclasses import field
+from functools import lru_cache
+from typing import Dict, Iterable, List, Optional, Sequence, Tuple, Union
+from ..common.tokenizer import GPTTokenizer
+# Names exported by a star-import of this module.
+__all__ = [
+    "Whisper",
+    "Tokenizer",
+]
+def exact_div(x, y):
+    assert x % y == 0
+    return x // y
+# NOTE(review): not referenced in the visible part of this file; presumably the
+# supported model size names — confirm against the model loader.
+_MODELS = ["large"]
+# Audio front-end constants. Units are not stated here; presumably SAMPLE_RATE is in Hz,
+# N_FFT / HOP_LENGTH are in samples and CHUNK_LENGTH is in seconds — TODO confirm.
+SAMPLE_RATE = 16000
+N_FFT = 400
+N_MELS = 80
+HOP_LENGTH = 160
+CHUNK_LENGTH = 30
+N_SAMPLES = CHUNK_LENGTH * SAMPLE_RATE  # 480000: number of samples in a chunk
+# exact_div asserts that HOP_LENGTH divides N_SAMPLES evenly.
+N_FRAMES = exact_div(
+    N_SAMPLES, HOP_LENGTH
+)  # 3000: number of frames in a mel spectrogram input
+@dataclass
+class ModelDimensions:
+    """Integer hyper-parameters describing the size of the model.
+    `n_audio_ctx` and `n_audio_state` are the last two dimensions that
+    `detect_language` expects of already-encoded audio features. The meaning of the
+    remaining fields is presumably as their names suggest (audio encoder vs. text
+    decoder sizes) — confirm against the model constructor.
+    """
+    n_mels: int
+    n_audio_ctx: int
+    n_audio_state: int
+    n_audio_head: int
+    n_audio_layer: int
+    n_vocab: int
+    n_text_ctx: int
+    n_text_state: int
+    n_text_head: int
+    n_text_layer: int
+# Supported languages: language code -> lower-case English language name.
+# The insertion order matters: `build_tokenizer` creates one "<|code|>" special token per
+# entry in this order, and `get_tokenizer` derives a language token id from the entry's index.
+LANGUAGES = {
+    "en": "english",
+    "zh": "chinese",
+    "de": "german",
+    "es": "spanish",
+    "ru": "russian",
+    "ko": "korean",
+    "fr": "french",
+    "ja": "japanese",
+    "pt": "portuguese",
+    "tr": "turkish",
+    "pl": "polish",
+    "ca": "catalan",
+    "nl": "dutch",
+    "ar": "arabic",
+    "sv": "swedish",
+    "it": "italian",
+    "id": "indonesian",
+    "hi": "hindi",
+    "fi": "finnish",
+    "vi": "vietnamese",
+    "iw": "hebrew",
+    "uk": "ukrainian",
+    "el": "greek",
+    "ms": "malay",
+    "cs": "czech",
+    "ro": "romanian",
+    "da": "danish",
+    "hu": "hungarian",
+    "ta": "tamil",
+    "no": "norwegian",
+    "th": "thai",
+    "ur": "urdu",
+    "hr": "croatian",
+    "bg": "bulgarian",
+    "lt": "lithuanian",
+    "la": "latin",
+    "mi": "maori",
+    "ml": "malayalam",
+    "cy": "welsh",
+    "sk": "slovak",
+    "te": "telugu",
+    "fa": "persian",
+    "lv": "latvian",
+    "bn": "bengali",
+    "sr": "serbian",
+    "az": "azerbaijani",
+    "sl": "slovenian",
+    "kn": "kannada",
+    "et": "estonian",
+    "mk": "macedonian",
+    "br": "breton",
+    "eu": "basque",
+    "is": "icelandic",
+    "hy": "armenian",
+    "ne": "nepali",
+    "mn": "mongolian",
+    "bs": "bosnian",
+    "kk": "kazakh",
+    "sq": "albanian",
+    "sw": "swahili",
+    "gl": "galician",
+    "mr": "marathi",
+    "pa": "punjabi",
+    "si": "sinhala",
+    "km": "khmer",
+    "sn": "shona",
+    "yo": "yoruba",
+    "so": "somali",
+    "af": "afrikaans",
+    "oc": "occitan",
+    "ka": "georgian",
+    "be": "belarusian",
+    "tg": "tajik",
+    "sd": "sindhi",
+    "gu": "gujarati",
+    "am": "amharic",
+    "yi": "yiddish",
+    "lo": "lao",
+    "uz": "uzbek",
+    "fo": "faroese",
+    "ht": "haitian creole",
+    "ps": "pashto",
+    "tk": "turkmen",
+    "nn": "nynorsk",
+    "mt": "maltese",
+    "sa": "sanskrit",
+    "lb": "luxembourgish",
+    "my": "myanmar",
+    "bo": "tibetan",
+    "tl": "tagalog",
+    "mg": "malagasy",
+    "as": "assamese",
+    "tt": "tatar",
+    "haw": "hawaiian",
+    "ln": "lingala",
+    "ha": "hausa",
+    "ba": "bashkir",
+    "jw": "javanese",
+    "su": "sundanese",
+}
+# language code lookup by name, with a few language aliases
+TO_LANGUAGE_CODE = {
+    **{language: code for code, language in LANGUAGES.items()},
+    "burmese": "my",
+    "valencian": "ca",
+    "flemish": "nl",
+    "haitian": "ht",
+    "letzeburgesch": "lb",
+    "pushto": "ps",
+    "panjabi": "pa",
+    "moldavian": "ro",
+    "moldovan": "ro",
+    "sinhalese": "si",
+    "castilian": "es",
+}
+def compression_ratio(text) -> float:
+    return len(text) / len(zlib.compress(text.encode("utf-8")))
+def format_timestamp(
+    seconds: float, always_include_hours: bool = False, decimal_marker: str = "."
+):
+    assert seconds >= 0, "non-negative timestamp expected"
+    milliseconds = round(seconds * 1000.0)
+    hours = milliseconds // 3_600_000
+    milliseconds -= hours * 3_600_000
+    minutes = milliseconds // 60_000
+    milliseconds -= minutes * 60_000
+    seconds = milliseconds // 1_000
+    milliseconds -= seconds * 1_000
+    hours_marker = f"{hours:02d}:" if always_include_hours or hours > 0 else ""
+    return (
+        f"{hours_marker}{minutes:02d}:{seconds:02d}{decimal_marker}{milliseconds:03d}"
+    )
+@dataclass(frozen=True)
+class Tokenizer:
+    """A thin wrapper around `GPTTokenizer` providing quick access to special tokens"""
+    tokenizer: "GPTTokenizer"
+    language: Optional[str]
+    sot_sequence: Tuple[int]
+    def encode(self, text, **kwargs):
+        return self.tokenizer.encode(text, **kwargs)
+    def decode(
+        self, token_ids: Union[int, List[int], np.ndarray, paddle.Tensor], **kwargs
+    ):
+        if len(token_ids) > 1:
+            ids_list = []
+            for ids in token_ids:
+                if paddle.is_tensor(ids):
+                    ids = ids.item()
+                if ids < len(self.tokenizer):
+                    ids_list.append(ids)
+            token_ids = ids_list
+        elif len(token_ids) == 1:
+            token_ids = token_ids[0]
+        else:
+            raise ValueError(f"token_ids {token_ids} load error.")
+        return self.tokenizer.decode(token_ids, **kwargs)
+    def decode_with_timestamps(self, tokens) -> str:
+        """
+        Timestamp tokens are above the special tokens' id range and are ignored by `decode()`.
+        This method decodes given tokens with timestamps tokens annotated, e.g. "<|1.08|>".
+        """
+        outputs = [[]]
+        for token in tokens:
+            if token >= self.timestamp_begin:
+                timestamp = f"<|{(token - self.timestamp_begin) * 0.02:.2f}|>"
+                outputs.append(timestamp)
+                outputs.append([])
+            else:
+                outputs[-1].append(token)
+        outputs = [
+            s if isinstance(s, str) else self.tokenizer.decode(s) for s in outputs
+        ]
+        return "".join(outputs)
+    @property
+    @lru_cache()
+    def eot(self) -> int:
+        return self.tokenizer.eos_token_id
+    @property
+    @lru_cache()
+    def sot(self) -> int:
+        return self._get_single_token_id("<|startoftranscript|>")
+    @property
+    @lru_cache()
+    def sot_lm(self) -> int:
+        return self._get_single_token_id("<|startoflm|>")
+    @property
+    @lru_cache()
+    def sot_prev(self) -> int:
+        return self._get_single_token_id("<|startofprev|>")
+    @property
+    @lru_cache()
+    def no_speech(self) -> int:
+        return self._get_single_token_id("<|nospeech|>")
+    @property
+    @lru_cache()
+    def no_timestamps(self) -> int:
+        return self._get_single_token_id("<|notimestamps|>")
+    @property
+    @lru_cache()
+    def timestamp_begin(self) -> int:
+        return self.tokenizer.all_special_ids[-1] + 1
+    @property
+    @lru_cache()
+    def language_token(self) -> int:
+        """Returns the token id corresponding to the value of the `language` field"""
+        if self.language is None:
+            raise ValueError("This tokenizer does not have language token configured")
+        additional_tokens = dict(
+            zip(
+                self.tokenizer.additional_special_tokens,
+                self.tokenizer.additional_special_tokens_ids,
+            )
+        )
+        candidate = f"<|{self.language}|>"
+        if candidate in additional_tokens:
+            return additional_tokens[candidate]
+        raise KeyError(f"Language {self.language} not found in tokenizer.")
+    @property
+    @lru_cache()
+    def all_language_tokens(self) -> Tuple[int]:
+        result = []
+        for token, token_id in zip(
+            self.tokenizer.additional_special_tokens,
+            self.tokenizer.additional_special_tokens_ids,
+        ):
+            if token.strip("<|>") in LANGUAGES:
+                result.append(token_id)
+        return tuple(result)
+    @property
+    @lru_cache()
+    def all_language_codes(self) -> Tuple[str]:
+        return tuple(self.decode([l]).strip("<|>") for l in self.all_language_tokens)
+    @property
+    @lru_cache()
+    def sot_sequence_including_notimestamps(self) -> Tuple[int]:
+        return tuple(list(self.sot_sequence) + [self.no_timestamps])
+    @property
+    @lru_cache()
+    def non_speech_tokens(self) -> Tuple[int]:
+        """
+        Returns the list of tokens to suppress in order to avoid any speaker tags or non-speech
+        annotations, to prevent sampling texts that are not actually spoken in the audio, e.g.
+        - ♪♪♪
+        - ( SPEAKING FOREIGN LANGUAGE )
+        - [DAVID] Hey there,
+        keeping basic punctuations like commas, periods, question marks, exclamation points, etc.
+        """
+        symbols = list('"#()*+/:;<=>@[\\]^_`{|}~「」『』')
+        symbols += (
+            "<< >> <<< >>> -- --- -( -[ (' (\" (( )) ((( ))) [[ ]] {{ }} ♪♪ ♪♪♪".split()
+        )
+        # symbols that may be a single token or multiple tokens depending on the tokenizer.
+        # In case they're multiple tokens, suppress the first token, which is safe because:
+        # These are between U+2640 and U+267F miscellaneous symbols that are okay to suppress
+        # in generations, and in the 3-byte UTF-8 representation they share the first two bytes.
+        miscellaneous = set("♩♪♫♬♭♮♯")
+        assert all(0x2640 <= ord(c) <= 0x267F for c in miscellaneous)
+        # allow hyphens "-" and single quotes "'" between words, but not at the beginning of a word
+        result = {
+            self.tokenizer.encode(" -").input_ids[0],
+            self.tokenizer.encode(" '").input_ids[0],
+        }
+        for symbol in symbols + list(miscellaneous):
+            for tokens in [
+                self.tokenizer.encode(symbol).input_ids,
+                self.tokenizer.encode(" " + symbol).input_ids,
+            ]:
+                if len(tokens) == 1 or symbol in miscellaneous:
+                    result.add(tokens[0])
+        return tuple(sorted(result))
+    def _get_single_token_id(self, text) -> int:
+        tokens = self.tokenizer.encode(text).input_ids
+        assert len(tokens) == 1, f"{text} is not encoded as a single token"
+        return tokens[0]
+@lru_cache(maxsize=None)
+def build_tokenizer(resource_path: str, name: str = "gpt2"):
+    os.environ["TOKENIZERS_PARALLELISM"] = "false"
+    path = os.path.join(resource_path, "assets", name)
+    tokenizer = GPTTokenizer.from_pretrained(path)
+    specials = [
+        "<|startoftranscript|>",
+        *[f"<|{lang}|>" for lang in LANGUAGES.keys()],
+        "<|translate|>",
+        "<|transcribe|>",
+        "<|startoflm|>",
+        "<|startofprev|>",
+        "<|nospeech|>",
+        "<|notimestamps|>",
+    ]
+    tokenizer.add_special_tokens(dict(additional_special_tokens=specials))
+    return tokenizer
+@lru_cache(maxsize=None)
+def get_tokenizer(
+    multilingual: bool,
+    resource_path: str,
+    *,
+    task: Optional[str] = None,  # Literal["transcribe", "translate", None]
+    language: Optional[str] = None,
+) -> Tokenizer:
+    if language is not None:
+        language = language.lower()
+        if language not in LANGUAGES:
+            if language in TO_LANGUAGE_CODE:
+                language = TO_LANGUAGE_CODE[language]
+            else:
+                raise ValueError(f"Unsupported language: {language}")
+    if multilingual:
+        tokenizer_name = "multilingual"
+        task = task or "transcribe"
+        language = language or "en"
+    else:
+        tokenizer_name = "gpt2"
+        task = None
+        language = None
+    tokenizer = build_tokenizer(resource_path=resource_path, name=tokenizer_name)
+    all_special_ids: List[int] = tokenizer.all_special_ids
+    sot: int = all_special_ids[1]
+    translate: int = all_special_ids[-6]
+    transcribe: int = all_special_ids[-5]
+    langs = tuple(LANGUAGES.keys())
+    sot_sequence = [sot]
+    if language is not None:
+        sot_sequence.append(sot + 1 + langs.index(language))
+    if task is not None:
+        sot_sequence.append(transcribe if task == "transcribe" else translate)
+    return Tokenizer(
+        tokenizer=tokenizer, language=language, sot_sequence=tuple(sot_sequence)
+    )
+class MultiHeadAttention(paddle.nn.Layer):
+    def __init__(self, n_state: int, n_head: int):
+        super().__init__()
+        self.n_head = n_head
+        self.query = paddle.nn.Linear(n_state, n_state, bias_attr=True)
+        self.key = paddle.nn.Linear(n_state, n_state, bias_attr=False)
+        self.value = paddle.nn.Linear(n_state, n_state, bias_attr=True)
+        self.out = paddle.nn.Linear(n_state, n_state, bias_attr=True)
+    def forward(
+        self,
+        x: paddle.Tensor,
+        xa: Optional[paddle.Tensor] = None,
+        mask: Optional[paddle.Tensor] = None,
+        kv_cache: Optional[dict] = None,
+    ):
+        q = self.query(x)
+        if kv_cache is None or xa is None or self.key not in kv_cache:
+            # hooks, if installed (i.e. kv_cache is not None), will prepend the cached kv tensors;
+            # otherwise, perform key/value projections for self- or cross-attention as usual.
+            k = self.key(x if xa is None else xa)
+            v = self.value(x if xa is None else xa)
+        else:
+            # for cross-attention, calculate keys and values once and reuse in subsequent calls.
+            k = kv_cache[self.key]
+            v = kv_cache[self.value]
+        wv = self.qkv_attention(q, k, v, mask)
+        return self.out(wv)
+    def qkv_attention(
+        self,
+        q: paddle.Tensor,
+        k: paddle.Tensor,
+        v: paddle.Tensor,
+        mask: Optional[paddle.Tensor] = None,
+    ):
+        n_batch, n_ctx, n_state = q.shape
+        scale = (n_state // self.n_head) ** -0.25
+        q = (
+            paddle.transpose(q.reshape([*q.shape[:2], self.n_head, -1]), (0, 2, 1, 3))
+            * scale
+        )
+        k = (
+            paddle.transpose(k.reshape([*k.shape[:2], self.n_head, -1]), (0, 2, 3, 1))
+            * scale
+        )
+        v = paddle.transpose(v.reshape([*v.shape[:2], self.n_head, -1]), (0, 2, 1, 3))
+        qk = q @ k
+        if mask is not None:
+            qk = qk + mask[:n_ctx, :n_ctx]
+        w = paddle.nn.functional.softmax(qk.astype(q.dtype), axis=-1)
+        return paddle.transpose((w @ v), (0, 2, 1, 3)).flatten(start_axis=2)
+class ResidualAttentionBlock(paddle.nn.Layer):
+    def __init__(self, n_state: int, n_head: int, cross_attention: bool = False):
+        super().__init__()
+        self.attn = MultiHeadAttention(n_state, n_head)
+        self.attn_ln = paddle.nn.LayerNorm(n_state)
+        self.cross_attn = (
+            MultiHeadAttention(n_state, n_head) if cross_attention else None
+        )
+        self.cross_attn_ln = paddle.nn.LayerNorm(n_state) if cross_attention else None
+        n_mlp = n_state * 4
+        self.mlp = paddle.nn.Sequential(
+            paddle.nn.Linear(n_state, n_mlp, bias_attr=True),
+            paddle.nn.GELU(),
+            paddle.nn.Linear(n_mlp, n_state, bias_attr=True),
+        )
+        self.mlp_ln = paddle.nn.LayerNorm(n_state)
+    def forward(
+        self,
+        x: paddle.Tensor,
+        xa: Optional[paddle.Tensor] = None,
+        mask: Optional[paddle.Tensor] = None,
+        kv_cache: Optional[dict] = None,
+    ):
+        x = x + self.attn(self.attn_ln(x), mask=mask, kv_cache=kv_cache)
+        if self.cross_attn:
+            x = x + self.cross_attn(self.cross_attn_ln(x), xa, kv_cache=kv_cache)
+        x = x + self.mlp(self.mlp_ln(x))
+        return x
+def sinusoids(length, channels, max_timescale=10000):
+    """Returns sinusoids for positional embedding"""
+    assert channels % 2 == 0
+    log_timescale_increment = np.log(max_timescale) / (channels // 2 - 1)
+    inv_timescales = paddle.exp(
+        -log_timescale_increment * paddle.arange(channels // 2, dtype=paddle.float32)
+    )
+    scaled_time = (
+        paddle.arange(length, dtype=paddle.float32)[:, np.newaxis]
+        * inv_timescales[np.newaxis, :]
+    )
+    return paddle.to_tensor(
+        paddle.concat([paddle.sin(scaled_time), paddle.cos(scaled_time)], axis=1)
+    )
+class AudioEncoder(paddle.nn.Layer):
+    def __init__(
+        self, n_mels: int, n_ctx: int, n_state: int, n_head: int, n_layer: int
+    ):
+        super().__init__()
+        self.conv1 = paddle.nn.Conv1D(
+            n_mels, n_state, kernel_size=3, stride=1, padding=1, bias_attr=True
+        )
+        self.conv2 = paddle.nn.Conv1D(
+            n_state, n_state, kernel_size=3, stride=2, padding=1, bias_attr=True
+        )
+        self.register_buffer("positional_embedding", sinusoids(n_ctx, n_state))
+        self.blocks: Iterable[ResidualAttentionBlock] = paddle.nn.LayerList(
+            [ResidualAttentionBlock(n_state, n_head) for _ in range(n_layer)]
+        )
+        self.ln_post = paddle.nn.LayerNorm(n_state)
+    def forward(self, x: paddle.Tensor):
+        """
+        x : paddle.Tensor, shape = (batch_size, n_mels, n_ctx)
+            the mel spectrogram of the audio
+        """
+        x = paddle.nn.functional.gelu(self.conv1(x))
+        x = paddle.nn.functional.gelu(self.conv2(x))
+        x = paddle.transpose(x, (0, 2, 1))
+        assert x.shape[1:] == self.positional_embedding.shape, "incorrect audio shape"
+        x = x + self.positional_embedding
+        for block in self.blocks:
+            x = block(x)
+        x = self.ln_post(x)
+        return x
+class TextDecoder(paddle.nn.Layer):
+    def __init__(
+        self, n_vocab: int, n_ctx: int, n_state: int, n_head: int, n_layer: int
+    ):
+        super().__init__()
+        self.token_embedding = paddle.nn.Embedding(n_vocab, n_state)
+        self.positional_embedding = paddle.create_parameter(
+            shape=[n_ctx, n_state], dtype="float32"
+        )
+        self.blocks: Iterable[ResidualAttentionBlock] = paddle.nn.LayerList(
+            [
+                ResidualAttentionBlock(n_state, n_head, cross_attention=True)
+                for _ in range(n_layer)
+            ]
+        )
+        self.ln = paddle.nn.LayerNorm(n_state)
+        mask = paddle.full(shape=[n_ctx, n_state], fill_value=-np.inf, dtype="float32")
+        mask = paddle.triu(mask, diagonal=1)
+        self.register_buffer("mask", mask, persistable=False)
+    def forward(
+        self, x: paddle.Tensor, xa: paddle.Tensor, kv_cache: Optional[dict] = None
+    ):
+        """
+        x : paddle.LongTensor, shape = (batch_size, <= n_ctx)
+            the text tokens
+        xa : paddle.Tensor, shape = (batch_size, n_mels, n_audio_ctx)
+            the encoded audio features to be attended on
+        """
+        offset = next(iter(kv_cache.values())).shape[1] if kv_cache else 0
+        x = (
+            self.token_embedding(x)
+            + self.positional_embedding[offset : offset + x.shape[-1]]
+        )
+        x = x.to(xa.dtype)
+        for block in self.blocks:
+            x = block(x, xa, mask=self.mask, kv_cache=kv_cache)
+        x = self.ln(x)
+        logits = x @ paddle.transpose(self.token_embedding.weight, (1, 0))
+        return logits
+@dataclass(frozen=True)
+class DecodingOptions:
+    task: str = (
+        "transcribe"  # whether to perform X->X "transcribe" or X->English "translate"
+    )
+    language: Optional[str] = (
+        None  # language that the audio is in; uses detected language if None
+    )
+    # sampling-related options
+    temperature: float = 0.0
+    sample_len: Optional[int] = None  # maximum number of tokens to sample
+    best_of: Optional[int] = (
+        None  # number of independent samples to collect, when t > 0
+    )
+    beam_size: Optional[int] = None  # number of beams in beam search, when t == 0
+    patience: Optional[float] = (
+        None  # patience in beam search (https://arxiv.org/abs/2204.05424)
+    )
+    # options for ranking generations (either beams or best-of-N samples)
+    length_penalty: Optional[float] = (
+        None  # "alpha" in Google NMT, None defaults to length norm
+    )
+    # prompt, prefix, and token suppression
+    prompt: Optional[Union[str, List[int]]] = (
+        None  # text or tokens for the previous context
+    )
+    prefix: Optional[Union[str, List[int]]] = (
+        None  # text or tokens to prefix the current context
+    )
+    suppress_blank: bool = True  # this will suppress blank outputs
+    # list of tokens ids (or comma-separated token ids) to suppress
+    # "-1" will suppress a set of symbols as defined in `tokenizer.non_speech_tokens()`
+    suppress_tokens: Optional[Union[str, Iterable[int]]] = "-1"
+    # timestamp sampling options
+    without_timestamps: bool = False  # use <|notimestamps|> to sample text tokens only
+    max_initial_timestamp: Optional[float] = (
+        1.0  # the initial timestamp cannot be later than this
+    )
+    # implementation details
+    fp16: bool = False  # use fp16 for most of the calculation
+@dataclass(frozen=True)
+class DecodingResult:
+    """Immutable record describing the outcome of decoding one audio segment.
+    Only `audio_features` and `language` are required; the numeric fields default to NaN.
+    """
+    audio_features: paddle.Tensor
+    language: str
+    # presumably language code -> probability, as produced by `detect_language` — confirm
+    language_probs: Optional[Dict[str, float]] = None
+    # default_factory gives every instance its own list
+    tokens: List[int] = field(default_factory=list)
+    text: str = ""
+    avg_logprob: float = np.nan
+    no_speech_prob: float = np.nan
+    temperature: float = np.nan
+    compression_ratio: float = np.nan
+class Inference:
+    def logits(
+        self, tokens: paddle.Tensor, audio_features: paddle.Tensor
+    ) -> paddle.Tensor:
+        """Perform a forward pass on the decoder and return per-token logits"""
+        raise NotImplementedError
+    def rearrange_kv_cache(self, source_indices) -> None:
+        """Update the key-value cache according to the updated beams"""
+        raise NotImplementedError
+    def cleanup_caching(self) -> None:
+        """Clean up any resources or hooks after decoding is finished"""
+        pass
+class WhisperInference(Inference):
+    def __init__(self, model: "Whisper", initial_token_length: int):
+        self.model: "Whisper" = model
+        self.initial_token_length = initial_token_length
+        self.kv_cache = {}
+        self.hooks = []
+    def logits(
+        self, tokens: paddle.Tensor, audio_features: paddle.Tensor
+    ) -> paddle.Tensor:
+        if not self.kv_cache:
+            self.kv_cache, self.hooks = self.model.install_kv_cache_hooks()
+        if tokens.shape[-1] > self.initial_token_length:
+            # only need to use the last token except in the first forward pass
+            tokens = tokens[:, -1:]
+        return self.model.decoder(tokens, audio_features, kv_cache=self.kv_cache)
+    def cleanup_caching(self):
+        for hook in self.hooks:
+            hook.remove()
+        self.kv_cache = {}
+        self.hooks = []
+    def rearrange_kv_cache(self, source_indices):
+        for module, tensor in self.kv_cache.items():
+            # update the key/value cache to contain the selected sequences
+            self.kv_cache[module] = tensor[source_indices].detach()
+@paddle.no_grad()
+def detect_language(
+    model: "Whisper",
+    mel: paddle.Tensor,
+    resource_path: str,
+    tokenizer: Tokenizer = None,
+) -> Tuple[paddle.Tensor, List[dict]]:
+    """
+    Detect the spoken language in the audio, and return them as list of strings, along with the ids
+    of the most probable language tokens and the probability distribution over all language tokens.
+    This is performed outside the main decode loop in order to not interfere with kv-caching.
+    Returns
+    -------
+    language_tokens : Tensor, shape = (batch_size,)
+        ids of the most probable language tokens, which appears after the startoftranscript token.
+    language_probs : List[Dict[str, float]], length = batch_size
+        list of dictionaries containing the probability distribution over all languages.
+    """
+    if tokenizer is None:
+        tokenizer = get_tokenizer(model.is_multilingual, resource_path=resource_path)
+    if (
+        tokenizer.language is None
+        or tokenizer.language_token not in tokenizer.sot_sequence
+    ):
+        raise ValueError(
+            "This model doesn't have language tokens so it can't perform lang id"
+        )
+    single = mel.ndim == 2
+    if single:
+        mel = mel.unsqueeze(0)
+    # skip encoder forward pass if already-encoded audio features were given
+    if mel.shape[-2:] != (model.dims.n_audio_ctx, model.dims.n_audio_state):
+        mel = model.encoder(mel)
+    # forward pass using a single token, startoftranscript
+    batch_size = mel.shape[0]
+    x = paddle.to_tensor([[tokenizer.sot]] * batch_size)  # [batch_size, 1]
+    logits = model.logits(x, mel)[:, 0]
+    # collect detected languages; suppress all non-language tokens
+    mask = paddle.ones(paddle.to_tensor(logits.shape[-1]), dtype=bool)
+    mask[list(tokenizer.all_language_tokens)] = False
+    logits[:, mask] = -np.inf
+    language_tokens = paddle.argmax(logits, axis=-1)
+    language_token_probs = paddle.nn.functional.softmax(logits, axis=-1)
+    language_probs = [
+        {
+            c: language_token_probs[i, j].tolist()
+            for j, c in zip(tokenizer.all_language_tokens, tokenizer.all_language_codes)
+        }
+        for i in range(batch_size)
+    ]
+    if single:
+        language_tokens = language_tokens[0]
+        language_probs = language_probs[0]
+    return language_tokens, language_probs
+def transcribe(
+    model: "Whisper",
+    mel: paddle.Tensor,
+    resource_path: str,
+    *,
+    verbose: Optional[bool] = None,
+    temperature: Union[float, Tuple[float, ...]] = (0.0, 0.2, 0.4, 0.6, 0.8, 1.0),
+    compression_ratio_threshold: Optional[float] = 2.4,
+    logprob_threshold: Optional[float] = -1.0,
+    no_speech_threshold: Optional[float] = 0.6,
+    condition_on_previous_text: bool = True,
+    **decode_options,
+):
+    """
+    Transcribe audio features using Whisper, decoding one window of N_FRAMES at a time
+    Parameters
+    ----------
+    model: Whisper
+        The Whisper model instance
+    mel: paddle.Tensor
+        The audio feature; its last axis is iterated over as frames
+    resource_path: str
+        Passed through to `get_tokenizer`, `model.detect_language` and `model.decode`
+    verbose: bool
+        Whether to display the text being decoded to the console. If True, displays all the details,
+        If False, displays minimal details. If None, does not display anything
+    temperature: Union[float, Tuple[float, ...]]
+        Temperature for sampling. It can be a tuple of temperatures, which will be successively used
+        upon failures according to either `compression_ratio_threshold` or `logprob_threshold`.
+    compression_ratio_threshold: float
+        If the gzip compression ratio is above this value, treat as failed
+    logprob_threshold: float
+        If the average log probability over sampled tokens is below this value, treat as failed
+    no_speech_threshold: float
+        If the no_speech probability is higher than this value AND the average log probability
+        over sampled tokens is below `logprob_threshold`, consider the segment as silent
+    condition_on_previous_text: bool
+        if True, the previous output of the model is provided as a prompt for the next window;
+        disabling may make the text inconsistent across windows, but the model becomes less prone to
+        getting stuck in a failure loop, such as repetition looping or timestamps going out of sync.
+    decode_options: dict
+        Keyword arguments to construct `DecodingOptions` instances
+    Returns
+    -------
+    A dictionary containing the resulting text ("text") and segment-level details ("segments"), and
+    the spoken language ("language"), which is detected when `decode_options["language"]` is None.
+    """
+    dtype = np.float32  # paddle only support float32
+    if dtype == np.float32:
+        decode_options["fp16"] = False
+    # a missing language may arrive either as None or as the literal string "None"
+    if (
+        decode_options.get("language") == "None"
+        or decode_options.get("language", None) is None
+    ):
+        if not model.is_multilingual:
+            decode_options["language"] = "en"
+        else:
+            if verbose:
+                print(
+                    "Detecting language using up to the first 30 seconds. Use `--language` to specify the language"
+                )
+            segment = pad_or_trim(mel, N_FRAMES)
+            _, probs = model.detect_language(segment, resource_path)
+            # pick the language code with the highest probability
+            decode_options["language"] = max(probs, key=probs.get)
+            if verbose is not None:
+                print(
+                    f"Detected language: {LANGUAGES[decode_options['language']].title()}"
+                )
+    language = decode_options["language"]
+    task = decode_options.get("task", "transcribe")
+    tokenizer = get_tokenizer(
+        model.is_multilingual, resource_path=resource_path, language=language, task=task
+    )
+    def decode_with_fallback(segment: paddle.Tensor) -> DecodingResult:
+        # Try each temperature in order and return the first result that passes both
+        # quality checks; if none passes, the result of the last temperature is returned.
+        temperatures = (
+            [temperature] if isinstance(temperature, (int, float)) else temperature
+        )
+        decode_result = None
+        for t in temperatures:
+            kwargs = {**decode_options}
+            if t > 0:
+                # disable beam_size and patience when t > 0
+                kwargs.pop("beam_size", None)
+                kwargs.pop("patience", None)
+            else:
+                # disable best_of when t == 0
+                kwargs.pop("best_of", None)
+            options = DecodingOptions(**kwargs, temperature=t)
+            decode_result = model.decode(segment, options, resource_path)
+            needs_fallback = False
+            if (
+                compression_ratio_threshold is not None
+                and decode_result.compression_ratio > compression_ratio_threshold
+            ):
+                needs_fallback = True  # too repetitive
+            if (
+                logprob_threshold is not None
+                and decode_result.avg_logprob < logprob_threshold
+            ):
+                needs_fallback = True  # average log probability is too low
+            if not needs_fallback:
+                break
+        return decode_result
+    seek = 0  # index of the first mel frame of the current window
+    input_stride = exact_div(
+        N_FRAMES, model.dims.n_audio_ctx
+    )  # mel frames per output token: 2
+    time_precision = (
+        input_stride * HOP_LENGTH / SAMPLE_RATE
+    )  # time per output token: 0.02 (seconds)
+    all_tokens = []
+    all_segments = []
+    # index into all_tokens from which the prompt for the next window starts
+    prompt_reset_since = 0
+    initial_prompt = decode_options.pop("initial_prompt", None)
+    if initial_prompt and initial_prompt != "None":
+        initial_prompt = tokenizer.encode(" " + initial_prompt.strip()).input_ids
+        all_tokens.extend(initial_prompt)
+    else:
+        initial_prompt = []
+    def add_segment(
+        *, start: float, end: float, text_tokens: paddle.Tensor, result: DecodingResult
+    ):
+        # Decode the text tokens (ids below eot) and record one segment entry;
+        # reads `seek` from the enclosing scope at call time.
+        text = tokenizer.decode(
+            [token for token in text_tokens if token < tokenizer.eot]
+        )
+        if len(text.strip()) == 0:  # skip empty text output
+            return
+        all_segments.append(
+            {
+                "id": len(all_segments),
+                "seek": seek,
+                "start": start,
+                "end": end,
+                "text": text,
+                "tokens": result.tokens,
+                "temperature": result.temperature,
+                "avg_logprob": result.avg_logprob,
+                "compression_ratio": result.compression_ratio,
+                "no_speech_prob": result.no_speech_prob,
+            }
+        )
+        if verbose:
+            print(f"[{format_timestamp(start)} --> {format_timestamp(end)}] {text}")
+    # show the progress bar when verbose is False (otherwise the transcribed text will be printed)
+    num_frames = mel.shape[-1]
+    previous_seek_value = seek
+    with tqdm.tqdm(
+        total=num_frames, unit="frames", disable=verbose is not False
+    ) as pbar:
+        while seek < num_frames:
+            timestamp_offset = float(seek * HOP_LENGTH / SAMPLE_RATE)
+            segment = pad_or_trim(mel[:, seek:], N_FRAMES)
+            segment_duration = segment.shape[-1] * HOP_LENGTH / SAMPLE_RATE
+            # tokens decoded since the last prompt reset are fed back as the prompt
+            decode_options["prompt"] = all_tokens[prompt_reset_since:]
+            result: DecodingResult = decode_with_fallback(segment)
+            tokens = paddle.to_tensor(result.tokens)
+            if no_speech_threshold is not None:
+                # no voice activity check
+                should_skip = result.no_speech_prob > no_speech_threshold
+                if (
+                    logprob_threshold is not None
+                    and result.avg_logprob > logprob_threshold
+                ):
+                    # don't skip if the logprob is high enough, despite the no_speech_prob
+                    should_skip = False
+                if should_skip:
+                    seek += segment.shape[
+                        -1
+                    ]  # fast-forward to the next segment boundary
+                    # NOTE(review): this path does not update the progress bar
+                    continue
+            # boolean mask of positions holding timestamp tokens
+            timestamp_tokens: paddle.Tensor = tokens.greater_equal(
+                paddle.to_tensor(tokenizer.timestamp_begin)
+            )
+            # positions where a timestamp token is directly followed by another one
+            consecutive = paddle.where(timestamp_tokens[:-1] & timestamp_tokens[1:])[0]
+            if (
+                len(consecutive) > 0
+            ):  # if the output contains two consecutive timestamp tokens
+                consecutive = paddle.add(consecutive, paddle.to_tensor(1))
+                last_slice = 0
+                for current_slice in consecutive:
+                    # each slice is taken to start and end with a timestamp token
+                    sliced_tokens = tokens[last_slice:current_slice]
+                    start_timestamp_position = (
+                        sliced_tokens[0].item() - tokenizer.timestamp_begin
+                    )
+                    end_timestamp_position = (
+                        sliced_tokens[-1].item() - tokenizer.timestamp_begin
+                    )
+                    add_segment(
+                        start=timestamp_offset
+                        + start_timestamp_position * time_precision,
+                        end=timestamp_offset + end_timestamp_position * time_precision,
+                        text_tokens=sliced_tokens[1:-1],
+                        result=result,
+                    )
+                    last_slice = current_slice
+                # advance to the frame matching the last timestamp that closed a slice
+                last_timestamp_position = (
+                    tokens[last_slice - 1].item() - tokenizer.timestamp_begin
+                )
+                seek += last_timestamp_position * input_stride
+                all_tokens.extend(tokens[: last_slice + 1].tolist())
+            else:
+                duration = segment_duration
+                timestamps = tokens[timestamp_tokens.nonzero().flatten()]
+                if (
+                    len(timestamps) > 0
+                    and timestamps[-1].item() != tokenizer.timestamp_begin
+                ):
+                    # no consecutive timestamps but it has a timestamp; use the last one.
+                    # single timestamp at the end means no speech after the last timestamp.
+                    last_timestamp_position = (
+                        timestamps[-1].item() - tokenizer.timestamp_begin
+                    )
+                    duration = last_timestamp_position * time_precision
+                add_segment(
+                    start=timestamp_offset,
+                    end=timestamp_offset + duration,
+                    text_tokens=tokens,
+                    result=result,
+                )
+                # the whole window is consumed in this case
+                seek += segment.shape[-1]
+                all_tokens.extend(tokens.tolist())
+            if not condition_on_previous_text or result.temperature > 0.5:
+                # do not feed the prompt tokens if a high temperature was used
+                prompt_reset_since = len(all_tokens)
+            # update progress bar
+            pbar.update(min(num_frames, seek) - previous_seek_value)
+            previous_seek_value = seek
+    # the initial prompt tokens are excluded from the returned text
+    return dict(
+        text=tokenizer.decode(all_tokens[len(initial_prompt) :]),
+        segments=all_segments,
+        language=language,
+    )
+class SequenceRanker:
+    def rank(
+        self, tokens: List[List[paddle.Tensor]], sum_logprobs: List[List[float]]
+    ) -> List[int]:
+        """
+        Given a list of groups of samples and their cumulative log probabilities,
+        return the indices of the samples in each group to select as the final result
+        """
+        raise NotImplementedError
+class MaximumLikelihoodRanker(SequenceRanker):
+    """
+    Select the sample with the highest log probabilities, penalized using either
+    a simple length normalization or Google NMT paper's length penalty
+    """
+    def __init__(self, length_penalty: Optional[float]):
+        self.length_penalty = length_penalty
+    def rank(self, tokens: List[List[paddle.Tensor]], sum_logprobs: List[List[float]]):
+        def scores(logprobs, lengths):
+            result = []
+            for logprob, length in zip(logprobs, lengths):
+                if self.length_penalty is None or self.length_penalty == "None":
+                    penalty = length
+                else:
+                    # from the Google NMT paper
+                    penalty = ((5 + length) / 6) ** self.length_penalty
+                result.append(logprob / penalty)
+            return result
+        # get the sequence with the highest score
+        lengths = [[len(t) for t in s] for s in tokens]
+        return [np.argmax(scores(p, l)) for p, l in zip(sum_logprobs, lengths)]
+class TokenDecoder:
+    def reset(self):
+        """Initialize any stateful variables for decoding a new sequence"""
+    def update(
+        self, tokens: paddle.Tensor, logits: paddle.Tensor, sum_logprobs: paddle.Tensor
+    ) -> Tuple[paddle.Tensor, bool]:
+        """Specify how to select the next token, based on the current trace and logits
+        Parameters
+        ----------
+        tokens : Tensor, shape = (n_batch, current_sequence_length)
+            all tokens in the context so far, including the prefix and sot_sequence tokens
+        logits : Tensor, shape = (n_batch, vocab_size)
+            per-token logits of the probability distribution at the current step
+        sum_logprobs : Tensor, shape = (n_batch)
+            cumulative log probabilities for each sequence
+        Returns
+        -------
+        tokens : Tensor, shape = (n_batch, current_sequence_length + 1)
+            the tokens, appended with the selected next token
+        completed : bool
+            True if all sequences has reached the end of text
+        """
+        raise NotImplementedError
+    def finalize(
+        self, tokens: paddle.Tensor, sum_logprobs: paddle.Tensor
+    ) -> Tuple[Sequence[Sequence[paddle.Tensor]], List[List[float]]]:
+        """Finalize search and return the final candidate sequences
+        Parameters
+        ----------
+        tokens : Tensor, shape = (batch_size, beam_size, current_sequence_length)
+            all tokens in the context so far, including the prefix and sot_sequence
+        sum_logprobs : Tensor, shape = (batch_size, beam_size)
+            cumulative log probabilities for each sequence
+        Returns
+        -------
+        tokens : Sequence[Sequence[Tensor]], length = batch_size
+            sequence of Tensors containing candidate token sequences, for each audio input
+        sum_logprobs : List[List[float]], length = batch_size
+            sequence of cumulative log probabilities corresponding to the above
+        """
+        raise NotImplementedError
+class GreedyDecoder(TokenDecoder):
+    """Token decoder that takes the argmax at temperature 0 and samples otherwise."""
+    def __init__(self, temperature: float, eot: int):
+        self.temperature = temperature
+        self.eot = eot
+    def update(
+        self, tokens: paddle.Tensor, logits: paddle.Tensor, sum_logprobs: paddle.Tensor
+    ) -> Tuple[paddle.Tensor, bool]:
+        """Append one token per row to `tokens`; `sum_logprobs` is updated in place.
+        Returns the extended tokens and whether every row now ends with `eot`.
+        """
+        temperature = self.temperature
+        if temperature == 0:
+            next_tokens = paddle.argmax(logits, axis=-1)
+        else:
+            # draw one sample per row from the temperature-scaled distribution
+            next_tokens = paddle.distribution.Categorical(
+                logits=logits / temperature
+            ).sample([1])
+            # collapse the sample result to a 1-D tensor
+            next_tokens = paddle.reshape(
+                next_tokens,
+                [
+                    next_tokens.shape[0] * next_tokens.shape[1],
+                ],
+            )
+        # log probabilities come from the unscaled logits
+        logprobs = paddle.nn.functional.log_softmax(
+            logits, axis=-1, dtype=paddle.float32
+        )
+        current_logprobs = logprobs[paddle.arange(logprobs.shape[0]), next_tokens]
+        # rows whose last token is already eot contribute nothing further
+        sum_logprobs += current_logprobs * paddle.to_tensor(
+            (tokens[:, -1] != self.eot), dtype=paddle.float32
+        )
+        # rows that already ended keep emitting eot
+        next_tokens[tokens[:, -1] == self.eot] = self.eot
+        tokens = paddle.concat([tokens, next_tokens[:, None]], axis=-1)
+        completed = paddle.all((tokens[:, -1] == self.eot))
+        return tokens, completed
+    def finalize(self, tokens: paddle.Tensor, sum_logprobs: paddle.Tensor):
+        """Pad `tokens` with one trailing `eot` and return it with the log-prob sums as a list."""
+        # make sure each sequence has at least one EOT token at the end
+        tokens = paddle.nn.functional.pad(
+            tokens, (0, 1), value=self.eot, data_format="NCL"
+        )
+        return tokens, sum_logprobs.tolist()
+class BeamSearchDecoder(TokenDecoder):
+    def __init__(
+        self,
+        beam_size: int,
+        eot: int,
+        inference: Inference,
+        patience: Optional[float] = None,
+    ):
+        self.beam_size = beam_size
+        self.eot = eot
+        self.inference = inference
+        self.patience = patience or 1.0
+        if patience is None or patience == "None":
+            self.patience = 1.0
+        else:
+            self.patience = patience
+        self.max_candidates: int = round(beam_size * self.patience)
+        self.finished_sequences = None
+        assert (
+            self.max_candidates > 0
+        ), f"Invalid beam size ({beam_size}) or patience ({patience})"
+    def reset(self):
+        self.finished_sequences = None
+    def update(
+        self, tokens: paddle.Tensor, logits: paddle.Tensor, sum_logprobs: paddle.Tensor
+    ) -> Tuple[paddle.Tensor, bool]:
+        if tokens.shape[0] % self.beam_size != 0:
+            raise ValueError(f"{tokens.shape}[0] % {self.beam_size} != 0")
+        batch_size = tokens.shape[0] // self.beam_size
+        if self.finished_sequences is None:  # for the first update
+            self.finished_sequences = [{} for _ in range(batch_size)]
+        logprobs = paddle.nn.functional.log_softmax(logits, axis=-1, dtype="float32")
+        next_tokens, source_indices, finished_sequences = [], [], []
+        for i in range(batch_size):
+            scores, sources, finished = {}, {}, {}
+            # STEP 1: calculate the cumulative log probabilities for possible candidates
+            for j in range(self.beam_size):
+                idx = i * self.beam_size + j
+                prefix = tokens[idx].tolist()
+                logprob, token = paddle.topk(logprobs[idx], k=self.beam_size + 1)
+                for logprob, token in zip(logprob, token):
+                    new_logprob = (sum_logprobs[idx] + logprob).item()
+                    sequence = tuple(prefix + [token.item()])
+                    scores[sequence] = new_logprob
+                    sources[sequence] = idx
+            # STEP 2: rank the candidates and keep the top beam_size sequences for each audio
+            saved = 0
+            for sequence in sorted(scores, key=scores.get, reverse=True):
+                if sequence[-1] == self.eot:
+                    finished[sequence] = scores[sequence]
+                else:
+                    sum_logprobs[len(next_tokens)] = scores[sequence]
+                    next_tokens.append(sequence)
+                    source_indices.append(sources[sequence])
+                    saved += 1
+                    if saved == self.beam_size:
+                        break
+            finished_sequences.append(finished)
+        tokens = paddle.to_tensor(next_tokens)
+        self.inference.rearrange_kv_cache(source_indices)
+        # add newly finished sequences to self.finished_sequences
+        assert len(self.finished_sequences) == len(finished_sequences)
+        for previously_finished, newly_finished in zip(
+            self.finished_sequences, finished_sequences
+        ):
+            for seq in sorted(newly_finished, key=newly_finished.get, reverse=True):
+                if len(previously_finished) >= self.max_candidates:
+                    break  # the candidate list is full
+                previously_finished[seq] = newly_finished[seq]
+        # mark as completed if all audio has enough number of samples
+        completed = all(
+            len(sequences) >= self.max_candidates
+            for sequences in self.finished_sequences
+        )
+        return tokens, completed
+    def finalize(self, preceding_tokens: paddle.Tensor, sum_logprobs: paddle.Tensor):
+        # collect all finished sequences, including patience, and add unfinished ones if not enough
+        sum_logprobs = sum_logprobs.cpu()
+        for i, sequences in enumerate(self.finished_sequences):
+            if (
+                len(sequences) < self.beam_size
+            ):  # when not enough sequences are finished
+                for j in list(np.argsort(sum_logprobs[i]))[::-1]:
+                    sequence = preceding_tokens[i, j].tolist() + [self.eot]
+                    sequences[tuple(sequence)] = sum_logprobs[i][j].item()
+                    if len(sequences) >= self.beam_size:
+                        break
+        tokens: List[List[paddle.Tensor]] = [
+            [paddle.to_tensor(seq) for seq in sequences.keys()]
+            for sequences in self.finished_sequences
+        ]
+        sum_logprobs: List[List[float]] = [
+            list(sequences.values()) for sequences in self.finished_sequences
+        ]
+        return tokens, sum_logprobs
+class LogitFilter:
+    def apply(self, logits: paddle.Tensor, tokens: paddle.Tensor) -> None:
+        """Apply any filtering or masking to logits in-place
+        Parameters
+        ----------
+        logits : Tensor, shape = (n_batch, vocab_size)
+            per-token logits of the probability distribution at the current step
+        tokens : Tensor, shape = (n_batch, current_sequence_length)
+            all tokens in the context so far, including the prefix and sot_sequence tokens
+        """
+        raise NotImplementedError
+class SuppressBlank(LogitFilter):
+    def __init__(self, tokenizer: Tokenizer, sample_begin: int):
+        self.tokenizer = tokenizer
+        self.sample_begin = sample_begin
+    def apply(self, logits: paddle.Tensor, tokens: paddle.Tensor):
+        if tokens.shape[1] == self.sample_begin:
+            logits[:, self.tokenizer.encode(" ").input_ids + [self.tokenizer.eot]] = (
+                -np.inf
+            )
+class SuppressTokens(LogitFilter):
+    def __init__(self, suppress_tokens: Sequence[int]):
+        self.suppress_tokens = list(suppress_tokens)
+    def apply(self, logits: paddle.Tensor, tokens: paddle.Tensor):
+        logits[:, self.suppress_tokens] = -np.inf
+class ApplyTimestampRules(LogitFilter):
+    """Logit filter enforcing the timestamp-token rules, masking `logits` in place."""
+    def __init__(
+        self,
+        tokenizer: Tokenizer,
+        sample_begin: int,
+        max_initial_timestamp_index: Optional[int],
+    ):
+        self.tokenizer = tokenizer
+        self.sample_begin = sample_begin
+        self.max_initial_timestamp_index = max_initial_timestamp_index
+    def apply(self, logits: paddle.Tensor, tokens: paddle.Tensor):
+        # suppress <|notimestamps|> which is handled by without_timestamps
+        if self.tokenizer.no_timestamps is not None:
+            logits[:, self.tokenizer.no_timestamps] = -np.inf
+        # timestamps have to appear in pairs, except directly before EOT; mask logits accordingly
+        for k in range(tokens.shape[0]):
+            # tokens sampled so far for row k (everything after the initial tokens)
+            seq = [t for t in tokens[k, self.sample_begin :].tolist()]
+            last_was_timestamp = (
+                len(seq) >= 1 and seq[-1] >= self.tokenizer.timestamp_begin
+            )
+            # with fewer than two sampled tokens this is treated as True
+            penultimate_was_timestamp = (
+                len(seq) < 2 or seq[-2] >= self.tokenizer.timestamp_begin
+            )
+            if last_was_timestamp:
+                if penultimate_was_timestamp:  # has to be non-timestamp
+                    logits[k, self.tokenizer.timestamp_begin :] = -np.inf
+                else:  # cannot be normal text tokens
+                    logits[k, : self.tokenizer.eot] = -np.inf
+        # apply the `max_initial_timestamp` option
+        if (
+            tokens.shape[1] == self.sample_begin
+            and self.max_initial_timestamp_index is not None
+        ):
+            last_allowed = (
+                self.tokenizer.timestamp_begin + self.max_initial_timestamp_index
+            )
+            logits[:, last_allowed + 1 :] = -np.inf
+        # if sum of probability over timestamps is above any other token, sample timestamp
+        # (log probabilities are computed once here, after the masking above)
+        logprobs = paddle.nn.functional.log_softmax(logits, axis=-1, dtype="float32")
+        for k in range(tokens.shape[0]):
+            # When using paddle.logsumexp on a 32GB Tesla-V100 GPU, we encountered CUDA error 700.
+            # To bypass this issue in CI, we have decomposed the operation into separate steps.
+            # It will raise 2e-6 difference in precision.
+            # TODO: revert this after logsumexp been fixed.
+            timestamp_logprob = paddle.exp(
+                logprobs[k, self.tokenizer.timestamp_begin :]
+            )
+            timestamp_logprob = paddle.sum(timestamp_logprob, axis=-1)
+            timestamp_logprob = paddle.log(timestamp_logprob)
+            max_text_token_logprob = paddle.max(
+                logprobs[k, : self.tokenizer.timestamp_begin]
+            )
+            if timestamp_logprob > max_text_token_logprob:
+                # force a timestamp for this row by masking every non-timestamp token
+                logits[k, : self.tokenizer.timestamp_begin] = -np.inf
+class DecodingTask:
+    inference: Inference
+    sequence_ranker: SequenceRanker
+    decoder: TokenDecoder
+    logit_filters: List[LogitFilter]
+    def __init__(self, model: "Whisper", options: DecodingOptions, resource_path: str):
+        """Validate `options` and assemble the tokenizer, inference wrapper, ranker,
+        token decoder and logit filters used for decoding.
+        Raises ValueError (from `_verify_options`) on incompatible options.
+        """
+        self.model = model
+        # the tokenizer is built for English when no language is given
+        language = options.language or "en"
+        tokenizer = get_tokenizer(
+            model.is_multilingual,
+            resource_path=resource_path,
+            language=language,
+            task=options.task,
+        )
+        self.tokenizer: Tokenizer = tokenizer
+        self.options: DecodingOptions = self._verify_options(options)
+        self.resource_path: str = resource_path
+        # beam_size takes precedence over best_of; 1 when neither is set
+        self.beam_size: int = options.beam_size or options.best_of or 1
+        self.n_ctx: int = model.dims.n_text_ctx
+        self.sample_len: int = options.sample_len or model.dims.n_text_ctx // 2
+        self.sot_sequence: Tuple[int] = tokenizer.sot_sequence
+        if self.options.without_timestamps:
+            self.sot_sequence = tokenizer.sot_sequence_including_notimestamps
+        # must run after sot_sequence, n_ctx and sample_len are set: it reads all three
+        self.initial_tokens: Tuple[int] = self._get_initial_tokens()
+        self.sample_begin: int = len(self.initial_tokens)
+        self.sot_index: int = self.initial_tokens.index(tokenizer.sot)
+        # inference: implements the forward pass through the decoder, including kv caching
+        self.inference = WhisperInference(model, len(self.initial_tokens))
+        # sequence ranker: implements how to rank a group of sampled sequences
+        self.sequence_ranker = MaximumLikelihoodRanker(options.length_penalty)
+        # decoder: implements how to select the next tokens, given the autoregressive distribution
+        if options.beam_size is not None:
+            self.decoder = BeamSearchDecoder(
+                options.beam_size, tokenizer.eot, self.inference, options.patience
+            )
+        else:
+            self.decoder = GreedyDecoder(options.temperature, tokenizer.eot)
+        # logit filters: applies various rules to suppress or penalize certain tokens
+        self.logit_filters = []
+        if self.options.suppress_blank:
+            self.logit_filters.append(SuppressBlank(self.tokenizer, self.sample_begin))
+        if self.options.suppress_tokens:
+            self.logit_filters.append(SuppressTokens(self._get_suppress_tokens()))
+        if not options.without_timestamps:
+            precision = CHUNK_LENGTH / model.dims.n_audio_ctx  # usually 0.02 seconds
+            # stays None when max_initial_timestamp is unset or falsy
+            max_initial_timestamp_index = None
+            if options.max_initial_timestamp:
+                max_initial_timestamp_index = round(
+                    self.options.max_initial_timestamp / precision
+                )
+            self.logit_filters.append(
+                ApplyTimestampRules(
+                    tokenizer, self.sample_begin, max_initial_timestamp_index
+                )
+            )
+    def _verify_options(self, options: DecodingOptions) -> DecodingOptions:
+        if options.beam_size is not None and options.best_of is not None:
+            raise ValueError("beam_size and best_of can't be given together")
+        if options.temperature == 0:
+            if options.best_of is not None:
+                raise ValueError("best_of with greedy sampling (T=0) is not compatible")
+        if options.patience is not None and options.beam_size is None:
+            raise ValueError("patience requires beam_size to be given")
+        if options.length_penalty is not None and options.length_penalty != "None":
+            if not (0 <= options.length_penalty <= 1):
+                raise ValueError(
+                    "length_penalty (alpha) should be a value between 0 and 1"
+                )
+        return options
+    def _get_initial_tokens(self) -> Tuple[int]:
+        tokens = list(self.sot_sequence)
+        prefix = self.options.prefix
+        prompt = self.options.prompt
+        if prefix:
+            prefix_tokens = (
+                self.tokenizer.encode(" " + prefix.strip().input_ids)
+                if isinstance(prefix, str)
+                else prefix
+            )
+            if self.sample_len is not None:
+                max_prefix_len = self.n_ctx // 2 - self.sample_len
+                prefix_tokens = prefix_tokens[-max_prefix_len:]
+            tokens = tokens + prefix_tokens
+        if prompt:
+            prompt_tokens = (
+                self.tokenizer.encode(" " + prompt.strip().input_ids)
+                if isinstance(prompt, str)
+                else prompt
+            )
+            tokens = (
+                [self.tokenizer.sot_prev]
+                + prompt_tokens[-(self.n_ctx // 2 - 1) :]
+                + tokens
+            )
+        return tuple(tokens)
+    def _get_suppress_tokens(self) -> Tuple[int]:
+        suppress_tokens = self.options.suppress_tokens
+        if isinstance(suppress_tokens, str):
+            suppress_tokens = [int(t) for t in suppress_tokens.split(",")]
+        if -1 in suppress_tokens:
+            suppress_tokens = [t for t in suppress_tokens if t >= 0]
+            suppress_tokens.extend(self.tokenizer.non_speech_tokens)
+        elif suppress_tokens is None or len(suppress_tokens) == 0:
+            suppress_tokens = []  # interpret empty string as an empty list
+        else:
+            assert isinstance(suppress_tokens, list), "suppress_tokens must be a list"
+        suppress_tokens.extend(
+            [self.tokenizer.sot, self.tokenizer.sot_prev, self.tokenizer.sot_lm]
+        )
+        if self.tokenizer.no_speech is not None:
+            # no-speech probability is collected separately
+            suppress_tokens.append(self.tokenizer.no_speech)
+        return tuple(sorted(set(suppress_tokens)))
+    def _get_audio_features(self, mel: paddle.Tensor):
+        """
+        Return encoder features for `mel`.
+        If the last two dimensions of `mel` already equal
+        (n_audio_ctx, n_audio_state) it is taken to be encoder output and returned
+        unchanged; otherwise it is passed through `self.model.encoder`.
+        """
+        encoded_shape = (
+            self.model.dims.n_audio_ctx,
+            self.model.dims.n_audio_state,
+        )
+        # Tensor.shape is a list in Paddle and a list never compares equal to a
+        # tuple, so normalise before comparing
+        if tuple(mel.shape[-2:]) == encoded_shape:
+            # encoded audio features are given; skip audio encoding
+            return mel
+        return self.model.encoder(mel)
+    def _detect_language(
+        self, audio_features: paddle.Tensor, tokens: paddle.Tensor, resource_path: str
+    ):
+        """
+        Decide the language of every item in the batch.
+        When `options.language` is None or the task is "lang_id", the model's
+        `detect_language` is called with `resource_path` and the most probable
+        language of each item is used; otherwise `options.language` is repeated for
+        the whole batch. If `options.language` is None the detected language tokens
+        are also written into `tokens` in place, at position `sot_index + 1`.
+        Returns (languages, lang_probs); lang_probs is None when no detection ran.
+        """
+        languages = [self.options.language] * audio_features.shape[0]
+        lang_probs = None
+        if self.options.language is None or self.options.task == "lang_id":
+            # honour the path handed in by the caller instead of ignoring it
+            lang_tokens, lang_probs = self.model.detect_language(
+                audio_features, self.tokenizer, resource_path
+            )
+            languages = [max(probs, key=probs.get) for probs in lang_probs]
+            if self.options.language is None:
+                tokens[:, self.sot_index + 1] = lang_tokens  # write language tokens
+        return languages, lang_probs
+    def _main_loop(self, audio_features: paddle.Tensor, tokens: paddle.Tensor):
+        """
+        Run the sampling loop for at most `self.sample_len` steps.
+        Each step computes logits, keeps those of the last position, applies every
+        logit filter and lets the decoder append the next tokens. The loop stops
+        early when the decoder reports completion or the sequence grows past
+        `self.n_ctx`. The inference cache is cleaned up even if a step raises.
+        Returns (tokens, sum_logprobs, no_speech_probs); no_speech_probs stays NaN
+        for every item when the tokenizer has no no_speech token.
+        """
+        assert audio_features.shape[0] == tokens.shape[0]
+        n_batch = tokens.shape[0]
+        # pass the shape as a plain list; there is no need to wrap the int in a tensor
+        sum_logprobs: paddle.Tensor = paddle.zeros([n_batch], dtype=paddle.float32)
+        no_speech_probs = [np.nan] * n_batch
+        try:
+            for i in range(self.sample_len):
+                logits = self.inference.logits(tokens, audio_features)
+                if (
+                    i == 0 and self.tokenizer.no_speech is not None
+                ):  # save no_speech_probs
+                    probs_at_sot = paddle.nn.functional.softmax(
+                        logits[:, self.sot_index], axis=-1, dtype=paddle.float32
+                    )
+                    no_speech_probs = probs_at_sot[:, self.tokenizer.no_speech].tolist()
+                # now we need to consider the logits at the last token only
+                logits = logits[:, -1]
+                # apply the logit filters, e.g. for suppressing tokens or applying a penalty
+                for logit_filter in self.logit_filters:
+                    logit_filter.apply(logits, tokens)
+                # expand the tokens tensor with the selected next tokens
+                tokens, completed = self.decoder.update(tokens, logits, sum_logprobs)
+                if completed or tokens.shape[-1] > self.n_ctx:
+                    break
+        finally:
+            self.inference.cleanup_caching()
+        return tokens, sum_logprobs, no_speech_probs
+    @paddle.no_grad()
+    def run(self, mel: paddle.Tensor) -> List[DecodingResult]:
+        """
+        Decode a batch of audio segments and return one `DecodingResult` per segment.
+        Steps: encode `mel`, build one initial token row per segment, detect the
+        language if requested, repeat every row `beam_size` times, run the sampling
+        loop, then pick the top-ranked candidate of each group. For the "lang_id"
+        task only the language information is returned and no text is decoded.
+        Raises RuntimeError if the per-segment result lists differ in length.
+        """
+        self.decoder.reset()
+        tokenizer: Tokenizer = self.tokenizer
+        batch_size: int = mel.shape[0]
+        audio_features: paddle.Tensor = self._get_audio_features(
+            mel
+        )  # encoder forward pass
+        # one copy of the initial token sequence per audio segment, for any batch size
+        tokens: paddle.Tensor = paddle.to_tensor([self.initial_tokens] * batch_size)
+        # detect language if requested, overwriting the language token; `tokens` is
+        # passed as-is because paddle.to_tensor(tensor) returns a copy, which would
+        # silently discard the in-place write
+        languages, language_probs = self._detect_language(
+            audio_features,
+            tokens,
+            self.resource_path,
+        )
+        if self.options.task == "lang_id":
+            return [
+                DecodingResult(
+                    audio_features=features, language=language, language_probs=probs
+                )
+                for features, language, probs in zip(
+                    audio_features, languages, language_probs
+                )
+            ]
+        # repeat the audio & text tensors by the group size, for beam search or best-of-n sampling
+        audio_features = paddle.repeat_interleave(
+            audio_features, self.beam_size, axis=0
+        )
+        tokens = paddle.repeat_interleave(tokens, self.beam_size, axis=0)
+        # call the main sampling loop
+        tokens, sum_logprobs, no_speech_probs = self._main_loop(audio_features, tokens)
+        # reshape the tensors to have (batch_size, beam_size) as the first two dimensions
+        audio_features = audio_features[:: self.beam_size]
+        no_speech_probs = no_speech_probs[:: self.beam_size]
+        assert audio_features.shape[0] == len(no_speech_probs) == batch_size
+        tokens = tokens.reshape([batch_size, self.beam_size, -1])
+        sum_logprobs = sum_logprobs.reshape([batch_size, self.beam_size])
+        # get the final candidates for each group, and slice between the first sampled token and EOT
+        tokens, sum_logprobs = self.decoder.finalize(tokens, sum_logprobs)
+        tokens: List[List[paddle.Tensor]] = [
+            [t[self.sample_begin : (t == tokenizer.eot).nonzero()[0, 0]] for t in s]
+            for s in tokens
+        ]
+        # select the top-ranked sample in each group
+        selected = self.sequence_ranker.rank(tokens, sum_logprobs)
+        tokens: List[List[int]] = [t[i].tolist() for i, t in zip(selected, tokens)]
+        texts: List[str] = [tokenizer.decode(t).strip() for t in tokens]
+        sum_logprobs: List[float] = [lp[i] for i, lp in zip(selected, sum_logprobs)]
+        avg_logprobs: List[float] = [
+            lp / (len(t) + 1) for t, lp in zip(tokens, sum_logprobs)
+        ]
+        fields = (
+            texts,
+            languages,
+            tokens,
+            audio_features,
+            avg_logprobs,
+            no_speech_probs,
+        )
+        if len(set(map(len, fields))) != 1:
+            raise RuntimeError(f"inconsistent result lengths: {list(map(len, fields))}")
+        return [
+            DecodingResult(
+                audio_features=features,
+                language=language,
+                tokens=tokens,
+                text=text,
+                avg_logprob=avg_logprob,
+                no_speech_prob=no_speech_prob,
+                temperature=self.options.temperature,
+                compression_ratio=compression_ratio(text),
+            )
+            for text, language, tokens, features, avg_logprob, no_speech_prob in zip(
+                *fields
+            )
+        ]
+@paddle.no_grad()
+def decode(
+    model: "Whisper",
+    mel: paddle.Tensor,
+    options: DecodingOptions = DecodingOptions(),
+    resource_path: str = None,
+) -> Union[DecodingResult, List[DecodingResult]]:
+    """
+    Performs decoding of 30-second audio segment(s), provided as Mel spectrogram(s).
+    Parameters
+    ----------
+    model: Whisper
+        the Whisper model instance
+    mel: paddle.Tensor, shape = (80, 3000) or (*, 80, 3000)
+        A tensor containing the Mel spectrogram(s)
+    options: DecodingOptions
+        A dataclass that contains all necessary options for decoding 30-second segments
+    resource_path: str
+        Path handed on to `DecodingTask` together with the model and the options
+    Returns
+    -------
+    result: Union[DecodingResult, List[DecodingResult]]
+        The result(s) of decoding contained in `DecodingResult` dataclass instance(s);
+        a single result when `mel` is 2-D, otherwise a list with one entry per segment
+    """
+    single = mel.ndim == 2
+    if single:
+        # add a batch dimension so the task always sees a batch
+        mel = mel.unsqueeze(0)
+    result = DecodingTask(model, options, resource_path).run(mel)
+    if single:
+        result = result[0]
+    return result
+class Whisper(paddle.nn.Layer):
+    """
+    Speech model made of an `AudioEncoder` feeding a `TextDecoder`; the module-level
+    `detect_language`, `transcribe` and `decode` functions are attached as methods.
+    """
+    def __init__(self, dims: ModelDimensions):
+        super().__init__()
+        self.dims = dims
+        # both sub-networks are sized from the same dimensions object
+        self.encoder = AudioEncoder(
+            dims.n_mels,
+            dims.n_audio_ctx,
+            dims.n_audio_state,
+            dims.n_audio_head,
+            dims.n_audio_layer,
+        )
+        self.decoder = TextDecoder(
+            dims.n_vocab,
+            dims.n_text_ctx,
+            dims.n_text_state,
+            dims.n_text_head,
+            dims.n_text_layer,
+        )
+    def embed_audio(self, mel: paddle.Tensor):
+        """Run the encoder's `forward` on `mel` and return its output."""
+        return self.encoder.forward(mel)
+    def logits(self, tokens: paddle.Tensor, audio_features: paddle.Tensor):
+        """Run the decoder's `forward` on `tokens` and the given audio features."""
+        return self.decoder.forward(tokens, audio_features)
+    def forward(
+        self, mel: paddle.Tensor, tokens: paddle.Tensor
+    ) -> Dict[str, paddle.Tensor]:
+        """Encode `mel`, then decode `tokens` against the encoded audio."""
+        encoded = self.encoder(mel)
+        return self.decoder(tokens, encoded)
+    @property
+    def device(self):
+        """The device reported by `paddle.device.get_device()`."""
+        return paddle.device.get_device()
+    @property
+    def is_multilingual(self):
+        """True when the vocabulary size is 51865."""
+        return self.dims.n_vocab == 51865
+    def install_kv_cache_hooks(self, cache: Optional[dict] = None):
+        """
+        Register forward post-hooks on the key and value projections of every
+        `MultiHeadAttention` layer in the decoder, so that their outputs are kept
+        in a dictionary and can be reused for later positions.
+        Returns
+        -------
+        cache : Dict[nn.Layer, paddle.Tensor]
+            A dictionary mapping each key/value projection module to its cached output
+            (a shallow copy of the `cache` argument when one is given)
+        hooks : list
+            The handles returned by `register_forward_post_hook`, one per hooked module
+        """
+        cache = {} if cache is None else dict(cache)
+        hooks = []
+        def save_to_cache(module, _, output):
+            if (
+                module in cache
+                and output.shape[1] <= self.decoder.positional_embedding.shape[0]
+            ):
+                # a later position: append to what is already stored
+                cache[module] = paddle.concat([cache[module], output], axis=1).detach()
+            else:
+                # save as-is, for the first token or cross attention
+                cache[module] = output
+            return cache[module]
+        def install_hooks(layer: paddle.nn.Layer):
+            if not isinstance(layer, MultiHeadAttention):
+                return
+            for projection in (layer.key, layer.value):
+                hooks.append(projection.register_forward_post_hook(save_to_cache))
+        self.decoder.apply(install_hooks)
+        return cache, hooks
+    detect_language = detect_language
+    transcribe = transcribe
+    decode = decode
+def pad_or_trim(array, length: int = N_SAMPLES, *, axis: int = -1):
+    """
+    Pad or trim `array` along `axis` so that it has exactly `length` entries there
+    (N_SAMPLES by default, as expected by the encoder).
+    Longer input keeps its first `length` entries; shorter input is zero-padded at
+    the end. Works for paddle tensors and NumPy arrays of any rank and returns the
+    same kind of object it was given.
+    """
+    is_tensor = paddle.is_tensor(array)
+    current = array.shape[axis]
+    if current > length:
+        if is_tensor:
+            return array.index_select(axis=axis, index=paddle.arange(length))
+        return array.take(indices=range(length), axis=axis)
+    if current < length:
+        pad_widths = [(0, 0)] * array.ndim
+        pad_widths[axis] = (0, length - current)
+        if is_tensor:
+            # with 2 * ndim entries, constant-mode padding reads (before, after)
+            # pairs from the first axis to the last, so no transposing is needed
+            return paddle.nn.functional.pad(
+                array, [pad for sizes in pad_widths for pad in sizes]
+            )
+        return np.pad(array, pad_widths)
+    return array
+def hann_window(n_fft: int = N_FFT):
+    """
+    Build a Hann window as a float32 tensor.
+    n_fft:  The number of points in the window; point n has the value
+            0.5 - 0.5 * cos(2 * pi * n / n_fft).
+    """
+    samples = []
+    for n in range(n_fft):
+        phase = 2 * np.pi * n / n_fft
+        samples.append(0.5 - 0.5 * np.cos(phase))
+    return paddle.to_tensor(samples, dtype=paddle.float32)
+@lru_cache(maxsize=None)
+def mel_filters(resource_path: str, n_mels: int = N_MELS) -> paddle.Tensor:
+    """
+    Load the Mel filterbank matrix used to project an STFT onto a Mel spectrogram.
+    The matrix is read from `<resource_path>/assets/mel_filters.npz` and the result
+    is cached per (resource_path, n_mels). Only n_mels == 80 is accepted.
+    Shipping the matrix as a file avoids a librosa dependency; it was saved using:
+        np.savez_compressed(
+            "mel_filters.npz",
+            mel_80=librosa.filters.mel(sr=16000, n_fft=400, n_mels=80),
+        )
+    """
+    assert n_mels == 80, f"Unsupported n_mels: {n_mels}"
+    filters_file = os.path.join(resource_path, "assets", "mel_filters.npz")
+    with np.load(filters_file) as archive:
+        filterbank = archive[f"mel_{n_mels}"]
+        return paddle.to_tensor(filterbank)
+def log_mel_spectrogram(
+    audio: Union[str, np.ndarray, paddle.Tensor],
+    n_mels: int = N_MELS,
+    resource_path: str = None,
+):
+    """
+    Compute the log-Mel spectrogram of an audio waveform.
+    Parameters
+    ----------
+    audio: Union[str, np.ndarray, paddle.Tensor], shape = (*)
+        The path to audio or either a NumPy array or Tensor containing the audio waveform in 16 kHz;
+        when a path is given only the first channel of the file is used
+    n_mels: int
+        The number of Mel-frequency filters, only 80 is supported
+    resource_path: str
+        Directory passed to `mel_filters` to locate the filterbank file
+    Returns
+    -------
+    paddle.Tensor, shape = (80, n_frames)
+        A Tensor that contains the Mel spectrogram
+    """
+    if isinstance(audio, str):
+        samples, _ = soundfile.read(audio, dtype="float32", always_2d=True)
+        audio = samples[:, 0]
+    if not paddle.is_tensor(audio):
+        audio = paddle.to_tensor(audio)
+    stft = paddle.signal.stft(audio, N_FFT, HOP_LENGTH, window=hann_window(N_FFT))
+    # power spectrum, leaving out the last frame
+    power = stft[:, :-1].abs() ** 2
+    mel_spec = mel_filters(resource_path, n_mels) @ power
+    # rebuild the tensor from plain Python numbers, exactly as before
+    mel_spec = paddle.to_tensor(mel_spec.numpy().tolist())
+    log_spec = paddle.clip(mel_spec, min=1e-10).log10()
+    # limit the range to 8 (log10 units) below the maximum, then rescale
+    floor = log_spec.max() - 8.0
+    log_spec = paddle.maximum(log_spec, floor)
+    return (log_spec + 4.0) / 4.0

paddlex 2.1.0__py3-none-any.whl → 3.0.0rc0__py3-none-any.whl

paddlex 2.1.0__py3-none-any.whl → 3.0.0rc0__py3-none-any.whl