paddlex 2.0.0rc4__py3-none-any.whl → 3.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (1533)
  1. paddlex/.version +1 -0
  2. paddlex/__init__.py +35 -18
  3. paddlex/__main__.py +39 -0
  4. paddlex/configs/modules/3d_bev_detection/BEVFusion.yaml +38 -0
  5. paddlex/configs/modules/chart_parsing/PP-Chart2Table.yaml +13 -0
  6. paddlex/configs/modules/doc_text_orientation/PP-LCNet_x1_0_doc_ori.yaml +41 -0
  7. paddlex/configs/modules/doc_vlm/PP-DocBee-2B.yaml +14 -0
  8. paddlex/configs/modules/doc_vlm/PP-DocBee-7B.yaml +14 -0
  9. paddlex/configs/modules/doc_vlm/PP-DocBee2-3B.yaml +14 -0
  10. paddlex/configs/modules/face_detection/BlazeFace-FPN-SSH.yaml +40 -0
  11. paddlex/configs/modules/face_detection/BlazeFace.yaml +40 -0
  12. paddlex/configs/modules/face_detection/PP-YOLOE_plus-S_face.yaml +40 -0
  13. paddlex/configs/modules/face_detection/PicoDet_LCNet_x2_5_face.yaml +40 -0
  14. paddlex/configs/modules/face_feature/MobileFaceNet.yaml +41 -0
  15. paddlex/configs/modules/face_feature/ResNet50_face.yaml +41 -0
  16. paddlex/configs/modules/formula_recognition/LaTeX_OCR_rec.yaml +40 -0
  17. paddlex/configs/modules/formula_recognition/PP-FormulaNet-L.yaml +40 -0
  18. paddlex/configs/modules/formula_recognition/PP-FormulaNet-S.yaml +40 -0
  19. paddlex/configs/modules/formula_recognition/PP-FormulaNet_plus-L.yaml +40 -0
  20. paddlex/configs/modules/formula_recognition/PP-FormulaNet_plus-M.yaml +40 -0
  21. paddlex/configs/modules/formula_recognition/PP-FormulaNet_plus-S.yaml +40 -0
  22. paddlex/configs/modules/formula_recognition/UniMERNet.yaml +40 -0
  23. paddlex/configs/modules/human_detection/PP-YOLOE-L_human.yaml +42 -0
  24. paddlex/configs/modules/human_detection/PP-YOLOE-S_human.yaml +42 -0
  25. paddlex/configs/modules/image_anomaly_detection/STFPM.yaml +41 -0
  26. paddlex/configs/modules/image_classification/CLIP_vit_base_patch16_224.yaml +41 -0
  27. paddlex/configs/modules/image_classification/CLIP_vit_large_patch14_224.yaml +41 -0
  28. paddlex/configs/modules/image_classification/ConvNeXt_base_224.yaml +41 -0
  29. paddlex/configs/modules/image_classification/ConvNeXt_base_384.yaml +41 -0
  30. paddlex/configs/modules/image_classification/ConvNeXt_large_224.yaml +41 -0
  31. paddlex/configs/modules/image_classification/ConvNeXt_large_384.yaml +41 -0
  32. paddlex/configs/modules/image_classification/ConvNeXt_small.yaml +41 -0
  33. paddlex/configs/modules/image_classification/ConvNeXt_tiny.yaml +41 -0
  34. paddlex/configs/modules/image_classification/FasterNet-L.yaml +40 -0
  35. paddlex/configs/modules/image_classification/FasterNet-M.yaml +40 -0
  36. paddlex/configs/modules/image_classification/FasterNet-S.yaml +40 -0
  37. paddlex/configs/modules/image_classification/FasterNet-T0.yaml +40 -0
  38. paddlex/configs/modules/image_classification/FasterNet-T1.yaml +40 -0
  39. paddlex/configs/modules/image_classification/FasterNet-T2.yaml +40 -0
  40. paddlex/configs/modules/image_classification/MobileNetV1_x0_25.yaml +41 -0
  41. paddlex/configs/modules/image_classification/MobileNetV1_x0_5.yaml +41 -0
  42. paddlex/configs/modules/image_classification/MobileNetV1_x0_75.yaml +41 -0
  43. paddlex/configs/modules/image_classification/MobileNetV1_x1_0.yaml +41 -0
  44. paddlex/configs/modules/image_classification/MobileNetV2_x0_25.yaml +41 -0
  45. paddlex/configs/modules/image_classification/MobileNetV2_x0_5.yaml +41 -0
  46. paddlex/configs/modules/image_classification/MobileNetV2_x1_0.yaml +41 -0
  47. paddlex/configs/modules/image_classification/MobileNetV2_x1_5.yaml +41 -0
  48. paddlex/configs/modules/image_classification/MobileNetV2_x2_0.yaml +41 -0
  49. paddlex/configs/modules/image_classification/MobileNetV3_large_x0_35.yaml +41 -0
  50. paddlex/configs/modules/image_classification/MobileNetV3_large_x0_5.yaml +41 -0
  51. paddlex/configs/modules/image_classification/MobileNetV3_large_x0_75.yaml +41 -0
  52. paddlex/configs/modules/image_classification/MobileNetV3_large_x1_0.yaml +41 -0
  53. paddlex/configs/modules/image_classification/MobileNetV3_large_x1_25.yaml +41 -0
  54. paddlex/configs/modules/image_classification/MobileNetV3_small_x0_35.yaml +41 -0
  55. paddlex/configs/modules/image_classification/MobileNetV3_small_x0_5.yaml +41 -0
  56. paddlex/configs/modules/image_classification/MobileNetV3_small_x0_75.yaml +41 -0
  57. paddlex/configs/modules/image_classification/MobileNetV3_small_x1_0.yaml +41 -0
  58. paddlex/configs/modules/image_classification/MobileNetV3_small_x1_25.yaml +41 -0
  59. paddlex/configs/modules/image_classification/MobileNetV4_conv_large.yaml +41 -0
  60. paddlex/configs/modules/image_classification/MobileNetV4_conv_medium.yaml +41 -0
  61. paddlex/configs/modules/image_classification/MobileNetV4_conv_small.yaml +41 -0
  62. paddlex/configs/modules/image_classification/MobileNetV4_hybrid_large.yaml +41 -0
  63. paddlex/configs/modules/image_classification/MobileNetV4_hybrid_medium.yaml +41 -0
  64. paddlex/configs/modules/image_classification/PP-HGNetV2-B0.yaml +41 -0
  65. paddlex/configs/modules/image_classification/PP-HGNetV2-B1.yaml +41 -0
  66. paddlex/configs/modules/image_classification/PP-HGNetV2-B2.yaml +41 -0
  67. paddlex/configs/modules/image_classification/PP-HGNetV2-B3.yaml +41 -0
  68. paddlex/configs/modules/image_classification/PP-HGNetV2-B4.yaml +41 -0
  69. paddlex/configs/modules/image_classification/PP-HGNetV2-B5.yaml +41 -0
  70. paddlex/configs/modules/image_classification/PP-HGNetV2-B6.yaml +41 -0
  71. paddlex/configs/modules/image_classification/PP-HGNet_base.yaml +41 -0
  72. paddlex/configs/modules/image_classification/PP-HGNet_small.yaml +41 -0
  73. paddlex/configs/modules/image_classification/PP-HGNet_tiny.yaml +41 -0
  74. paddlex/configs/modules/image_classification/PP-LCNetV2_base.yaml +41 -0
  75. paddlex/configs/modules/image_classification/PP-LCNetV2_large.yaml +41 -0
  76. paddlex/configs/modules/image_classification/PP-LCNetV2_small.yaml +41 -0
  77. paddlex/configs/modules/image_classification/PP-LCNet_x0_25.yaml +41 -0
  78. paddlex/configs/modules/image_classification/PP-LCNet_x0_35.yaml +41 -0
  79. paddlex/configs/modules/image_classification/PP-LCNet_x0_5.yaml +41 -0
  80. paddlex/configs/modules/image_classification/PP-LCNet_x0_75.yaml +41 -0
  81. paddlex/configs/modules/image_classification/PP-LCNet_x1_0.yaml +41 -0
  82. paddlex/configs/modules/image_classification/PP-LCNet_x1_5.yaml +41 -0
  83. paddlex/configs/modules/image_classification/PP-LCNet_x2_0.yaml +41 -0
  84. paddlex/configs/modules/image_classification/PP-LCNet_x2_5.yaml +41 -0
  85. paddlex/configs/modules/image_classification/ResNet101.yaml +41 -0
  86. paddlex/configs/modules/image_classification/ResNet101_vd.yaml +41 -0
  87. paddlex/configs/modules/image_classification/ResNet152.yaml +41 -0
  88. paddlex/configs/modules/image_classification/ResNet152_vd.yaml +41 -0
  89. paddlex/configs/modules/image_classification/ResNet18.yaml +41 -0
  90. paddlex/configs/modules/image_classification/ResNet18_vd.yaml +41 -0
  91. paddlex/configs/modules/image_classification/ResNet200_vd.yaml +41 -0
  92. paddlex/configs/modules/image_classification/ResNet34.yaml +41 -0
  93. paddlex/configs/modules/image_classification/ResNet34_vd.yaml +41 -0
  94. paddlex/configs/modules/image_classification/ResNet50.yaml +41 -0
  95. paddlex/configs/modules/image_classification/ResNet50_vd.yaml +41 -0
  96. paddlex/configs/modules/image_classification/StarNet-S1.yaml +41 -0
  97. paddlex/configs/modules/image_classification/StarNet-S2.yaml +41 -0
  98. paddlex/configs/modules/image_classification/StarNet-S3.yaml +41 -0
  99. paddlex/configs/modules/image_classification/StarNet-S4.yaml +41 -0
  100. paddlex/configs/modules/image_classification/SwinTransformer_base_patch4_window12_384.yaml +41 -0
  101. paddlex/configs/modules/image_classification/SwinTransformer_base_patch4_window7_224.yaml +41 -0
  102. paddlex/configs/modules/image_classification/SwinTransformer_large_patch4_window12_384.yaml +41 -0
  103. paddlex/configs/modules/image_classification/SwinTransformer_large_patch4_window7_224.yaml +41 -0
  104. paddlex/configs/modules/image_classification/SwinTransformer_small_patch4_window7_224.yaml +41 -0
  105. paddlex/configs/modules/image_classification/SwinTransformer_tiny_patch4_window7_224.yaml +41 -0
  106. paddlex/configs/modules/image_feature/PP-ShiTuV2_rec.yaml +42 -0
  107. paddlex/configs/modules/image_feature/PP-ShiTuV2_rec_CLIP_vit_base.yaml +42 -0
  108. paddlex/configs/modules/image_feature/PP-ShiTuV2_rec_CLIP_vit_large.yaml +41 -0
  109. paddlex/configs/modules/image_multilabel_classification/CLIP_vit_base_patch16_448_ML.yaml +41 -0
  110. paddlex/configs/modules/image_multilabel_classification/PP-HGNetV2-B0_ML.yaml +41 -0
  111. paddlex/configs/modules/image_multilabel_classification/PP-HGNetV2-B4_ML.yaml +41 -0
  112. paddlex/configs/modules/image_multilabel_classification/PP-HGNetV2-B6_ML.yaml +41 -0
  113. paddlex/configs/modules/image_multilabel_classification/PP-LCNet_x1_0_ML.yaml +41 -0
  114. paddlex/configs/modules/image_multilabel_classification/ResNet50_ML.yaml +41 -0
  115. paddlex/configs/modules/image_unwarping/UVDoc.yaml +12 -0
  116. paddlex/configs/modules/instance_segmentation/Cascade-MaskRCNN-ResNet50-FPN.yaml +40 -0
  117. paddlex/configs/modules/instance_segmentation/Cascade-MaskRCNN-ResNet50-vd-SSLDv2-FPN.yaml +40 -0
  118. paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-H.yaml +40 -0
  119. paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-L.yaml +40 -0
  120. paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-M.yaml +40 -0
  121. paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-S.yaml +40 -0
  122. paddlex/configs/modules/instance_segmentation/Mask-RT-DETR-X.yaml +40 -0
  123. paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNeXt101-vd-FPN.yaml +39 -0
  124. paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet101-FPN.yaml +40 -0
  125. paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet101-vd-FPN.yaml +40 -0
  126. paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet50-FPN.yaml +40 -0
  127. paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet50-vd-FPN.yaml +40 -0
  128. paddlex/configs/modules/instance_segmentation/MaskRCNN-ResNet50.yaml +40 -0
  129. paddlex/configs/modules/instance_segmentation/PP-YOLOE_seg-S.yaml +40 -0
  130. paddlex/configs/modules/instance_segmentation/SOLOv2.yaml +40 -0
  131. paddlex/configs/modules/keypoint_detection/PP-TinyPose_128x96.yaml +40 -0
  132. paddlex/configs/modules/keypoint_detection/PP-TinyPose_256x192.yaml +40 -0
  133. paddlex/configs/modules/layout_detection/PP-DocBlockLayout.yaml +40 -0
  134. paddlex/configs/modules/layout_detection/PP-DocLayout-L.yaml +40 -0
  135. paddlex/configs/modules/layout_detection/PP-DocLayout-M.yaml +40 -0
  136. paddlex/configs/modules/layout_detection/PP-DocLayout-S.yaml +40 -0
  137. paddlex/configs/modules/layout_detection/PP-DocLayout_plus-L.yaml +40 -0
  138. paddlex/configs/modules/layout_detection/PicoDet-L_layout_17cls.yaml +40 -0
  139. paddlex/configs/modules/layout_detection/PicoDet-L_layout_3cls.yaml +40 -0
  140. paddlex/configs/modules/layout_detection/PicoDet-S_layout_17cls.yaml +40 -0
  141. paddlex/configs/modules/layout_detection/PicoDet-S_layout_3cls.yaml +40 -0
  142. paddlex/configs/modules/layout_detection/PicoDet_layout_1x.yaml +40 -0
  143. paddlex/configs/modules/layout_detection/PicoDet_layout_1x_table.yaml +40 -0
  144. paddlex/configs/modules/layout_detection/RT-DETR-H_layout_17cls.yaml +40 -0
  145. paddlex/configs/modules/layout_detection/RT-DETR-H_layout_3cls.yaml +40 -0
  146. paddlex/configs/modules/mainbody_detection/PP-ShiTuV2_det.yaml +41 -0
  147. paddlex/configs/modules/multilingual_speech_recognition/whisper_base.yaml +12 -0
  148. paddlex/configs/modules/multilingual_speech_recognition/whisper_large.yaml +12 -0
  149. paddlex/configs/modules/multilingual_speech_recognition/whisper_medium.yaml +12 -0
  150. paddlex/configs/modules/multilingual_speech_recognition/whisper_small.yaml +12 -0
  151. paddlex/configs/modules/multilingual_speech_recognition/whisper_tiny.yaml +12 -0
  152. paddlex/configs/modules/object_detection/Cascade-FasterRCNN-ResNet50-FPN.yaml +41 -0
  153. paddlex/configs/modules/object_detection/Cascade-FasterRCNN-ResNet50-vd-SSLDv2-FPN.yaml +42 -0
  154. paddlex/configs/modules/object_detection/CenterNet-DLA-34.yaml +41 -0
  155. paddlex/configs/modules/object_detection/CenterNet-ResNet50.yaml +41 -0
  156. paddlex/configs/modules/object_detection/Co-DINO-R50.yaml +40 -0
  157. paddlex/configs/modules/object_detection/Co-DINO-Swin-L.yaml +40 -0
  158. paddlex/configs/modules/object_detection/Co-Deformable-DETR-R50.yaml +40 -0
  159. paddlex/configs/modules/object_detection/Co-Deformable-DETR-Swin-T.yaml +40 -0
  160. paddlex/configs/modules/object_detection/DETR-R50.yaml +42 -0
  161. paddlex/configs/modules/object_detection/FCOS-ResNet50.yaml +41 -0
  162. paddlex/configs/modules/object_detection/FasterRCNN-ResNeXt101-vd-FPN.yaml +42 -0
  163. paddlex/configs/modules/object_detection/FasterRCNN-ResNet101-FPN.yaml +42 -0
  164. paddlex/configs/modules/object_detection/FasterRCNN-ResNet101.yaml +42 -0
  165. paddlex/configs/modules/object_detection/FasterRCNN-ResNet34-FPN.yaml +42 -0
  166. paddlex/configs/modules/object_detection/FasterRCNN-ResNet50-FPN.yaml +42 -0
  167. paddlex/configs/modules/object_detection/FasterRCNN-ResNet50-vd-FPN.yaml +42 -0
  168. paddlex/configs/modules/object_detection/FasterRCNN-ResNet50-vd-SSLDv2-FPN.yaml +42 -0
  169. paddlex/configs/modules/object_detection/FasterRCNN-ResNet50.yaml +42 -0
  170. paddlex/configs/modules/object_detection/FasterRCNN-Swin-Tiny-FPN.yaml +42 -0
  171. paddlex/configs/modules/object_detection/PP-YOLOE_plus-L.yaml +40 -0
  172. paddlex/configs/modules/object_detection/PP-YOLOE_plus-M.yaml +40 -0
  173. paddlex/configs/modules/object_detection/PP-YOLOE_plus-S.yaml +40 -0
  174. paddlex/configs/modules/object_detection/PP-YOLOE_plus-X.yaml +40 -0
  175. paddlex/configs/modules/object_detection/PicoDet-L.yaml +40 -0
  176. paddlex/configs/modules/object_detection/PicoDet-M.yaml +42 -0
  177. paddlex/configs/modules/object_detection/PicoDet-S.yaml +40 -0
  178. paddlex/configs/modules/object_detection/PicoDet-XS.yaml +42 -0
  179. paddlex/configs/modules/object_detection/RT-DETR-H.yaml +40 -0
  180. paddlex/configs/modules/object_detection/RT-DETR-L.yaml +40 -0
  181. paddlex/configs/modules/object_detection/RT-DETR-R18.yaml +40 -0
  182. paddlex/configs/modules/object_detection/RT-DETR-R50.yaml +40 -0
  183. paddlex/configs/modules/object_detection/RT-DETR-X.yaml +40 -0
  184. paddlex/configs/modules/object_detection/YOLOX-L.yaml +40 -0
  185. paddlex/configs/modules/object_detection/YOLOX-M.yaml +40 -0
  186. paddlex/configs/modules/object_detection/YOLOX-N.yaml +40 -0
  187. paddlex/configs/modules/object_detection/YOLOX-S.yaml +40 -0
  188. paddlex/configs/modules/object_detection/YOLOX-T.yaml +40 -0
  189. paddlex/configs/modules/object_detection/YOLOX-X.yaml +40 -0
  190. paddlex/configs/modules/object_detection/YOLOv3-DarkNet53.yaml +40 -0
  191. paddlex/configs/modules/object_detection/YOLOv3-MobileNetV3.yaml +40 -0
  192. paddlex/configs/modules/object_detection/YOLOv3-ResNet50_vd_DCN.yaml +40 -0
  193. paddlex/configs/modules/open_vocabulary_detection/GroundingDINO-T.yaml +13 -0
  194. paddlex/configs/modules/open_vocabulary_detection/YOLO-Worldv2-L.yaml +13 -0
  195. paddlex/configs/modules/open_vocabulary_segmentation/SAM-H_box.yaml +17 -0
  196. paddlex/configs/modules/open_vocabulary_segmentation/SAM-H_point.yaml +15 -0
  197. paddlex/configs/modules/pedestrian_attribute_recognition/PP-LCNet_x1_0_pedestrian_attribute.yaml +41 -0
  198. paddlex/configs/modules/rotated_object_detection/PP-YOLOE-R-L.yaml +40 -0
  199. paddlex/configs/modules/seal_text_detection/PP-OCRv4_mobile_seal_det.yaml +40 -0
  200. paddlex/configs/modules/seal_text_detection/PP-OCRv4_server_seal_det.yaml +40 -0
  201. paddlex/configs/modules/semantic_segmentation/Deeplabv3-R101.yaml +40 -0
  202. paddlex/configs/modules/semantic_segmentation/Deeplabv3-R50.yaml +40 -0
  203. paddlex/configs/modules/semantic_segmentation/Deeplabv3_Plus-R101.yaml +40 -0
  204. paddlex/configs/modules/semantic_segmentation/Deeplabv3_Plus-R50.yaml +40 -0
  205. paddlex/configs/modules/semantic_segmentation/MaskFormer_small.yaml +42 -0
  206. paddlex/configs/modules/semantic_segmentation/MaskFormer_tiny.yaml +42 -0
  207. paddlex/configs/modules/semantic_segmentation/OCRNet_HRNet-W18.yaml +40 -0
  208. paddlex/configs/modules/semantic_segmentation/OCRNet_HRNet-W48.yaml +40 -0
  209. paddlex/configs/modules/semantic_segmentation/PP-LiteSeg-B.yaml +41 -0
  210. paddlex/configs/modules/semantic_segmentation/PP-LiteSeg-T.yaml +40 -0
  211. paddlex/configs/modules/semantic_segmentation/SeaFormer_base.yaml +40 -0
  212. paddlex/configs/modules/semantic_segmentation/SeaFormer_large.yaml +40 -0
  213. paddlex/configs/modules/semantic_segmentation/SeaFormer_small.yaml +40 -0
  214. paddlex/configs/modules/semantic_segmentation/SeaFormer_tiny.yaml +40 -0
  215. paddlex/configs/modules/semantic_segmentation/SegFormer-B0.yaml +40 -0
  216. paddlex/configs/modules/semantic_segmentation/SegFormer-B1.yaml +40 -0
  217. paddlex/configs/modules/semantic_segmentation/SegFormer-B2.yaml +40 -0
  218. paddlex/configs/modules/semantic_segmentation/SegFormer-B3.yaml +40 -0
  219. paddlex/configs/modules/semantic_segmentation/SegFormer-B4.yaml +40 -0
  220. paddlex/configs/modules/semantic_segmentation/SegFormer-B5.yaml +40 -0
  221. paddlex/configs/modules/small_object_detection/PP-YOLOE_plus_SOD-L.yaml +42 -0
  222. paddlex/configs/modules/small_object_detection/PP-YOLOE_plus_SOD-S.yaml +42 -0
  223. paddlex/configs/modules/small_object_detection/PP-YOLOE_plus_SOD-largesize-L.yaml +42 -0
  224. paddlex/configs/modules/table_cells_detection/RT-DETR-L_wired_table_cell_det.yaml +40 -0
  225. paddlex/configs/modules/table_cells_detection/RT-DETR-L_wireless_table_cell_det.yaml +40 -0
  226. paddlex/configs/modules/table_classification/PP-LCNet_x1_0_table_cls.yaml +41 -0
  227. paddlex/configs/modules/table_structure_recognition/SLANeXt_wired.yaml +39 -0
  228. paddlex/configs/modules/table_structure_recognition/SLANeXt_wireless.yaml +39 -0
  229. paddlex/configs/modules/table_structure_recognition/SLANet.yaml +39 -0
  230. paddlex/configs/modules/table_structure_recognition/SLANet_plus.yaml +39 -0
  231. paddlex/configs/modules/text_detection/PP-OCRv3_mobile_det.yaml +40 -0
  232. paddlex/configs/modules/text_detection/PP-OCRv3_server_det.yaml +40 -0
  233. paddlex/configs/modules/text_detection/PP-OCRv4_mobile_det.yaml +40 -0
  234. paddlex/configs/modules/text_detection/PP-OCRv4_server_det.yaml +40 -0
  235. paddlex/configs/modules/text_detection/PP-OCRv5_mobile_det.yaml +40 -0
  236. paddlex/configs/modules/text_detection/PP-OCRv5_server_det.yaml +40 -0
  237. paddlex/configs/modules/text_recognition/PP-OCRv3_mobile_rec.yaml +39 -0
  238. paddlex/configs/modules/text_recognition/PP-OCRv4_mobile_rec.yaml +39 -0
  239. paddlex/configs/modules/text_recognition/PP-OCRv4_server_rec.yaml +39 -0
  240. paddlex/configs/modules/text_recognition/PP-OCRv4_server_rec_doc.yaml +39 -0
  241. paddlex/configs/modules/text_recognition/PP-OCRv5_mobile_rec.yaml +39 -0
  242. paddlex/configs/modules/text_recognition/PP-OCRv5_server_rec.yaml +39 -0
  243. paddlex/configs/modules/text_recognition/arabic_PP-OCRv3_mobile_rec.yaml +39 -0
  244. paddlex/configs/modules/text_recognition/ch_RepSVTR_rec.yaml +39 -0
  245. paddlex/configs/modules/text_recognition/ch_SVTRv2_rec.yaml +39 -0
  246. paddlex/configs/modules/text_recognition/chinese_cht_PP-OCRv3_mobile_rec.yaml +39 -0
  247. paddlex/configs/modules/text_recognition/cyrillic_PP-OCRv3_mobile_rec.yaml +39 -0
  248. paddlex/configs/modules/text_recognition/devanagari_PP-OCRv3_mobile_rec.yaml +39 -0
  249. paddlex/configs/modules/text_recognition/en_PP-OCRv3_mobile_rec.yaml +39 -0
  250. paddlex/configs/modules/text_recognition/en_PP-OCRv4_mobile_rec.yaml +39 -0
  251. paddlex/configs/modules/text_recognition/japan_PP-OCRv3_mobile_rec.yaml +39 -0
  252. paddlex/configs/modules/text_recognition/ka_PP-OCRv3_mobile_rec.yaml +39 -0
  253. paddlex/configs/modules/text_recognition/korean_PP-OCRv3_mobile_rec.yaml +39 -0
  254. paddlex/configs/modules/text_recognition/latin_PP-OCRv3_mobile_rec.yaml +39 -0
  255. paddlex/configs/modules/text_recognition/ta_PP-OCRv3_mobile_rec.yaml +39 -0
  256. paddlex/configs/modules/text_recognition/te_PP-OCRv3_mobile_rec.yaml +39 -0
  257. paddlex/configs/modules/textline_orientation/PP-LCNet_x0_25_textline_ori.yaml +41 -0
  258. paddlex/configs/modules/ts_anomaly_detection/AutoEncoder_ad.yaml +37 -0
  259. paddlex/configs/modules/ts_anomaly_detection/DLinear_ad.yaml +37 -0
  260. paddlex/configs/modules/ts_anomaly_detection/Nonstationary_ad.yaml +37 -0
  261. paddlex/configs/modules/ts_anomaly_detection/PatchTST_ad.yaml +37 -0
  262. paddlex/configs/modules/ts_anomaly_detection/TimesNet_ad.yaml +37 -0
  263. paddlex/configs/modules/ts_classification/TimesNet_cls.yaml +37 -0
  264. paddlex/configs/modules/ts_forecast/DLinear.yaml +38 -0
  265. paddlex/configs/modules/ts_forecast/NLinear.yaml +38 -0
  266. paddlex/configs/modules/ts_forecast/Nonstationary.yaml +38 -0
  267. paddlex/configs/modules/ts_forecast/PatchTST.yaml +38 -0
  268. paddlex/configs/modules/ts_forecast/RLinear.yaml +38 -0
  269. paddlex/configs/modules/ts_forecast/TiDE.yaml +38 -0
  270. paddlex/configs/modules/ts_forecast/TimesNet.yaml +38 -0
  271. paddlex/configs/modules/vehicle_attribute_recognition/PP-LCNet_x1_0_vehicle_attribute.yaml +41 -0
  272. paddlex/configs/modules/vehicle_detection/PP-YOLOE-L_vehicle.yaml +41 -0
  273. paddlex/configs/modules/vehicle_detection/PP-YOLOE-S_vehicle.yaml +42 -0
  274. paddlex/configs/modules/video_classification/PP-TSM-R50_8frames_uniform.yaml +42 -0
  275. paddlex/configs/modules/video_classification/PP-TSMv2-LCNetV2_16frames_uniform.yaml +42 -0
  276. paddlex/configs/modules/video_classification/PP-TSMv2-LCNetV2_8frames_uniform.yaml +42 -0
  277. paddlex/configs/modules/video_detection/YOWO.yaml +40 -0
  278. paddlex/configs/pipelines/3d_bev_detection.yaml +9 -0
  279. paddlex/configs/pipelines/OCR.yaml +45 -0
  280. paddlex/configs/pipelines/PP-ChatOCRv3-doc.yaml +151 -0
  281. paddlex/configs/pipelines/PP-ChatOCRv4-doc.yaml +237 -0
  282. paddlex/configs/pipelines/PP-ShiTuV2.yaml +18 -0
  283. paddlex/configs/pipelines/PP-StructureV3.yaml +226 -0
  284. paddlex/configs/pipelines/anomaly_detection.yaml +8 -0
  285. paddlex/configs/pipelines/doc_preprocessor.yaml +15 -0
  286. paddlex/configs/pipelines/doc_understanding.yaml +9 -0
  287. paddlex/configs/pipelines/face_recognition.yaml +18 -0
  288. paddlex/configs/pipelines/formula_recognition.yaml +39 -0
  289. paddlex/configs/pipelines/human_keypoint_detection.yaml +17 -0
  290. paddlex/configs/pipelines/image_classification.yaml +10 -0
  291. paddlex/configs/pipelines/image_multilabel_classification.yaml +9 -0
  292. paddlex/configs/pipelines/instance_segmentation.yaml +10 -0
  293. paddlex/configs/pipelines/layout_parsing.yaml +102 -0
  294. paddlex/configs/pipelines/multilingual_speech_recognition.yaml +9 -0
  295. paddlex/configs/pipelines/object_detection.yaml +10 -0
  296. paddlex/configs/pipelines/open_vocabulary_detection.yaml +12 -0
  297. paddlex/configs/pipelines/open_vocabulary_segmentation.yaml +13 -0
  298. paddlex/configs/pipelines/pedestrian_attribute_recognition.yaml +15 -0
  299. paddlex/configs/pipelines/rotated_object_detection.yaml +10 -0
  300. paddlex/configs/pipelines/seal_recognition.yaml +52 -0
  301. paddlex/configs/pipelines/semantic_segmentation.yaml +10 -0
  302. paddlex/configs/pipelines/small_object_detection.yaml +10 -0
  303. paddlex/configs/pipelines/table_recognition.yaml +57 -0
  304. paddlex/configs/pipelines/table_recognition_v2.yaml +82 -0
  305. paddlex/configs/pipelines/ts_anomaly_detection.yaml +8 -0
  306. paddlex/configs/pipelines/ts_classification.yaml +8 -0
  307. paddlex/configs/pipelines/ts_forecast.yaml +8 -0
  308. paddlex/configs/pipelines/vehicle_attribute_recognition.yaml +15 -0
  309. paddlex/configs/pipelines/video_classification.yaml +9 -0
  310. paddlex/configs/pipelines/video_detection.yaml +10 -0
  311. paddlex/constants.py +17 -0
  312. paddlex/engine.py +56 -0
  313. paddlex/hpip_links.html +31 -0
  314. paddlex/inference/__init__.py +19 -0
  315. paddlex/inference/common/__init__.py +13 -0
  316. paddlex/inference/common/batch_sampler/__init__.py +21 -0
  317. paddlex/inference/common/batch_sampler/audio_batch_sampler.py +83 -0
  318. paddlex/inference/common/batch_sampler/base_batch_sampler.py +94 -0
  319. paddlex/inference/common/batch_sampler/det_3d_batch_sampler.py +144 -0
  320. paddlex/inference/common/batch_sampler/doc_vlm_batch_sampler.py +87 -0
  321. paddlex/inference/common/batch_sampler/image_batch_sampler.py +121 -0
  322. paddlex/inference/common/batch_sampler/ts_batch_sampler.py +109 -0
  323. paddlex/inference/common/batch_sampler/video_batch_sampler.py +74 -0
  324. paddlex/inference/common/reader/__init__.py +19 -0
  325. paddlex/inference/common/reader/audio_reader.py +46 -0
  326. paddlex/inference/common/reader/det_3d_reader.py +241 -0
  327. paddlex/inference/common/reader/image_reader.py +73 -0
  328. paddlex/inference/common/reader/ts_reader.py +46 -0
  329. paddlex/inference/common/reader/video_reader.py +42 -0
  330. paddlex/inference/common/result/__init__.py +29 -0
  331. paddlex/inference/common/result/base_cv_result.py +41 -0
  332. paddlex/inference/common/result/base_result.py +72 -0
  333. paddlex/inference/common/result/base_ts_result.py +41 -0
  334. paddlex/inference/common/result/base_video_result.py +36 -0
  335. paddlex/inference/common/result/mixin.py +709 -0
  336. paddlex/inference/models/__init__.py +86 -0
  337. paddlex/inference/models/anomaly_detection/__init__.py +15 -0
  338. paddlex/inference/models/anomaly_detection/predictor.py +135 -0
  339. paddlex/inference/models/anomaly_detection/processors.py +53 -0
  340. paddlex/inference/models/anomaly_detection/result.py +71 -0
  341. paddlex/inference/models/base/__init__.py +15 -0
  342. paddlex/inference/models/base/predictor/__init__.py +15 -0
  343. paddlex/inference/models/base/predictor/base_predictor.py +414 -0
  344. paddlex/inference/models/common/__init__.py +26 -0
  345. paddlex/inference/models/common/static_infer.py +801 -0
  346. paddlex/inference/models/common/tokenizer/__init__.py +21 -0
  347. paddlex/inference/models/common/tokenizer/bert_tokenizer.py +655 -0
  348. paddlex/inference/models/common/tokenizer/clip_tokenizer.py +609 -0
  349. paddlex/inference/models/common/tokenizer/gpt_tokenizer.py +453 -0
  350. paddlex/inference/models/common/tokenizer/qwen2_5_tokenizer.py +112 -0
  351. paddlex/inference/models/common/tokenizer/qwen2_tokenizer.py +438 -0
  352. paddlex/inference/models/common/tokenizer/qwen_tokenizer.py +288 -0
  353. paddlex/inference/models/common/tokenizer/tokenizer_utils.py +2149 -0
  354. paddlex/inference/models/common/tokenizer/tokenizer_utils_base.py +3720 -0
  355. paddlex/inference/models/common/tokenizer/utils.py +66 -0
  356. paddlex/inference/models/common/tokenizer/vocab.py +647 -0
  357. paddlex/inference/models/common/ts/__init__.py +15 -0
  358. paddlex/inference/models/common/ts/funcs.py +540 -0
  359. paddlex/inference/models/common/ts/processors.py +322 -0
  360. paddlex/inference/models/common/vision/__init__.py +23 -0
  361. paddlex/inference/models/common/vision/funcs.py +98 -0
  362. paddlex/inference/models/common/vision/processors.py +285 -0
  363. paddlex/inference/models/common/vlm/__init__.py +13 -0
  364. paddlex/inference/models/common/vlm/activations.py +189 -0
  365. paddlex/inference/models/common/vlm/bert_padding.py +127 -0
  366. paddlex/inference/models/common/vlm/conversion_utils.py +99 -0
  367. paddlex/inference/models/common/vlm/distributed.py +229 -0
  368. paddlex/inference/models/common/vlm/flash_attn_utils.py +119 -0
  369. paddlex/inference/models/common/vlm/fusion_ops.py +205 -0
  370. paddlex/inference/models/common/vlm/generation/__init__.py +34 -0
  371. paddlex/inference/models/common/vlm/generation/configuration_utils.py +533 -0
  372. paddlex/inference/models/common/vlm/generation/logits_process.py +730 -0
  373. paddlex/inference/models/common/vlm/generation/stopping_criteria.py +106 -0
  374. paddlex/inference/models/common/vlm/generation/utils.py +2162 -0
  375. paddlex/inference/models/common/vlm/transformers/__init__.py +16 -0
  376. paddlex/inference/models/common/vlm/transformers/configuration_utils.py +1037 -0
  377. paddlex/inference/models/common/vlm/transformers/conversion_utils.py +408 -0
  378. paddlex/inference/models/common/vlm/transformers/model_outputs.py +1612 -0
  379. paddlex/inference/models/common/vlm/transformers/model_utils.py +2014 -0
  380. paddlex/inference/models/common/vlm/transformers/utils.py +178 -0
  381. paddlex/inference/models/common/vlm/utils.py +109 -0
  382. paddlex/inference/models/doc_vlm/__init__.py +15 -0
  383. paddlex/inference/models/doc_vlm/modeling/GOT_ocr_2_0.py +830 -0
  384. paddlex/inference/models/doc_vlm/modeling/__init__.py +17 -0
  385. paddlex/inference/models/doc_vlm/modeling/qwen2.py +1606 -0
  386. paddlex/inference/models/doc_vlm/modeling/qwen2_5_vl.py +3006 -0
  387. paddlex/inference/models/doc_vlm/modeling/qwen2_vl.py +2495 -0
  388. paddlex/inference/models/doc_vlm/predictor.py +253 -0
  389. paddlex/inference/models/doc_vlm/processors/GOT_ocr_2_0.py +97 -0
  390. paddlex/inference/models/doc_vlm/processors/__init__.py +17 -0
  391. paddlex/inference/models/doc_vlm/processors/common.py +561 -0
  392. paddlex/inference/models/doc_vlm/processors/qwen2_5_vl.py +548 -0
  393. paddlex/inference/models/doc_vlm/processors/qwen2_vl.py +543 -0
  394. paddlex/inference/models/doc_vlm/result.py +21 -0
  395. paddlex/inference/models/face_feature/__init__.py +15 -0
  396. paddlex/inference/models/face_feature/predictor.py +66 -0
  397. paddlex/inference/models/formula_recognition/__init__.py +15 -0
  398. paddlex/inference/models/formula_recognition/predictor.py +193 -0
  399. paddlex/inference/models/formula_recognition/processors.py +1015 -0
  400. paddlex/inference/models/formula_recognition/result.py +411 -0
  401. paddlex/inference/models/image_classification/__init__.py +15 -0
  402. paddlex/inference/models/image_classification/predictor.py +172 -0
  403. paddlex/inference/models/image_classification/processors.py +89 -0
  404. paddlex/inference/models/image_classification/result.py +93 -0
  405. paddlex/inference/models/image_feature/__init__.py +15 -0
  406. paddlex/inference/models/image_feature/predictor.py +146 -0
  407. paddlex/inference/models/image_feature/processors.py +31 -0
  408. paddlex/inference/models/image_feature/result.py +32 -0
  409. paddlex/inference/models/image_multilabel_classification/__init__.py +15 -0
  410. paddlex/inference/models/image_multilabel_classification/predictor.py +95 -0
  411. paddlex/inference/models/image_multilabel_classification/processors.py +89 -0
  412. paddlex/inference/models/image_multilabel_classification/result.py +96 -0
  413. paddlex/inference/models/image_unwarping/__init__.py +15 -0
  414. paddlex/inference/models/image_unwarping/predictor.py +97 -0
  415. paddlex/inference/models/image_unwarping/processors.py +92 -0
  416. paddlex/inference/models/image_unwarping/result.py +47 -0
  417. paddlex/inference/models/instance_segmentation/__init__.py +15 -0
  418. paddlex/inference/models/instance_segmentation/predictor.py +202 -0
  419. paddlex/inference/models/instance_segmentation/processors.py +102 -0
  420. paddlex/inference/models/instance_segmentation/result.py +162 -0
  421. paddlex/inference/models/keypoint_detection/__init__.py +15 -0
  422. paddlex/inference/models/keypoint_detection/predictor.py +190 -0
  423. paddlex/inference/models/keypoint_detection/processors.py +367 -0
  424. paddlex/inference/models/keypoint_detection/result.py +197 -0
  425. paddlex/inference/models/m_3d_bev_detection/__init__.py +15 -0
  426. paddlex/inference/models/m_3d_bev_detection/predictor.py +303 -0
  427. paddlex/inference/models/m_3d_bev_detection/processors.py +990 -0
  428. paddlex/inference/models/m_3d_bev_detection/result.py +68 -0
  429. paddlex/inference/models/m_3d_bev_detection/visualizer_3d.py +169 -0
  430. paddlex/inference/models/multilingual_speech_recognition/__init__.py +15 -0
  431. paddlex/inference/models/multilingual_speech_recognition/predictor.py +137 -0
  432. paddlex/inference/models/multilingual_speech_recognition/processors.py +1933 -0
  433. paddlex/inference/models/multilingual_speech_recognition/result.py +21 -0
  434. paddlex/inference/models/object_detection/__init__.py +15 -0
  435. paddlex/inference/models/object_detection/predictor.py +344 -0
  436. paddlex/inference/models/object_detection/processors.py +885 -0
  437. paddlex/inference/models/object_detection/result.py +114 -0
  438. paddlex/inference/models/object_detection/utils.py +70 -0
  439. paddlex/inference/models/open_vocabulary_detection/__init__.py +15 -0
  440. paddlex/inference/models/open_vocabulary_detection/predictor.py +172 -0
  441. paddlex/inference/models/open_vocabulary_detection/processors/__init__.py +16 -0
  442. paddlex/inference/models/open_vocabulary_detection/processors/common.py +114 -0
  443. paddlex/inference/models/open_vocabulary_detection/processors/groundingdino_processors.py +496 -0
  444. paddlex/inference/models/open_vocabulary_detection/processors/yoloworld_processors.py +209 -0
  445. paddlex/inference/models/open_vocabulary_segmentation/__init__.py +15 -0
  446. paddlex/inference/models/open_vocabulary_segmentation/predictor.py +113 -0
  447. paddlex/inference/models/open_vocabulary_segmentation/processors/__init__.py +15 -0
  448. paddlex/inference/models/open_vocabulary_segmentation/processors/sam_processer.py +249 -0
  449. paddlex/inference/models/open_vocabulary_segmentation/results/__init__.py +15 -0
  450. paddlex/inference/models/open_vocabulary_segmentation/results/sam_result.py +149 -0
  451. paddlex/inference/models/semantic_segmentation/__init__.py +15 -0
  452. paddlex/inference/models/semantic_segmentation/predictor.py +158 -0
  453. paddlex/inference/models/semantic_segmentation/processors.py +117 -0
  454. paddlex/inference/models/semantic_segmentation/result.py +73 -0
  455. paddlex/inference/models/table_structure_recognition/__init__.py +15 -0
  456. paddlex/inference/models/table_structure_recognition/predictor.py +161 -0
  457. paddlex/inference/models/table_structure_recognition/processors.py +229 -0
  458. paddlex/inference/models/table_structure_recognition/result.py +63 -0
  459. paddlex/inference/models/text_detection/__init__.py +15 -0
  460. paddlex/inference/models/text_detection/predictor.py +191 -0
  461. paddlex/inference/models/text_detection/processors.py +538 -0
  462. paddlex/inference/models/text_detection/result.py +46 -0
  463. paddlex/inference/models/text_recognition/__init__.py +15 -0
  464. paddlex/inference/models/text_recognition/predictor.py +98 -0
  465. paddlex/inference/models/text_recognition/processors.py +245 -0
  466. paddlex/inference/models/text_recognition/result.py +76 -0
  467. paddlex/inference/models/ts_anomaly_detection/__init__.py +15 -0
  468. paddlex/inference/models/ts_anomaly_detection/predictor.py +141 -0
  469. paddlex/inference/models/ts_anomaly_detection/processors.py +98 -0
  470. paddlex/inference/models/ts_anomaly_detection/result.py +83 -0
  471. paddlex/inference/models/ts_classification/__init__.py +15 -0
  472. paddlex/inference/models/ts_classification/predictor.py +122 -0
  473. paddlex/inference/models/ts_classification/processors.py +122 -0
  474. paddlex/inference/models/ts_classification/result.py +87 -0
  475. paddlex/inference/models/ts_forecasting/__init__.py +15 -0
  476. paddlex/inference/models/ts_forecasting/predictor.py +154 -0
  477. paddlex/inference/models/ts_forecasting/processors.py +158 -0
  478. paddlex/inference/models/ts_forecasting/result.py +96 -0
  479. paddlex/inference/models/video_classification/__init__.py +15 -0
  480. paddlex/inference/models/video_classification/predictor.py +141 -0
  481. paddlex/inference/models/video_classification/processors.py +409 -0
  482. paddlex/inference/models/video_classification/result.py +96 -0
  483. paddlex/inference/models/video_detection/__init__.py +15 -0
  484. paddlex/inference/models/video_detection/predictor.py +129 -0
  485. paddlex/inference/models/video_detection/processors.py +463 -0
  486. paddlex/inference/models/video_detection/result.py +109 -0
  487. paddlex/inference/pipelines/__init__.py +239 -0
  488. paddlex/inference/pipelines/_parallel.py +172 -0
  489. paddlex/inference/pipelines/anomaly_detection/__init__.py +15 -0
  490. paddlex/inference/pipelines/anomaly_detection/pipeline.py +82 -0
  491. paddlex/inference/pipelines/attribute_recognition/__init__.py +15 -0
  492. paddlex/inference/pipelines/attribute_recognition/pipeline.py +120 -0
  493. paddlex/inference/pipelines/attribute_recognition/result.py +102 -0
  494. paddlex/inference/pipelines/base.py +156 -0
  495. paddlex/inference/pipelines/components/__init__.py +29 -0
  496. paddlex/inference/pipelines/components/chat_server/__init__.py +16 -0
  497. paddlex/inference/pipelines/components/chat_server/base.py +39 -0
  498. paddlex/inference/pipelines/components/chat_server/openai_bot_chat.py +236 -0
  499. paddlex/inference/pipelines/components/common/__init__.py +19 -0
  500. paddlex/inference/pipelines/components/common/base_operator.py +37 -0
  501. paddlex/inference/pipelines/components/common/base_result.py +66 -0
  502. paddlex/inference/pipelines/components/common/convert_points_and_boxes.py +45 -0
  503. paddlex/inference/pipelines/components/common/crop_image_regions.py +556 -0
  504. paddlex/inference/pipelines/components/common/seal_det_warp.py +972 -0
  505. paddlex/inference/pipelines/components/common/sort_boxes.py +85 -0
  506. paddlex/inference/pipelines/components/common/warp_image.py +50 -0
  507. paddlex/inference/pipelines/components/faisser.py +357 -0
  508. paddlex/inference/pipelines/components/prompt_engineering/__init__.py +16 -0
  509. paddlex/inference/pipelines/components/prompt_engineering/base.py +35 -0
  510. paddlex/inference/pipelines/components/prompt_engineering/generate_ensemble_prompt.py +128 -0
  511. paddlex/inference/pipelines/components/prompt_engineering/generate_kie_prompt.py +148 -0
  512. paddlex/inference/pipelines/components/retriever/__init__.py +16 -0
  513. paddlex/inference/pipelines/components/retriever/base.py +228 -0
  514. paddlex/inference/pipelines/components/retriever/openai_bot_retriever.py +70 -0
  515. paddlex/inference/pipelines/components/retriever/qianfan_bot_retriever.py +166 -0
  516. paddlex/inference/pipelines/components/utils/__init__.py +13 -0
  517. paddlex/inference/pipelines/components/utils/mixin.py +206 -0
  518. paddlex/inference/pipelines/doc_preprocessor/__init__.py +15 -0
  519. paddlex/inference/pipelines/doc_preprocessor/pipeline.py +209 -0
  520. paddlex/inference/pipelines/doc_preprocessor/result.py +98 -0
  521. paddlex/inference/pipelines/doc_understanding/__init__.py +15 -0
  522. paddlex/inference/pipelines/doc_understanding/pipeline.py +71 -0
  523. paddlex/inference/pipelines/face_recognition/__init__.py +15 -0
  524. paddlex/inference/pipelines/face_recognition/pipeline.py +63 -0
  525. paddlex/inference/pipelines/face_recognition/result.py +44 -0
  526. paddlex/inference/pipelines/formula_recognition/__init__.py +15 -0
  527. paddlex/inference/pipelines/formula_recognition/pipeline.py +347 -0
  528. paddlex/inference/pipelines/formula_recognition/result.py +282 -0
  529. paddlex/inference/pipelines/image_classification/__init__.py +15 -0
  530. paddlex/inference/pipelines/image_classification/pipeline.py +90 -0
  531. paddlex/inference/pipelines/image_multilabel_classification/__init__.py +15 -0
  532. paddlex/inference/pipelines/image_multilabel_classification/pipeline.py +97 -0
  533. paddlex/inference/pipelines/instance_segmentation/__init__.py +15 -0
  534. paddlex/inference/pipelines/instance_segmentation/pipeline.py +91 -0
  535. paddlex/inference/pipelines/keypoint_detection/__init__.py +15 -0
  536. paddlex/inference/pipelines/keypoint_detection/pipeline.py +158 -0
  537. paddlex/inference/pipelines/layout_parsing/__init__.py +16 -0
  538. paddlex/inference/pipelines/layout_parsing/pipeline.py +568 -0
  539. paddlex/inference/pipelines/layout_parsing/pipeline_v2.py +1382 -0
  540. paddlex/inference/pipelines/layout_parsing/result.py +191 -0
  541. paddlex/inference/pipelines/layout_parsing/result_v2.py +745 -0
  542. paddlex/inference/pipelines/layout_parsing/setting.py +87 -0
  543. paddlex/inference/pipelines/layout_parsing/utils.py +951 -0
  544. paddlex/inference/pipelines/layout_parsing/xycut_enhanced/__init__.py +16 -0
  545. paddlex/inference/pipelines/layout_parsing/xycut_enhanced/utils.py +1143 -0
  546. paddlex/inference/pipelines/layout_parsing/xycut_enhanced/xycuts.py +562 -0
  547. paddlex/inference/pipelines/m_3d_bev_detection/__init__.py +15 -0
  548. paddlex/inference/pipelines/m_3d_bev_detection/pipeline.py +74 -0
  549. paddlex/inference/pipelines/multilingual_speech_recognition/__init__.py +15 -0
  550. paddlex/inference/pipelines/multilingual_speech_recognition/pipeline.py +78 -0
  551. paddlex/inference/pipelines/object_detection/__init__.py +15 -0
  552. paddlex/inference/pipelines/object_detection/pipeline.py +115 -0
  553. paddlex/inference/pipelines/ocr/__init__.py +15 -0
  554. paddlex/inference/pipelines/ocr/pipeline.py +463 -0
  555. paddlex/inference/pipelines/ocr/result.py +255 -0
  556. paddlex/inference/pipelines/open_vocabulary_detection/__init__.py +15 -0
  557. paddlex/inference/pipelines/open_vocabulary_detection/pipeline.py +86 -0
  558. paddlex/inference/pipelines/open_vocabulary_segmentation/__init__.py +15 -0
  559. paddlex/inference/pipelines/open_vocabulary_segmentation/pipeline.py +100 -0
  560. paddlex/inference/pipelines/pp_chatocr/__init__.py +16 -0
  561. paddlex/inference/pipelines/pp_chatocr/pipeline_base.py +111 -0
  562. paddlex/inference/pipelines/pp_chatocr/pipeline_v3.py +781 -0
  563. paddlex/inference/pipelines/pp_chatocr/pipeline_v4.py +992 -0
  564. paddlex/inference/pipelines/pp_shitu_v2/__init__.py +15 -0
  565. paddlex/inference/pipelines/pp_shitu_v2/pipeline.py +156 -0
  566. paddlex/inference/pipelines/pp_shitu_v2/result.py +126 -0
  567. paddlex/inference/pipelines/rotated_object_detection/__init__.py +15 -0
  568. paddlex/inference/pipelines/rotated_object_detection/pipeline.py +95 -0
  569. paddlex/inference/pipelines/seal_recognition/__init__.py +15 -0
  570. paddlex/inference/pipelines/seal_recognition/pipeline.py +335 -0
  571. paddlex/inference/pipelines/seal_recognition/result.py +89 -0
  572. paddlex/inference/pipelines/semantic_segmentation/__init__.py +15 -0
  573. paddlex/inference/pipelines/semantic_segmentation/pipeline.py +95 -0
  574. paddlex/inference/pipelines/small_object_detection/__init__.py +15 -0
  575. paddlex/inference/pipelines/small_object_detection/pipeline.py +95 -0
  576. paddlex/inference/pipelines/table_recognition/__init__.py +16 -0
  577. paddlex/inference/pipelines/table_recognition/pipeline.py +486 -0
  578. paddlex/inference/pipelines/table_recognition/pipeline_v2.py +1395 -0
  579. paddlex/inference/pipelines/table_recognition/result.py +218 -0
  580. paddlex/inference/pipelines/table_recognition/table_recognition_post_processing.py +366 -0
  581. paddlex/inference/pipelines/table_recognition/table_recognition_post_processing_v2.py +488 -0
  582. paddlex/inference/pipelines/table_recognition/utils.py +44 -0
  583. paddlex/inference/pipelines/ts_anomaly_detection/__init__.py +15 -0
  584. paddlex/inference/pipelines/ts_anomaly_detection/pipeline.py +72 -0
  585. paddlex/inference/pipelines/ts_classification/__init__.py +15 -0
  586. paddlex/inference/pipelines/ts_classification/pipeline.py +72 -0
  587. paddlex/inference/pipelines/ts_forecasting/__init__.py +15 -0
  588. paddlex/inference/pipelines/ts_forecasting/pipeline.py +72 -0
  589. paddlex/inference/pipelines/video_classification/__init__.py +15 -0
  590. paddlex/inference/pipelines/video_classification/pipeline.py +79 -0
  591. paddlex/inference/pipelines/video_detection/__init__.py +15 -0
  592. paddlex/inference/pipelines/video_detection/pipeline.py +86 -0
  593. paddlex/inference/serving/__init__.py +17 -0
  594. paddlex/inference/serving/basic_serving/__init__.py +18 -0
  595. paddlex/inference/serving/basic_serving/_app.py +221 -0
  596. paddlex/inference/serving/basic_serving/_pipeline_apps/__init__.py +44 -0
  597. paddlex/inference/serving/basic_serving/_pipeline_apps/_common/__init__.py +13 -0
  598. paddlex/inference/serving/basic_serving/_pipeline_apps/_common/common.py +104 -0
  599. paddlex/inference/serving/basic_serving/_pipeline_apps/_common/image_recognition.py +36 -0
  600. paddlex/inference/serving/basic_serving/_pipeline_apps/_common/ocr.py +95 -0
  601. paddlex/inference/serving/basic_serving/_pipeline_apps/anomaly_detection.py +67 -0
  602. paddlex/inference/serving/basic_serving/_pipeline_apps/doc_preprocessor.py +100 -0
  603. paddlex/inference/serving/basic_serving/_pipeline_apps/doc_understanding.py +153 -0
  604. paddlex/inference/serving/basic_serving/_pipeline_apps/face_recognition.py +226 -0
  605. paddlex/inference/serving/basic_serving/_pipeline_apps/formula_recognition.py +100 -0
  606. paddlex/inference/serving/basic_serving/_pipeline_apps/human_keypoint_detection.py +81 -0
  607. paddlex/inference/serving/basic_serving/_pipeline_apps/image_classification.py +69 -0
  608. paddlex/inference/serving/basic_serving/_pipeline_apps/image_multilabel_classification.py +73 -0
  609. paddlex/inference/serving/basic_serving/_pipeline_apps/instance_segmentation.py +87 -0
  610. paddlex/inference/serving/basic_serving/_pipeline_apps/layout_parsing.py +117 -0
  611. paddlex/inference/serving/basic_serving/_pipeline_apps/m_3d_bev_detection.py +79 -0
  612. paddlex/inference/serving/basic_serving/_pipeline_apps/multilingual_speech_recognition.py +92 -0
  613. paddlex/inference/serving/basic_serving/_pipeline_apps/object_detection.py +77 -0
  614. paddlex/inference/serving/basic_serving/_pipeline_apps/ocr.py +102 -0
  615. paddlex/inference/serving/basic_serving/_pipeline_apps/open_vocabulary_detection.py +81 -0
  616. paddlex/inference/serving/basic_serving/_pipeline_apps/open_vocabulary_segmentation.py +91 -0
  617. paddlex/inference/serving/basic_serving/_pipeline_apps/pedestrian_attribute_recognition.py +84 -0
  618. paddlex/inference/serving/basic_serving/_pipeline_apps/pp_chatocrv3_doc.py +193 -0
  619. paddlex/inference/serving/basic_serving/_pipeline_apps/pp_chatocrv4_doc.py +223 -0
  620. paddlex/inference/serving/basic_serving/_pipeline_apps/pp_shituv2.py +221 -0
  621. paddlex/inference/serving/basic_serving/_pipeline_apps/pp_structurev3.py +143 -0
  622. paddlex/inference/serving/basic_serving/_pipeline_apps/rotated_object_detection.py +81 -0
  623. paddlex/inference/serving/basic_serving/_pipeline_apps/seal_recognition.py +106 -0
  624. paddlex/inference/serving/basic_serving/_pipeline_apps/semantic_segmentation.py +67 -0
  625. paddlex/inference/serving/basic_serving/_pipeline_apps/small_object_detection.py +72 -0
  626. paddlex/inference/serving/basic_serving/_pipeline_apps/table_recognition.py +108 -0
  627. paddlex/inference/serving/basic_serving/_pipeline_apps/table_recognition_v2.py +113 -0
  628. paddlex/inference/serving/basic_serving/_pipeline_apps/ts_anomaly_detection.py +65 -0
  629. paddlex/inference/serving/basic_serving/_pipeline_apps/ts_classification.py +64 -0
  630. paddlex/inference/serving/basic_serving/_pipeline_apps/ts_forecast.py +65 -0
  631. paddlex/inference/serving/basic_serving/_pipeline_apps/vehicle_attribute_recognition.py +84 -0
  632. paddlex/inference/serving/basic_serving/_pipeline_apps/video_classification.py +76 -0
  633. paddlex/inference/serving/basic_serving/_pipeline_apps/video_detection.py +92 -0
  634. paddlex/inference/serving/basic_serving/_server.py +40 -0
  635. paddlex/inference/serving/infra/__init__.py +13 -0
  636. paddlex/inference/serving/infra/config.py +36 -0
  637. paddlex/inference/serving/infra/models.py +79 -0
  638. paddlex/inference/serving/infra/storage.py +180 -0
  639. paddlex/inference/serving/infra/utils.py +285 -0
  640. paddlex/inference/serving/schemas/__init__.py +13 -0
  641. paddlex/inference/serving/schemas/anomaly_detection.py +39 -0
  642. paddlex/inference/serving/schemas/doc_preprocessor.py +54 -0
  643. paddlex/inference/serving/schemas/doc_understanding.py +78 -0
  644. paddlex/inference/serving/schemas/face_recognition.py +124 -0
  645. paddlex/inference/serving/schemas/formula_recognition.py +56 -0
  646. paddlex/inference/serving/schemas/human_keypoint_detection.py +55 -0
  647. paddlex/inference/serving/schemas/image_classification.py +45 -0
  648. paddlex/inference/serving/schemas/image_multilabel_classification.py +47 -0
  649. paddlex/inference/serving/schemas/instance_segmentation.py +53 -0
  650. paddlex/inference/serving/schemas/layout_parsing.py +71 -0
  651. paddlex/inference/serving/schemas/m_3d_bev_detection.py +48 -0
  652. paddlex/inference/serving/schemas/multilingual_speech_recognition.py +57 -0
  653. paddlex/inference/serving/schemas/object_detection.py +52 -0
  654. paddlex/inference/serving/schemas/ocr.py +60 -0
  655. paddlex/inference/serving/schemas/open_vocabulary_detection.py +52 -0
  656. paddlex/inference/serving/schemas/open_vocabulary_segmentation.py +52 -0
  657. paddlex/inference/serving/schemas/pedestrian_attribute_recognition.py +61 -0
  658. paddlex/inference/serving/schemas/pp_chatocrv3_doc.py +133 -0
  659. paddlex/inference/serving/schemas/pp_chatocrv4_doc.py +150 -0
  660. paddlex/inference/serving/schemas/pp_shituv2.py +124 -0
  661. paddlex/inference/serving/schemas/pp_structurev3.py +88 -0
  662. paddlex/inference/serving/schemas/rotated_object_detection.py +52 -0
  663. paddlex/inference/serving/schemas/seal_recognition.py +62 -0
  664. paddlex/inference/serving/schemas/semantic_segmentation.py +45 -0
  665. paddlex/inference/serving/schemas/shared/__init__.py +13 -0
  666. paddlex/inference/serving/schemas/shared/classification.py +23 -0
  667. paddlex/inference/serving/schemas/shared/image_segmentation.py +28 -0
  668. paddlex/inference/serving/schemas/shared/object_detection.py +24 -0
  669. paddlex/inference/serving/schemas/shared/ocr.py +25 -0
  670. paddlex/inference/serving/schemas/small_object_detection.py +52 -0
  671. paddlex/inference/serving/schemas/table_recognition.py +64 -0
  672. paddlex/inference/serving/schemas/table_recognition_v2.py +69 -0
  673. paddlex/inference/serving/schemas/ts_anomaly_detection.py +37 -0
  674. paddlex/inference/serving/schemas/ts_classification.py +38 -0
  675. paddlex/inference/serving/schemas/ts_forecast.py +37 -0
  676. paddlex/inference/serving/schemas/vehicle_attribute_recognition.py +61 -0
  677. paddlex/inference/serving/schemas/video_classification.py +44 -0
  678. paddlex/inference/serving/schemas/video_detection.py +56 -0
  679. paddlex/inference/utils/__init__.py +13 -0
  680. paddlex/inference/utils/benchmark.py +379 -0
  681. paddlex/inference/utils/color_map.py +123 -0
  682. paddlex/inference/utils/get_pipeline_path.py +27 -0
  683. paddlex/inference/utils/hpi.py +254 -0
  684. paddlex/inference/utils/hpi_model_info_collection.json +2331 -0
  685. paddlex/inference/utils/io/__init__.py +36 -0
  686. paddlex/inference/utils/io/readers.py +504 -0
  687. paddlex/inference/utils/io/style.py +381 -0
  688. paddlex/inference/utils/io/tablepyxl.py +157 -0
  689. paddlex/inference/utils/io/writers.py +458 -0
  690. paddlex/inference/utils/model_paths.py +48 -0
  691. paddlex/inference/utils/new_ir_blocklist.py +27 -0
  692. paddlex/inference/utils/official_models.py +367 -0
  693. paddlex/inference/utils/pp_option.py +339 -0
  694. paddlex/inference/utils/trt_blocklist.py +43 -0
  695. paddlex/inference/utils/trt_config.py +420 -0
  696. paddlex/model.py +131 -0
  697. paddlex/modules/__init__.py +115 -0
  698. paddlex/modules/anomaly_detection/__init__.py +18 -0
  699. paddlex/modules/anomaly_detection/dataset_checker/__init__.py +94 -0
  700. paddlex/modules/anomaly_detection/dataset_checker/dataset_src/__init__.py +19 -0
  701. paddlex/modules/anomaly_detection/dataset_checker/dataset_src/analyse_dataset.py +82 -0
  702. paddlex/modules/anomaly_detection/dataset_checker/dataset_src/check_dataset.py +91 -0
  703. paddlex/modules/anomaly_detection/dataset_checker/dataset_src/convert_dataset.py +233 -0
  704. paddlex/modules/anomaly_detection/dataset_checker/dataset_src/split_dataset.py +87 -0
  705. paddlex/modules/anomaly_detection/dataset_checker/dataset_src/utils/__init__.py +13 -0
  706. paddlex/modules/anomaly_detection/dataset_checker/dataset_src/utils/visualizer.py +76 -0
  707. paddlex/modules/anomaly_detection/evaluator.py +58 -0
  708. paddlex/modules/anomaly_detection/exportor.py +22 -0
  709. paddlex/modules/anomaly_detection/model_list.py +16 -0
  710. paddlex/modules/anomaly_detection/trainer.py +70 -0
  711. paddlex/modules/base/__init__.py +18 -0
  712. paddlex/modules/base/build_model.py +33 -0
  713. paddlex/modules/base/dataset_checker/__init__.py +16 -0
  714. paddlex/modules/base/dataset_checker/dataset_checker.py +169 -0
  715. paddlex/modules/base/dataset_checker/utils.py +108 -0
  716. paddlex/modules/base/evaluator.py +170 -0
  717. paddlex/modules/base/exportor.py +145 -0
  718. paddlex/modules/base/trainer.py +144 -0
  719. paddlex/modules/base/utils/__init__.py +13 -0
  720. paddlex/modules/base/utils/cinn_setting.py +89 -0
  721. paddlex/modules/base/utils/coco_eval.py +94 -0
  722. paddlex/modules/base/utils/topk_eval.py +118 -0
  723. paddlex/modules/doc_vlm/__init__.py +18 -0
  724. paddlex/modules/doc_vlm/dataset_checker.py +29 -0
  725. paddlex/modules/doc_vlm/evaluator.py +29 -0
  726. paddlex/modules/doc_vlm/exportor.py +29 -0
  727. paddlex/modules/doc_vlm/model_list.py +16 -0
  728. paddlex/modules/doc_vlm/trainer.py +41 -0
  729. paddlex/modules/face_recognition/__init__.py +18 -0
  730. paddlex/modules/face_recognition/dataset_checker/__init__.py +71 -0
  731. paddlex/modules/face_recognition/dataset_checker/dataset_src/__init__.py +16 -0
  732. paddlex/modules/face_recognition/dataset_checker/dataset_src/check_dataset.py +172 -0
  733. paddlex/modules/face_recognition/dataset_checker/dataset_src/utils/__init__.py +13 -0
  734. paddlex/modules/face_recognition/dataset_checker/dataset_src/utils/visualizer.py +153 -0
  735. paddlex/modules/face_recognition/evaluator.py +52 -0
  736. paddlex/modules/face_recognition/exportor.py +22 -0
  737. paddlex/modules/face_recognition/model_list.py +15 -0
  738. paddlex/modules/face_recognition/trainer.py +75 -0
  739. paddlex/modules/formula_recognition/__init__.py +18 -0
  740. paddlex/modules/formula_recognition/dataset_checker/__init__.py +113 -0
  741. paddlex/modules/formula_recognition/dataset_checker/dataset_src/__init__.py +19 -0
  742. paddlex/modules/formula_recognition/dataset_checker/dataset_src/analyse_dataset.py +158 -0
  743. paddlex/modules/formula_recognition/dataset_checker/dataset_src/check_dataset.py +76 -0
  744. paddlex/modules/formula_recognition/dataset_checker/dataset_src/convert_dataset.py +95 -0
  745. paddlex/modules/formula_recognition/dataset_checker/dataset_src/split_dataset.py +80 -0
  746. paddlex/modules/formula_recognition/evaluator.py +80 -0
  747. paddlex/modules/formula_recognition/exportor.py +22 -0
  748. paddlex/modules/formula_recognition/model_list.py +23 -0
  749. paddlex/modules/formula_recognition/trainer.py +123 -0
  750. paddlex/modules/general_recognition/__init__.py +18 -0
  751. paddlex/modules/general_recognition/dataset_checker/__init__.py +107 -0
  752. paddlex/modules/general_recognition/dataset_checker/dataset_src/__init__.py +19 -0
  753. paddlex/modules/general_recognition/dataset_checker/dataset_src/analyse_dataset.py +96 -0
  754. paddlex/modules/general_recognition/dataset_checker/dataset_src/check_dataset.py +99 -0
  755. paddlex/modules/general_recognition/dataset_checker/dataset_src/convert_dataset.py +100 -0
  756. paddlex/modules/general_recognition/dataset_checker/dataset_src/split_dataset.py +82 -0
  757. paddlex/modules/general_recognition/dataset_checker/dataset_src/utils/__init__.py +13 -0
  758. paddlex/modules/general_recognition/dataset_checker/dataset_src/utils/visualizer.py +147 -0
  759. paddlex/modules/general_recognition/evaluator.py +31 -0
  760. paddlex/modules/general_recognition/exportor.py +22 -0
  761. paddlex/modules/general_recognition/model_list.py +19 -0
  762. paddlex/modules/general_recognition/trainer.py +52 -0
  763. paddlex/modules/image_classification/__init__.py +18 -0
  764. paddlex/modules/image_classification/dataset_checker/__init__.py +104 -0
  765. paddlex/modules/image_classification/dataset_checker/dataset_src/__init__.py +19 -0
  766. paddlex/modules/image_classification/dataset_checker/dataset_src/analyse_dataset.py +92 -0
  767. paddlex/modules/image_classification/dataset_checker/dataset_src/check_dataset.py +132 -0
  768. paddlex/modules/image_classification/dataset_checker/dataset_src/convert_dataset.py +51 -0
  769. paddlex/modules/image_classification/dataset_checker/dataset_src/split_dataset.py +81 -0
  770. paddlex/modules/image_classification/dataset_checker/dataset_src/utils/__init__.py +13 -0
  771. paddlex/modules/image_classification/dataset_checker/dataset_src/utils/visualizer.py +153 -0
  772. paddlex/modules/image_classification/evaluator.py +43 -0
  773. paddlex/modules/image_classification/exportor.py +22 -0
  774. paddlex/modules/image_classification/model_list.py +99 -0
  775. paddlex/modules/image_classification/trainer.py +82 -0
  776. paddlex/modules/image_unwarping/__init__.py +13 -0
  777. paddlex/modules/image_unwarping/model_list.py +17 -0
  778. paddlex/modules/instance_segmentation/__init__.py +18 -0
  779. paddlex/modules/instance_segmentation/dataset_checker/__init__.py +107 -0
  780. paddlex/modules/instance_segmentation/dataset_checker/dataset_src/__init__.py +19 -0
  781. paddlex/modules/instance_segmentation/dataset_checker/dataset_src/analyse_dataset.py +82 -0
  782. paddlex/modules/instance_segmentation/dataset_checker/dataset_src/check_dataset.py +95 -0
  783. paddlex/modules/instance_segmentation/dataset_checker/dataset_src/convert_dataset.py +241 -0
  784. paddlex/modules/instance_segmentation/dataset_checker/dataset_src/split_dataset.py +122 -0
  785. paddlex/modules/instance_segmentation/dataset_checker/dataset_src/utils/__init__.py +13 -0
  786. paddlex/modules/instance_segmentation/dataset_checker/dataset_src/utils/visualizer.py +223 -0
  787. paddlex/modules/instance_segmentation/evaluator.py +32 -0
  788. paddlex/modules/instance_segmentation/exportor.py +22 -0
  789. paddlex/modules/instance_segmentation/model_list.py +33 -0
  790. paddlex/modules/instance_segmentation/trainer.py +31 -0
  791. paddlex/modules/keypoint_detection/__init__.py +18 -0
  792. paddlex/modules/keypoint_detection/dataset_checker/__init__.py +56 -0
  793. paddlex/modules/keypoint_detection/dataset_checker/dataset_src/__init__.py +15 -0
  794. paddlex/modules/keypoint_detection/dataset_checker/dataset_src/check_dataset.py +91 -0
  795. paddlex/modules/keypoint_detection/dataset_checker/dataset_src/utils/__init__.py +13 -0
  796. paddlex/modules/keypoint_detection/dataset_checker/dataset_src/utils/visualizer.py +124 -0
  797. paddlex/modules/keypoint_detection/evaluator.py +41 -0
  798. paddlex/modules/keypoint_detection/exportor.py +22 -0
  799. paddlex/modules/keypoint_detection/model_list.py +16 -0
  800. paddlex/modules/keypoint_detection/trainer.py +39 -0
  801. paddlex/modules/m_3d_bev_detection/__init__.py +18 -0
  802. paddlex/modules/m_3d_bev_detection/dataset_checker/__init__.py +95 -0
  803. paddlex/modules/m_3d_bev_detection/dataset_checker/dataset_src/__init__.py +17 -0
  804. paddlex/modules/m_3d_bev_detection/dataset_checker/dataset_src/analyse_dataset.py +106 -0
  805. paddlex/modules/m_3d_bev_detection/dataset_checker/dataset_src/check_dataset.py +101 -0
  806. paddlex/modules/m_3d_bev_detection/evaluator.py +46 -0
  807. paddlex/modules/m_3d_bev_detection/exportor.py +22 -0
  808. paddlex/modules/m_3d_bev_detection/model_list.py +18 -0
  809. paddlex/modules/m_3d_bev_detection/trainer.py +68 -0
  810. paddlex/modules/multilabel_classification/__init__.py +18 -0
  811. paddlex/modules/multilabel_classification/dataset_checker/__init__.py +106 -0
  812. paddlex/modules/multilabel_classification/dataset_checker/dataset_src/__init__.py +19 -0
  813. paddlex/modules/multilabel_classification/dataset_checker/dataset_src/analyse_dataset.py +94 -0
  814. paddlex/modules/multilabel_classification/dataset_checker/dataset_src/check_dataset.py +132 -0
  815. paddlex/modules/multilabel_classification/dataset_checker/dataset_src/convert_dataset.py +120 -0
  816. paddlex/modules/multilabel_classification/dataset_checker/dataset_src/split_dataset.py +81 -0
  817. paddlex/modules/multilabel_classification/dataset_checker/dataset_src/utils/__init__.py +13 -0
  818. paddlex/modules/multilabel_classification/dataset_checker/dataset_src/utils/visualizer.py +149 -0
  819. paddlex/modules/multilabel_classification/evaluator.py +43 -0
  820. paddlex/modules/multilabel_classification/exportor.py +22 -0
  821. paddlex/modules/multilabel_classification/model_list.py +24 -0
  822. paddlex/modules/multilabel_classification/trainer.py +85 -0
  823. paddlex/modules/multilingual_speech_recognition/__init__.py +18 -0
  824. paddlex/modules/multilingual_speech_recognition/dataset_checker.py +27 -0
  825. paddlex/modules/multilingual_speech_recognition/evaluator.py +27 -0
  826. paddlex/modules/multilingual_speech_recognition/exportor.py +27 -0
  827. paddlex/modules/multilingual_speech_recognition/model_list.py +22 -0
  828. paddlex/modules/multilingual_speech_recognition/trainer.py +42 -0
  829. paddlex/modules/object_detection/__init__.py +18 -0
  830. paddlex/modules/object_detection/dataset_checker/__init__.py +106 -0
  831. paddlex/modules/object_detection/dataset_checker/dataset_src/__init__.py +19 -0
  832. paddlex/modules/object_detection/dataset_checker/dataset_src/analyse_dataset.py +82 -0
  833. paddlex/modules/object_detection/dataset_checker/dataset_src/check_dataset.py +91 -0
  834. paddlex/modules/object_detection/dataset_checker/dataset_src/convert_dataset.py +438 -0
  835. paddlex/modules/object_detection/dataset_checker/dataset_src/split_dataset.py +123 -0
  836. paddlex/modules/object_detection/dataset_checker/dataset_src/utils/__init__.py +13 -0
  837. paddlex/modules/object_detection/dataset_checker/dataset_src/utils/visualizer.py +193 -0
  838. paddlex/modules/object_detection/evaluator.py +57 -0
  839. paddlex/modules/object_detection/exportor.py +22 -0
  840. paddlex/modules/object_detection/model_list.py +86 -0
  841. paddlex/modules/object_detection/trainer.py +98 -0
  842. paddlex/modules/open_vocabulary_detection/__init__.py +18 -0
  843. paddlex/modules/open_vocabulary_detection/dataset_checker.py +29 -0
  844. paddlex/modules/open_vocabulary_detection/evaluator.py +29 -0
  845. paddlex/modules/open_vocabulary_detection/exportor.py +29 -0
  846. paddlex/modules/open_vocabulary_detection/model_list.py +16 -0
  847. paddlex/modules/open_vocabulary_detection/trainer.py +44 -0
  848. paddlex/modules/open_vocabulary_segmentation/__init__.py +18 -0
  849. paddlex/modules/open_vocabulary_segmentation/dataset_checker.py +29 -0
  850. paddlex/modules/open_vocabulary_segmentation/evaluator.py +29 -0
  851. paddlex/modules/open_vocabulary_segmentation/exportor.py +29 -0
  852. paddlex/modules/open_vocabulary_segmentation/model_list.py +19 -0
  853. paddlex/modules/open_vocabulary_segmentation/trainer.py +44 -0
  854. paddlex/modules/semantic_segmentation/__init__.py +18 -0
  855. paddlex/modules/semantic_segmentation/dataset_checker/__init__.py +109 -0
  856. paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/__init__.py +19 -0
  857. paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/analyse_dataset.py +76 -0
  858. paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/check_dataset.py +80 -0
  859. paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/convert_dataset.py +165 -0
  860. paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/split_dataset.py +87 -0
  861. paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/utils/__init__.py +13 -0
  862. paddlex/modules/semantic_segmentation/dataset_checker/dataset_src/utils/visualizer.py +75 -0
  863. paddlex/modules/semantic_segmentation/evaluator.py +58 -0
  864. paddlex/modules/semantic_segmentation/exportor.py +31 -0
  865. paddlex/modules/semantic_segmentation/model_list.py +37 -0
  866. paddlex/modules/semantic_segmentation/trainer.py +72 -0
  867. paddlex/modules/table_recognition/__init__.py +18 -0
  868. paddlex/modules/table_recognition/dataset_checker/__init__.py +98 -0
  869. paddlex/modules/table_recognition/dataset_checker/dataset_src/__init__.py +18 -0
  870. paddlex/modules/table_recognition/dataset_checker/dataset_src/analyse_dataset.py +59 -0
  871. paddlex/modules/table_recognition/dataset_checker/dataset_src/check_dataset.py +87 -0
  872. paddlex/modules/table_recognition/dataset_checker/dataset_src/split_dataset.py +80 -0
  873. paddlex/modules/table_recognition/evaluator.py +43 -0
  874. paddlex/modules/table_recognition/exportor.py +22 -0
  875. paddlex/modules/table_recognition/model_list.py +21 -0
  876. paddlex/modules/table_recognition/trainer.py +67 -0
  877. paddlex/modules/text_detection/__init__.py +18 -0
  878. paddlex/modules/text_detection/dataset_checker/__init__.py +107 -0
  879. paddlex/modules/text_detection/dataset_checker/dataset_src/__init__.py +18 -0
  880. paddlex/modules/text_detection/dataset_checker/dataset_src/analyse_dataset.py +220 -0
  881. paddlex/modules/text_detection/dataset_checker/dataset_src/check_dataset.py +106 -0
  882. paddlex/modules/text_detection/dataset_checker/dataset_src/split_dataset.py +140 -0
  883. paddlex/modules/text_detection/evaluator.py +41 -0
  884. paddlex/modules/text_detection/exportor.py +22 -0
  885. paddlex/modules/text_detection/model_list.py +26 -0
  886. paddlex/modules/text_detection/trainer.py +65 -0
  887. paddlex/modules/text_recognition/__init__.py +18 -0
  888. paddlex/modules/text_recognition/dataset_checker/__init__.py +125 -0
  889. paddlex/modules/text_recognition/dataset_checker/dataset_src/__init__.py +19 -0
  890. paddlex/modules/text_recognition/dataset_checker/dataset_src/analyse_dataset.py +162 -0
  891. paddlex/modules/text_recognition/dataset_checker/dataset_src/check_dataset.py +104 -0
  892. paddlex/modules/text_recognition/dataset_checker/dataset_src/convert_dataset.py +95 -0
  893. paddlex/modules/text_recognition/dataset_checker/dataset_src/split_dataset.py +80 -0
  894. paddlex/modules/text_recognition/evaluator.py +64 -0
  895. paddlex/modules/text_recognition/exportor.py +22 -0
  896. paddlex/modules/text_recognition/model_list.py +36 -0
  897. paddlex/modules/text_recognition/trainer.py +105 -0
  898. paddlex/modules/ts_anomaly_detection/__init__.py +19 -0
  899. paddlex/modules/ts_anomaly_detection/dataset_checker/__init__.py +111 -0
  900. paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/__init__.py +19 -0
  901. paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/analyse_dataset.py +19 -0
  902. paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/check_dataset.py +64 -0
  903. paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/convert_dataset.py +74 -0
  904. paddlex/modules/ts_anomaly_detection/dataset_checker/dataset_src/split_dataset.py +63 -0
  905. paddlex/modules/ts_anomaly_detection/evaluator.py +67 -0
  906. paddlex/modules/ts_anomaly_detection/exportor.py +44 -0
  907. paddlex/modules/ts_anomaly_detection/model_list.py +22 -0
  908. paddlex/modules/ts_anomaly_detection/trainer.py +113 -0
  909. paddlex/modules/ts_classification/__init__.py +19 -0
  910. paddlex/modules/ts_classification/dataset_checker/__init__.py +111 -0
  911. paddlex/modules/ts_classification/dataset_checker/dataset_src/__init__.py +19 -0
  912. paddlex/modules/ts_classification/dataset_checker/dataset_src/analyse_dataset.py +77 -0
  913. paddlex/modules/ts_classification/dataset_checker/dataset_src/check_dataset.py +64 -0
  914. paddlex/modules/ts_classification/dataset_checker/dataset_src/convert_dataset.py +74 -0
  915. paddlex/modules/ts_classification/dataset_checker/dataset_src/split_dataset.py +88 -0
  916. paddlex/modules/ts_classification/evaluator.py +66 -0
  917. paddlex/modules/ts_classification/exportor.py +44 -0
  918. paddlex/modules/ts_classification/model_list.py +18 -0
  919. paddlex/modules/ts_classification/trainer.py +108 -0
  920. paddlex/modules/ts_forecast/__init__.py +19 -0
  921. paddlex/modules/ts_forecast/dataset_checker/__init__.py +111 -0
  922. paddlex/modules/ts_forecast/dataset_checker/dataset_src/__init__.py +19 -0
  923. paddlex/modules/ts_forecast/dataset_checker/dataset_src/analyse_dataset.py +19 -0
  924. paddlex/modules/ts_forecast/dataset_checker/dataset_src/check_dataset.py +64 -0
  925. paddlex/modules/ts_forecast/dataset_checker/dataset_src/convert_dataset.py +73 -0
  926. paddlex/modules/ts_forecast/dataset_checker/dataset_src/split_dataset.py +63 -0
  927. paddlex/modules/ts_forecast/evaluator.py +66 -0
  928. paddlex/modules/ts_forecast/exportor.py +44 -0
  929. paddlex/modules/ts_forecast/model_list.py +24 -0
  930. paddlex/modules/ts_forecast/trainer.py +108 -0
  931. paddlex/modules/video_classification/__init__.py +18 -0
  932. paddlex/modules/video_classification/dataset_checker/__init__.py +93 -0
  933. paddlex/modules/video_classification/dataset_checker/dataset_src/__init__.py +18 -0
  934. paddlex/modules/video_classification/dataset_checker/dataset_src/analyse_dataset.py +93 -0
  935. paddlex/modules/video_classification/dataset_checker/dataset_src/check_dataset.py +120 -0
  936. paddlex/modules/video_classification/dataset_checker/dataset_src/split_dataset.py +82 -0
  937. paddlex/modules/video_classification/evaluator.py +44 -0
  938. paddlex/modules/video_classification/exportor.py +22 -0
  939. paddlex/modules/video_classification/model_list.py +19 -0
  940. paddlex/modules/video_classification/trainer.py +88 -0
  941. paddlex/modules/video_detection/__init__.py +18 -0
  942. paddlex/modules/video_detection/dataset_checker/__init__.py +86 -0
  943. paddlex/modules/video_detection/dataset_checker/dataset_src/__init__.py +17 -0
  944. paddlex/modules/video_detection/dataset_checker/dataset_src/analyse_dataset.py +100 -0
  945. paddlex/modules/video_detection/dataset_checker/dataset_src/check_dataset.py +132 -0
  946. paddlex/modules/video_detection/evaluator.py +42 -0
  947. paddlex/modules/video_detection/exportor.py +22 -0
  948. paddlex/modules/video_detection/model_list.py +15 -0
  949. paddlex/modules/video_detection/trainer.py +82 -0
  950. paddlex/ops/__init__.py +152 -0
  951. paddlex/ops/iou3d_nms/iou3d_cpu.cpp +266 -0
  952. paddlex/ops/iou3d_nms/iou3d_cpu.h +28 -0
  953. paddlex/ops/iou3d_nms/iou3d_nms.cpp +206 -0
  954. paddlex/ops/iou3d_nms/iou3d_nms.h +35 -0
  955. paddlex/ops/iou3d_nms/iou3d_nms_api.cpp +114 -0
  956. paddlex/ops/iou3d_nms/iou3d_nms_kernel.cu +484 -0
  957. paddlex/ops/setup.py +37 -0
  958. paddlex/ops/voxel/voxelize_op.cc +194 -0
  959. paddlex/ops/voxel/voxelize_op.cu +346 -0
  960. paddlex/paddlex_cli.py +476 -0
  961. paddlex/repo_apis/Paddle3D_api/__init__.py +17 -0
  962. paddlex/repo_apis/Paddle3D_api/bev_fusion/__init__.py +18 -0
  963. paddlex/repo_apis/Paddle3D_api/bev_fusion/config.py +118 -0
  964. paddlex/repo_apis/Paddle3D_api/bev_fusion/model.py +238 -0
  965. paddlex/repo_apis/Paddle3D_api/bev_fusion/register.py +55 -0
  966. paddlex/repo_apis/Paddle3D_api/bev_fusion/runner.py +104 -0
  967. paddlex/repo_apis/Paddle3D_api/pp3d_config.py +145 -0
  968. paddlex/repo_apis/PaddleClas_api/__init__.py +17 -0
  969. paddlex/repo_apis/PaddleClas_api/cls/__init__.py +19 -0
  970. paddlex/repo_apis/PaddleClas_api/cls/config.py +595 -0
  971. paddlex/repo_apis/PaddleClas_api/cls/model.py +355 -0
  972. paddlex/repo_apis/PaddleClas_api/cls/register.py +907 -0
  973. paddlex/repo_apis/PaddleClas_api/cls/runner.py +218 -0
  974. paddlex/repo_apis/PaddleClas_api/shitu_rec/__init__.py +18 -0
  975. paddlex/repo_apis/PaddleClas_api/shitu_rec/config.py +141 -0
  976. paddlex/repo_apis/PaddleClas_api/shitu_rec/model.py +20 -0
  977. paddlex/repo_apis/PaddleClas_api/shitu_rec/register.py +68 -0
  978. paddlex/repo_apis/PaddleClas_api/shitu_rec/runner.py +50 -0
  979. paddlex/repo_apis/PaddleDetection_api/__init__.py +17 -0
  980. paddlex/repo_apis/PaddleDetection_api/config_helper.py +280 -0
  981. paddlex/repo_apis/PaddleDetection_api/instance_seg/__init__.py +18 -0
  982. paddlex/repo_apis/PaddleDetection_api/instance_seg/config.py +457 -0
  983. paddlex/repo_apis/PaddleDetection_api/instance_seg/model.py +403 -0
  984. paddlex/repo_apis/PaddleDetection_api/instance_seg/register.py +262 -0
  985. paddlex/repo_apis/PaddleDetection_api/instance_seg/runner.py +225 -0
  986. paddlex/repo_apis/PaddleDetection_api/object_det/__init__.py +19 -0
  987. paddlex/repo_apis/PaddleDetection_api/object_det/config.py +540 -0
  988. paddlex/repo_apis/PaddleDetection_api/object_det/model.py +429 -0
  989. paddlex/repo_apis/PaddleDetection_api/object_det/official_categories.py +245 -0
  990. paddlex/repo_apis/PaddleDetection_api/object_det/register.py +1135 -0
  991. paddlex/repo_apis/PaddleDetection_api/object_det/runner.py +225 -0
  992. paddlex/repo_apis/PaddleNLP_api/__init__.py +13 -0
  993. paddlex/repo_apis/PaddleOCR_api/__init__.py +22 -0
  994. paddlex/repo_apis/PaddleOCR_api/config_utils.py +53 -0
  995. paddlex/repo_apis/PaddleOCR_api/formula_rec/__init__.py +16 -0
  996. paddlex/repo_apis/PaddleOCR_api/formula_rec/config.py +571 -0
  997. paddlex/repo_apis/PaddleOCR_api/formula_rec/model.py +398 -0
  998. paddlex/repo_apis/PaddleOCR_api/formula_rec/register.py +99 -0
  999. paddlex/repo_apis/PaddleOCR_api/formula_rec/runner.py +239 -0
  1000. paddlex/repo_apis/PaddleOCR_api/table_rec/__init__.py +16 -0
  1001. paddlex/repo_apis/PaddleOCR_api/table_rec/config.py +64 -0
  1002. paddlex/repo_apis/PaddleOCR_api/table_rec/model.py +126 -0
  1003. paddlex/repo_apis/PaddleOCR_api/table_rec/register.py +70 -0
  1004. paddlex/repo_apis/PaddleOCR_api/table_rec/runner.py +51 -0
  1005. paddlex/repo_apis/PaddleOCR_api/text_det/__init__.py +16 -0
  1006. paddlex/repo_apis/PaddleOCR_api/text_det/config.py +62 -0
  1007. paddlex/repo_apis/PaddleOCR_api/text_det/model.py +72 -0
  1008. paddlex/repo_apis/PaddleOCR_api/text_det/register.py +107 -0
  1009. paddlex/repo_apis/PaddleOCR_api/text_det/runner.py +53 -0
  1010. paddlex/repo_apis/PaddleOCR_api/text_rec/__init__.py +16 -0
  1011. paddlex/repo_apis/PaddleOCR_api/text_rec/config.py +564 -0
  1012. paddlex/repo_apis/PaddleOCR_api/text_rec/model.py +398 -0
  1013. paddlex/repo_apis/PaddleOCR_api/text_rec/register.py +216 -0
  1014. paddlex/repo_apis/PaddleOCR_api/text_rec/runner.py +239 -0
  1015. paddlex/repo_apis/PaddleSeg_api/__init__.py +16 -0
  1016. paddlex/repo_apis/PaddleSeg_api/base_seg_config.py +134 -0
  1017. paddlex/repo_apis/PaddleSeg_api/seg/__init__.py +16 -0
  1018. paddlex/repo_apis/PaddleSeg_api/seg/config.py +183 -0
  1019. paddlex/repo_apis/PaddleSeg_api/seg/model.py +491 -0
  1020. paddlex/repo_apis/PaddleSeg_api/seg/register.py +272 -0
  1021. paddlex/repo_apis/PaddleSeg_api/seg/runner.py +261 -0
  1022. paddlex/repo_apis/PaddleTS_api/__init__.py +20 -0
  1023. paddlex/repo_apis/PaddleTS_api/ts_ad/__init__.py +16 -0
  1024. paddlex/repo_apis/PaddleTS_api/ts_ad/config.py +88 -0
  1025. paddlex/repo_apis/PaddleTS_api/ts_ad/register.py +146 -0
  1026. paddlex/repo_apis/PaddleTS_api/ts_ad/runner.py +158 -0
  1027. paddlex/repo_apis/PaddleTS_api/ts_base/__init__.py +13 -0
  1028. paddlex/repo_apis/PaddleTS_api/ts_base/config.py +244 -0
  1029. paddlex/repo_apis/PaddleTS_api/ts_base/model.py +276 -0
  1030. paddlex/repo_apis/PaddleTS_api/ts_base/runner.py +158 -0
  1031. paddlex/repo_apis/PaddleTS_api/ts_cls/__init__.py +16 -0
  1032. paddlex/repo_apis/PaddleTS_api/ts_cls/config.py +72 -0
  1033. paddlex/repo_apis/PaddleTS_api/ts_cls/register.py +59 -0
  1034. paddlex/repo_apis/PaddleTS_api/ts_cls/runner.py +158 -0
  1035. paddlex/repo_apis/PaddleTS_api/ts_fc/__init__.py +16 -0
  1036. paddlex/repo_apis/PaddleTS_api/ts_fc/config.py +136 -0
  1037. paddlex/repo_apis/PaddleTS_api/ts_fc/register.py +186 -0
  1038. paddlex/repo_apis/PaddleVideo_api/__init__.py +17 -0
  1039. paddlex/repo_apis/PaddleVideo_api/config_utils.py +51 -0
  1040. paddlex/repo_apis/PaddleVideo_api/video_cls/__init__.py +19 -0
  1041. paddlex/repo_apis/PaddleVideo_api/video_cls/config.py +548 -0
  1042. paddlex/repo_apis/PaddleVideo_api/video_cls/model.py +346 -0
  1043. paddlex/repo_apis/PaddleVideo_api/video_cls/register.py +70 -0
  1044. paddlex/repo_apis/PaddleVideo_api/video_cls/runner.py +204 -0
  1045. paddlex/repo_apis/PaddleVideo_api/video_det/__init__.py +19 -0
  1046. paddlex/repo_apis/PaddleVideo_api/video_det/config.py +549 -0
  1047. paddlex/repo_apis/PaddleVideo_api/video_det/model.py +298 -0
  1048. paddlex/repo_apis/PaddleVideo_api/video_det/register.py +44 -0
  1049. paddlex/repo_apis/PaddleVideo_api/video_det/runner.py +199 -0
  1050. paddlex/repo_apis/__init__.py +13 -0
  1051. paddlex/repo_apis/base/__init__.py +22 -0
  1052. paddlex/repo_apis/base/config.py +237 -0
  1053. paddlex/repo_apis/base/model.py +563 -0
  1054. paddlex/repo_apis/base/register.py +135 -0
  1055. paddlex/repo_apis/base/runner.py +390 -0
  1056. paddlex/repo_apis/base/utils/__init__.py +13 -0
  1057. paddlex/repo_apis/base/utils/arg.py +64 -0
  1058. paddlex/repo_apis/base/utils/subprocess.py +107 -0
  1059. paddlex/repo_manager/__init__.py +17 -0
  1060. paddlex/repo_manager/core.py +253 -0
  1061. paddlex/repo_manager/meta.py +180 -0
  1062. paddlex/repo_manager/repo.py +425 -0
  1063. paddlex/repo_manager/utils.py +148 -0
  1064. paddlex/utils/__init__.py +1 -12
  1065. paddlex/utils/cache.py +146 -0
  1066. paddlex/utils/config.py +216 -0
  1067. paddlex/utils/custom_device_list.py +311 -0
  1068. paddlex/utils/deps.py +249 -0
  1069. paddlex/utils/device.py +195 -0
  1070. paddlex/utils/download.py +168 -182
  1071. paddlex/utils/env.py +31 -48
  1072. paddlex/utils/errors/__init__.py +17 -0
  1073. paddlex/utils/errors/dataset_checker.py +78 -0
  1074. paddlex/utils/errors/others.py +138 -0
  1075. paddlex/utils/file_interface.py +211 -0
  1076. paddlex/utils/flags.py +70 -0
  1077. paddlex/utils/fonts/__init__.py +97 -0
  1078. paddlex/utils/func_register.py +41 -0
  1079. paddlex/utils/install.py +87 -0
  1080. paddlex/utils/interactive_get_pipeline.py +55 -0
  1081. paddlex/utils/lazy_loader.py +68 -0
  1082. paddlex/utils/logging.py +140 -33
  1083. paddlex/utils/misc.py +201 -0
  1084. paddlex/utils/pipeline_arguments.py +719 -0
  1085. paddlex/utils/result_saver.py +58 -0
  1086. paddlex/utils/subclass_register.py +99 -0
  1087. paddlex/version.py +55 -0
  1088. paddlex-3.0.0.dist-info/METADATA +1168 -0
  1089. paddlex-3.0.0.dist-info/RECORD +1093 -0
  1090. paddlex-3.0.0.dist-info/WHEEL +5 -0
  1091. paddlex-3.0.0.dist-info/entry_points.txt +2 -0
  1092. paddlex-3.0.0.dist-info/licenses/LICENSE +169 -0
  1093. paddlex-3.0.0.dist-info/top_level.txt +1 -0
  1094. PaddleClas/__init__.py +0 -16
  1095. PaddleClas/paddleclas.py +0 -375
  1096. PaddleClas/ppcls/__init__.py +0 -20
  1097. PaddleClas/ppcls/data/__init__.py +0 -15
  1098. PaddleClas/ppcls/data/imaug/__init__.py +0 -94
  1099. PaddleClas/ppcls/data/imaug/autoaugment.py +0 -264
  1100. PaddleClas/ppcls/data/imaug/batch_operators.py +0 -117
  1101. PaddleClas/ppcls/data/imaug/cutout.py +0 -41
  1102. PaddleClas/ppcls/data/imaug/fmix.py +0 -217
  1103. PaddleClas/ppcls/data/imaug/grid.py +0 -89
  1104. PaddleClas/ppcls/data/imaug/hide_and_seek.py +0 -44
  1105. PaddleClas/ppcls/data/imaug/operators.py +0 -244
  1106. PaddleClas/ppcls/data/imaug/randaugment.py +0 -106
  1107. PaddleClas/ppcls/data/imaug/random_erasing.py +0 -55
  1108. PaddleClas/ppcls/data/reader.py +0 -318
  1109. PaddleClas/ppcls/modeling/__init__.py +0 -20
  1110. PaddleClas/ppcls/modeling/architectures/__init__.py +0 -51
  1111. PaddleClas/ppcls/modeling/architectures/alexnet.py +0 -132
  1112. PaddleClas/ppcls/modeling/architectures/darknet.py +0 -161
  1113. PaddleClas/ppcls/modeling/architectures/densenet.py +0 -308
  1114. PaddleClas/ppcls/modeling/architectures/distillation_models.py +0 -65
  1115. PaddleClas/ppcls/modeling/architectures/distilled_vision_transformer.py +0 -196
  1116. PaddleClas/ppcls/modeling/architectures/dpn.py +0 -425
  1117. PaddleClas/ppcls/modeling/architectures/efficientnet.py +0 -901
  1118. PaddleClas/ppcls/modeling/architectures/ghostnet.py +0 -331
  1119. PaddleClas/ppcls/modeling/architectures/googlenet.py +0 -207
  1120. PaddleClas/ppcls/modeling/architectures/hrnet.py +0 -742
  1121. PaddleClas/ppcls/modeling/architectures/inception_v3.py +0 -481
  1122. PaddleClas/ppcls/modeling/architectures/inception_v4.py +0 -455
  1123. PaddleClas/ppcls/modeling/architectures/mixnet.py +0 -782
  1124. PaddleClas/ppcls/modeling/architectures/mobilenet_v1.py +0 -266
  1125. PaddleClas/ppcls/modeling/architectures/mobilenet_v2.py +0 -248
  1126. PaddleClas/ppcls/modeling/architectures/mobilenet_v3.py +0 -359
  1127. PaddleClas/ppcls/modeling/architectures/regnet.py +0 -383
  1128. PaddleClas/ppcls/modeling/architectures/repvgg.py +0 -339
  1129. PaddleClas/ppcls/modeling/architectures/res2net.py +0 -272
  1130. PaddleClas/ppcls/modeling/architectures/res2net_vd.py +0 -295
  1131. PaddleClas/ppcls/modeling/architectures/resnest.py +0 -705
  1132. PaddleClas/ppcls/modeling/architectures/resnet.py +0 -316
  1133. PaddleClas/ppcls/modeling/architectures/resnet_vc.py +0 -309
  1134. PaddleClas/ppcls/modeling/architectures/resnet_vd.py +0 -354
  1135. PaddleClas/ppcls/modeling/architectures/resnext.py +0 -253
  1136. PaddleClas/ppcls/modeling/architectures/resnext101_wsl.py +0 -447
  1137. PaddleClas/ppcls/modeling/architectures/resnext_vd.py +0 -266
  1138. PaddleClas/ppcls/modeling/architectures/rexnet.py +0 -240
  1139. PaddleClas/ppcls/modeling/architectures/se_resnet_vd.py +0 -378
  1140. PaddleClas/ppcls/modeling/architectures/se_resnext.py +0 -290
  1141. PaddleClas/ppcls/modeling/architectures/se_resnext_vd.py +0 -285
  1142. PaddleClas/ppcls/modeling/architectures/shufflenet_v2.py +0 -320
  1143. PaddleClas/ppcls/modeling/architectures/squeezenet.py +0 -154
  1144. PaddleClas/ppcls/modeling/architectures/vgg.py +0 -152
  1145. PaddleClas/ppcls/modeling/architectures/vision_transformer.py +0 -402
  1146. PaddleClas/ppcls/modeling/architectures/xception.py +0 -345
  1147. PaddleClas/ppcls/modeling/architectures/xception_deeplab.py +0 -386
  1148. PaddleClas/ppcls/modeling/loss.py +0 -154
  1149. PaddleClas/ppcls/modeling/utils.py +0 -53
  1150. PaddleClas/ppcls/optimizer/__init__.py +0 -19
  1151. PaddleClas/ppcls/optimizer/learning_rate.py +0 -159
  1152. PaddleClas/ppcls/optimizer/optimizer.py +0 -165
  1153. PaddleClas/ppcls/utils/__init__.py +0 -27
  1154. PaddleClas/ppcls/utils/check.py +0 -151
  1155. PaddleClas/ppcls/utils/config.py +0 -201
  1156. PaddleClas/ppcls/utils/logger.py +0 -120
  1157. PaddleClas/ppcls/utils/metrics.py +0 -107
  1158. PaddleClas/ppcls/utils/misc.py +0 -62
  1159. PaddleClas/ppcls/utils/model_zoo.py +0 -213
  1160. PaddleClas/ppcls/utils/save_load.py +0 -163
  1161. PaddleClas/setup.py +0 -55
  1162. PaddleClas/tools/__init__.py +0 -15
  1163. PaddleClas/tools/download.py +0 -50
  1164. PaddleClas/tools/ema.py +0 -58
  1165. PaddleClas/tools/eval.py +0 -112
  1166. PaddleClas/tools/export_model.py +0 -85
  1167. PaddleClas/tools/export_serving_model.py +0 -76
  1168. PaddleClas/tools/infer/__init__.py +0 -16
  1169. PaddleClas/tools/infer/infer.py +0 -94
  1170. PaddleClas/tools/infer/predict.py +0 -117
  1171. PaddleClas/tools/infer/utils.py +0 -233
  1172. PaddleClas/tools/program.py +0 -444
  1173. PaddleClas/tools/test_hubserving.py +0 -113
  1174. PaddleClas/tools/train.py +0 -141
  1175. paddlex/cls.py +0 -76
  1176. paddlex/command.py +0 -215
  1177. paddlex/cv/__init__.py +0 -17
  1178. paddlex/cv/datasets/__init__.py +0 -18
  1179. paddlex/cv/datasets/coco.py +0 -169
  1180. paddlex/cv/datasets/imagenet.py +0 -88
  1181. paddlex/cv/datasets/seg_dataset.py +0 -91
  1182. paddlex/cv/datasets/voc.py +0 -301
  1183. paddlex/cv/models/__init__.py +0 -18
  1184. paddlex/cv/models/base.py +0 -623
  1185. paddlex/cv/models/classifier.py +0 -814
  1186. paddlex/cv/models/detector.py +0 -1747
  1187. paddlex/cv/models/load_model.py +0 -126
  1188. paddlex/cv/models/segmenter.py +0 -673
  1189. paddlex/cv/models/slim/__init__.py +0 -13
  1190. paddlex/cv/models/slim/prune.py +0 -55
  1191. paddlex/cv/models/utils/__init__.py +0 -13
  1192. paddlex/cv/models/utils/det_metrics/__init__.py +0 -15
  1193. paddlex/cv/models/utils/det_metrics/coco_utils.py +0 -217
  1194. paddlex/cv/models/utils/det_metrics/metrics.py +0 -220
  1195. paddlex/cv/models/utils/ema.py +0 -48
  1196. paddlex/cv/models/utils/seg_metrics.py +0 -62
  1197. paddlex/cv/models/utils/visualize.py +0 -394
  1198. paddlex/cv/transforms/__init__.py +0 -46
  1199. paddlex/cv/transforms/batch_operators.py +0 -286
  1200. paddlex/cv/transforms/box_utils.py +0 -41
  1201. paddlex/cv/transforms/functions.py +0 -193
  1202. paddlex/cv/transforms/operators.py +0 -1402
  1203. paddlex/det.py +0 -43
  1204. paddlex/paddleseg/__init__.py +0 -17
  1205. paddlex/paddleseg/core/__init__.py +0 -20
  1206. paddlex/paddleseg/core/infer.py +0 -289
  1207. paddlex/paddleseg/core/predict.py +0 -145
  1208. paddlex/paddleseg/core/train.py +0 -258
  1209. paddlex/paddleseg/core/val.py +0 -172
  1210. paddlex/paddleseg/cvlibs/__init__.py +0 -17
  1211. paddlex/paddleseg/cvlibs/callbacks.py +0 -279
  1212. paddlex/paddleseg/cvlibs/config.py +0 -359
  1213. paddlex/paddleseg/cvlibs/manager.py +0 -142
  1214. paddlex/paddleseg/cvlibs/param_init.py +0 -91
  1215. paddlex/paddleseg/datasets/__init__.py +0 -21
  1216. paddlex/paddleseg/datasets/ade.py +0 -112
  1217. paddlex/paddleseg/datasets/cityscapes.py +0 -86
  1218. paddlex/paddleseg/datasets/cocostuff.py +0 -79
  1219. paddlex/paddleseg/datasets/dataset.py +0 -164
  1220. paddlex/paddleseg/datasets/mini_deep_globe_road_extraction.py +0 -95
  1221. paddlex/paddleseg/datasets/optic_disc_seg.py +0 -97
  1222. paddlex/paddleseg/datasets/pascal_context.py +0 -80
  1223. paddlex/paddleseg/datasets/voc.py +0 -113
  1224. paddlex/paddleseg/models/__init__.py +0 -39
  1225. paddlex/paddleseg/models/ann.py +0 -436
  1226. paddlex/paddleseg/models/attention_unet.py +0 -189
  1227. paddlex/paddleseg/models/backbones/__init__.py +0 -18
  1228. paddlex/paddleseg/models/backbones/hrnet.py +0 -815
  1229. paddlex/paddleseg/models/backbones/mobilenetv3.py +0 -365
  1230. paddlex/paddleseg/models/backbones/resnet_vd.py +0 -364
  1231. paddlex/paddleseg/models/backbones/xception_deeplab.py +0 -415
  1232. paddlex/paddleseg/models/bisenet.py +0 -311
  1233. paddlex/paddleseg/models/danet.py +0 -220
  1234. paddlex/paddleseg/models/decoupled_segnet.py +0 -233
  1235. paddlex/paddleseg/models/deeplab.py +0 -258
  1236. paddlex/paddleseg/models/dnlnet.py +0 -231
  1237. paddlex/paddleseg/models/emanet.py +0 -219
  1238. paddlex/paddleseg/models/fast_scnn.py +0 -318
  1239. paddlex/paddleseg/models/fcn.py +0 -135
  1240. paddlex/paddleseg/models/gcnet.py +0 -223
  1241. paddlex/paddleseg/models/gscnn.py +0 -357
  1242. paddlex/paddleseg/models/hardnet.py +0 -309
  1243. paddlex/paddleseg/models/isanet.py +0 -202
  1244. paddlex/paddleseg/models/layers/__init__.py +0 -19
  1245. paddlex/paddleseg/models/layers/activation.py +0 -73
  1246. paddlex/paddleseg/models/layers/attention.py +0 -146
  1247. paddlex/paddleseg/models/layers/layer_libs.py +0 -168
  1248. paddlex/paddleseg/models/layers/nonlocal2d.py +0 -155
  1249. paddlex/paddleseg/models/layers/pyramid_pool.py +0 -182
  1250. paddlex/paddleseg/models/losses/__init__.py +0 -27
  1251. paddlex/paddleseg/models/losses/binary_cross_entropy_loss.py +0 -174
  1252. paddlex/paddleseg/models/losses/bootstrapped_cross_entropy.py +0 -73
  1253. paddlex/paddleseg/models/losses/cross_entropy_loss.py +0 -94
  1254. paddlex/paddleseg/models/losses/decoupledsegnet_relax_boundary_loss.py +0 -129
  1255. paddlex/paddleseg/models/losses/dice_loss.py +0 -61
  1256. paddlex/paddleseg/models/losses/edge_attention_loss.py +0 -78
  1257. paddlex/paddleseg/models/losses/gscnn_dual_task_loss.py +0 -141
  1258. paddlex/paddleseg/models/losses/l1_loss.py +0 -76
  1259. paddlex/paddleseg/models/losses/lovasz_loss.py +0 -222
  1260. paddlex/paddleseg/models/losses/mean_square_error_loss.py +0 -65
  1261. paddlex/paddleseg/models/losses/mixed_loss.py +0 -58
  1262. paddlex/paddleseg/models/losses/ohem_cross_entropy_loss.py +0 -99
  1263. paddlex/paddleseg/models/losses/ohem_edge_attention_loss.py +0 -114
  1264. paddlex/paddleseg/models/ocrnet.py +0 -248
  1265. paddlex/paddleseg/models/pspnet.py +0 -147
  1266. paddlex/paddleseg/models/sfnet.py +0 -236
  1267. paddlex/paddleseg/models/shufflenet_slim.py +0 -268
  1268. paddlex/paddleseg/models/u2net.py +0 -574
  1269. paddlex/paddleseg/models/unet.py +0 -155
  1270. paddlex/paddleseg/models/unet_3plus.py +0 -316
  1271. paddlex/paddleseg/models/unet_plusplus.py +0 -237
  1272. paddlex/paddleseg/transforms/__init__.py +0 -16
  1273. paddlex/paddleseg/transforms/functional.py +0 -161
  1274. paddlex/paddleseg/transforms/transforms.py +0 -937
  1275. paddlex/paddleseg/utils/__init__.py +0 -22
  1276. paddlex/paddleseg/utils/config_check.py +0 -60
  1277. paddlex/paddleseg/utils/download.py +0 -163
  1278. paddlex/paddleseg/utils/env/__init__.py +0 -16
  1279. paddlex/paddleseg/utils/env/seg_env.py +0 -56
  1280. paddlex/paddleseg/utils/env/sys_env.py +0 -122
  1281. paddlex/paddleseg/utils/logger.py +0 -48
  1282. paddlex/paddleseg/utils/metrics.py +0 -146
  1283. paddlex/paddleseg/utils/progbar.py +0 -212
  1284. paddlex/paddleseg/utils/timer.py +0 -53
  1285. paddlex/paddleseg/utils/utils.py +0 -120
  1286. paddlex/paddleseg/utils/visualize.py +0 -90
  1287. paddlex/ppcls/__init__.py +0 -20
  1288. paddlex/ppcls/data/__init__.py +0 -15
  1289. paddlex/ppcls/data/imaug/__init__.py +0 -94
  1290. paddlex/ppcls/data/imaug/autoaugment.py +0 -264
  1291. paddlex/ppcls/data/imaug/batch_operators.py +0 -117
  1292. paddlex/ppcls/data/imaug/cutout.py +0 -41
  1293. paddlex/ppcls/data/imaug/fmix.py +0 -217
  1294. paddlex/ppcls/data/imaug/grid.py +0 -89
  1295. paddlex/ppcls/data/imaug/hide_and_seek.py +0 -44
  1296. paddlex/ppcls/data/imaug/operators.py +0 -256
  1297. paddlex/ppcls/data/imaug/randaugment.py +0 -106
  1298. paddlex/ppcls/data/imaug/random_erasing.py +0 -55
  1299. paddlex/ppcls/data/reader.py +0 -318
  1300. paddlex/ppcls/modeling/__init__.py +0 -20
  1301. paddlex/ppcls/modeling/architectures/__init__.py +0 -51
  1302. paddlex/ppcls/modeling/architectures/alexnet.py +0 -132
  1303. paddlex/ppcls/modeling/architectures/darknet.py +0 -161
  1304. paddlex/ppcls/modeling/architectures/densenet.py +0 -308
  1305. paddlex/ppcls/modeling/architectures/distillation_models.py +0 -65
  1306. paddlex/ppcls/modeling/architectures/distilled_vision_transformer.py +0 -196
  1307. paddlex/ppcls/modeling/architectures/dpn.py +0 -425
  1308. paddlex/ppcls/modeling/architectures/efficientnet.py +0 -901
  1309. paddlex/ppcls/modeling/architectures/ghostnet.py +0 -331
  1310. paddlex/ppcls/modeling/architectures/googlenet.py +0 -207
  1311. paddlex/ppcls/modeling/architectures/hrnet.py +0 -742
  1312. paddlex/ppcls/modeling/architectures/inception_v3.py +0 -541
  1313. paddlex/ppcls/modeling/architectures/inception_v4.py +0 -455
  1314. paddlex/ppcls/modeling/architectures/mixnet.py +0 -782
  1315. paddlex/ppcls/modeling/architectures/mobilenet_v1.py +0 -266
  1316. paddlex/ppcls/modeling/architectures/mobilenet_v2.py +0 -248
  1317. paddlex/ppcls/modeling/architectures/mobilenet_v3.py +0 -359
  1318. paddlex/ppcls/modeling/architectures/regnet.py +0 -383
  1319. paddlex/ppcls/modeling/architectures/repvgg.py +0 -339
  1320. paddlex/ppcls/modeling/architectures/res2net.py +0 -272
  1321. paddlex/ppcls/modeling/architectures/res2net_vd.py +0 -295
  1322. paddlex/ppcls/modeling/architectures/resnest.py +0 -705
  1323. paddlex/ppcls/modeling/architectures/resnet.py +0 -317
  1324. paddlex/ppcls/modeling/architectures/resnet_vc.py +0 -309
  1325. paddlex/ppcls/modeling/architectures/resnet_vd.py +0 -354
  1326. paddlex/ppcls/modeling/architectures/resnext.py +0 -259
  1327. paddlex/ppcls/modeling/architectures/resnext101_wsl.py +0 -447
  1328. paddlex/ppcls/modeling/architectures/resnext_vd.py +0 -266
  1329. paddlex/ppcls/modeling/architectures/rexnet.py +0 -240
  1330. paddlex/ppcls/modeling/architectures/se_resnet_vd.py +0 -378
  1331. paddlex/ppcls/modeling/architectures/se_resnext.py +0 -290
  1332. paddlex/ppcls/modeling/architectures/se_resnext_vd.py +0 -285
  1333. paddlex/ppcls/modeling/architectures/shufflenet_v2.py +0 -320
  1334. paddlex/ppcls/modeling/architectures/squeezenet.py +0 -154
  1335. paddlex/ppcls/modeling/architectures/vgg.py +0 -152
  1336. paddlex/ppcls/modeling/architectures/vision_transformer.py +0 -402
  1337. paddlex/ppcls/modeling/architectures/xception.py +0 -345
  1338. paddlex/ppcls/modeling/architectures/xception_deeplab.py +0 -386
  1339. paddlex/ppcls/modeling/loss.py +0 -158
  1340. paddlex/ppcls/modeling/utils.py +0 -53
  1341. paddlex/ppcls/optimizer/__init__.py +0 -19
  1342. paddlex/ppcls/optimizer/learning_rate.py +0 -159
  1343. paddlex/ppcls/optimizer/optimizer.py +0 -165
  1344. paddlex/ppcls/utils/__init__.py +0 -27
  1345. paddlex/ppcls/utils/check.py +0 -151
  1346. paddlex/ppcls/utils/config.py +0 -201
  1347. paddlex/ppcls/utils/logger.py +0 -120
  1348. paddlex/ppcls/utils/metrics.py +0 -112
  1349. paddlex/ppcls/utils/misc.py +0 -62
  1350. paddlex/ppcls/utils/model_zoo.py +0 -213
  1351. paddlex/ppcls/utils/save_load.py +0 -163
  1352. paddlex/ppdet/__init__.py +0 -16
  1353. paddlex/ppdet/core/__init__.py +0 -15
  1354. paddlex/ppdet/core/config/__init__.py +0 -13
  1355. paddlex/ppdet/core/config/schema.py +0 -248
  1356. paddlex/ppdet/core/config/yaml_helpers.py +0 -118
  1357. paddlex/ppdet/core/workspace.py +0 -279
  1358. paddlex/ppdet/data/__init__.py +0 -21
  1359. paddlex/ppdet/data/reader.py +0 -304
  1360. paddlex/ppdet/data/shm_utils.py +0 -67
  1361. paddlex/ppdet/data/source/__init__.py +0 -27
  1362. paddlex/ppdet/data/source/category.py +0 -823
  1363. paddlex/ppdet/data/source/coco.py +0 -243
  1364. paddlex/ppdet/data/source/dataset.py +0 -192
  1365. paddlex/ppdet/data/source/keypoint_coco.py +0 -656
  1366. paddlex/ppdet/data/source/mot.py +0 -360
  1367. paddlex/ppdet/data/source/voc.py +0 -204
  1368. paddlex/ppdet/data/source/widerface.py +0 -180
  1369. paddlex/ppdet/data/transform/__init__.py +0 -28
  1370. paddlex/ppdet/data/transform/autoaugment_utils.py +0 -1593
  1371. paddlex/ppdet/data/transform/batch_operators.py +0 -758
  1372. paddlex/ppdet/data/transform/gridmask_utils.py +0 -83
  1373. paddlex/ppdet/data/transform/keypoint_operators.py +0 -665
  1374. paddlex/ppdet/data/transform/mot_operators.py +0 -636
  1375. paddlex/ppdet/data/transform/op_helper.py +0 -468
  1376. paddlex/ppdet/data/transform/operators.py +0 -2103
  1377. paddlex/ppdet/engine/__init__.py +0 -29
  1378. paddlex/ppdet/engine/callbacks.py +0 -262
  1379. paddlex/ppdet/engine/env.py +0 -47
  1380. paddlex/ppdet/engine/export_utils.py +0 -118
  1381. paddlex/ppdet/engine/tracker.py +0 -425
  1382. paddlex/ppdet/engine/trainer.py +0 -535
  1383. paddlex/ppdet/metrics/__init__.py +0 -23
  1384. paddlex/ppdet/metrics/coco_utils.py +0 -184
  1385. paddlex/ppdet/metrics/json_results.py +0 -151
  1386. paddlex/ppdet/metrics/keypoint_metrics.py +0 -202
  1387. paddlex/ppdet/metrics/map_utils.py +0 -396
  1388. paddlex/ppdet/metrics/metrics.py +0 -300
  1389. paddlex/ppdet/metrics/mot_eval_utils.py +0 -192
  1390. paddlex/ppdet/metrics/mot_metrics.py +0 -184
  1391. paddlex/ppdet/metrics/widerface_utils.py +0 -393
  1392. paddlex/ppdet/model_zoo/__init__.py +0 -18
  1393. paddlex/ppdet/model_zoo/model_zoo.py +0 -86
  1394. paddlex/ppdet/model_zoo/tests/__init__.py +0 -13
  1395. paddlex/ppdet/model_zoo/tests/test_get_model.py +0 -48
  1396. paddlex/ppdet/model_zoo/tests/test_list_model.py +0 -68
  1397. paddlex/ppdet/modeling/__init__.py +0 -41
  1398. paddlex/ppdet/modeling/architectures/__init__.py +0 -40
  1399. paddlex/ppdet/modeling/architectures/cascade_rcnn.py +0 -144
  1400. paddlex/ppdet/modeling/architectures/centernet.py +0 -103
  1401. paddlex/ppdet/modeling/architectures/deepsort.py +0 -111
  1402. paddlex/ppdet/modeling/architectures/fairmot.py +0 -107
  1403. paddlex/ppdet/modeling/architectures/faster_rcnn.py +0 -106
  1404. paddlex/ppdet/modeling/architectures/fcos.py +0 -105
  1405. paddlex/ppdet/modeling/architectures/jde.py +0 -125
  1406. paddlex/ppdet/modeling/architectures/keypoint_hrhrnet.py +0 -286
  1407. paddlex/ppdet/modeling/architectures/keypoint_hrnet.py +0 -203
  1408. paddlex/ppdet/modeling/architectures/mask_rcnn.py +0 -135
  1409. paddlex/ppdet/modeling/architectures/meta_arch.py +0 -45
  1410. paddlex/ppdet/modeling/architectures/s2anet.py +0 -103
  1411. paddlex/ppdet/modeling/architectures/solov2.py +0 -110
  1412. paddlex/ppdet/modeling/architectures/ssd.py +0 -84
  1413. paddlex/ppdet/modeling/architectures/ttfnet.py +0 -98
  1414. paddlex/ppdet/modeling/architectures/yolo.py +0 -104
  1415. paddlex/ppdet/modeling/backbones/__init__.py +0 -37
  1416. paddlex/ppdet/modeling/backbones/blazenet.py +0 -322
  1417. paddlex/ppdet/modeling/backbones/darknet.py +0 -341
  1418. paddlex/ppdet/modeling/backbones/dla.py +0 -244
  1419. paddlex/ppdet/modeling/backbones/ghostnet.py +0 -476
  1420. paddlex/ppdet/modeling/backbones/hrnet.py +0 -724
  1421. paddlex/ppdet/modeling/backbones/mobilenet_v1.py +0 -410
  1422. paddlex/ppdet/modeling/backbones/mobilenet_v3.py +0 -497
  1423. paddlex/ppdet/modeling/backbones/name_adapter.py +0 -69
  1424. paddlex/ppdet/modeling/backbones/res2net.py +0 -358
  1425. paddlex/ppdet/modeling/backbones/resnet.py +0 -606
  1426. paddlex/ppdet/modeling/backbones/senet.py +0 -140
  1427. paddlex/ppdet/modeling/backbones/vgg.py +0 -216
  1428. paddlex/ppdet/modeling/bbox_utils.py +0 -464
  1429. paddlex/ppdet/modeling/heads/__init__.py +0 -41
  1430. paddlex/ppdet/modeling/heads/bbox_head.py +0 -379
  1431. paddlex/ppdet/modeling/heads/cascade_head.py +0 -285
  1432. paddlex/ppdet/modeling/heads/centernet_head.py +0 -194
  1433. paddlex/ppdet/modeling/heads/face_head.py +0 -113
  1434. paddlex/ppdet/modeling/heads/fcos_head.py +0 -270
  1435. paddlex/ppdet/modeling/heads/keypoint_hrhrnet_head.py +0 -108
  1436. paddlex/ppdet/modeling/heads/mask_head.py +0 -253
  1437. paddlex/ppdet/modeling/heads/roi_extractor.py +0 -111
  1438. paddlex/ppdet/modeling/heads/s2anet_head.py +0 -845
  1439. paddlex/ppdet/modeling/heads/solov2_head.py +0 -537
  1440. paddlex/ppdet/modeling/heads/ssd_head.py +0 -175
  1441. paddlex/ppdet/modeling/heads/ttf_head.py +0 -314
  1442. paddlex/ppdet/modeling/heads/yolo_head.py +0 -124
  1443. paddlex/ppdet/modeling/keypoint_utils.py +0 -302
  1444. paddlex/ppdet/modeling/layers.py +0 -1142
  1445. paddlex/ppdet/modeling/losses/__init__.py +0 -35
  1446. paddlex/ppdet/modeling/losses/ctfocal_loss.py +0 -67
  1447. paddlex/ppdet/modeling/losses/fairmot_loss.py +0 -41
  1448. paddlex/ppdet/modeling/losses/fcos_loss.py +0 -225
  1449. paddlex/ppdet/modeling/losses/iou_aware_loss.py +0 -48
  1450. paddlex/ppdet/modeling/losses/iou_loss.py +0 -210
  1451. paddlex/ppdet/modeling/losses/jde_loss.py +0 -182
  1452. paddlex/ppdet/modeling/losses/keypoint_loss.py +0 -228
  1453. paddlex/ppdet/modeling/losses/solov2_loss.py +0 -101
  1454. paddlex/ppdet/modeling/losses/ssd_loss.py +0 -163
  1455. paddlex/ppdet/modeling/losses/yolo_loss.py +0 -212
  1456. paddlex/ppdet/modeling/mot/__init__.py +0 -25
  1457. paddlex/ppdet/modeling/mot/matching/__init__.py +0 -19
  1458. paddlex/ppdet/modeling/mot/matching/deepsort_matching.py +0 -382
  1459. paddlex/ppdet/modeling/mot/matching/jde_matching.py +0 -145
  1460. paddlex/ppdet/modeling/mot/motion/__init__.py +0 -17
  1461. paddlex/ppdet/modeling/mot/motion/kalman_filter.py +0 -270
  1462. paddlex/ppdet/modeling/mot/tracker/__init__.py +0 -23
  1463. paddlex/ppdet/modeling/mot/tracker/base_jde_tracker.py +0 -267
  1464. paddlex/ppdet/modeling/mot/tracker/base_sde_tracker.py +0 -145
  1465. paddlex/ppdet/modeling/mot/tracker/deepsort_tracker.py +0 -165
  1466. paddlex/ppdet/modeling/mot/tracker/jde_tracker.py +0 -262
  1467. paddlex/ppdet/modeling/mot/utils.py +0 -181
  1468. paddlex/ppdet/modeling/mot/visualization.py +0 -130
  1469. paddlex/ppdet/modeling/necks/__init__.py +0 -25
  1470. paddlex/ppdet/modeling/necks/centernet_fpn.py +0 -185
  1471. paddlex/ppdet/modeling/necks/fpn.py +0 -233
  1472. paddlex/ppdet/modeling/necks/hrfpn.py +0 -131
  1473. paddlex/ppdet/modeling/necks/ttf_fpn.py +0 -243
  1474. paddlex/ppdet/modeling/necks/yolo_fpn.py +0 -1034
  1475. paddlex/ppdet/modeling/ops.py +0 -1599
  1476. paddlex/ppdet/modeling/post_process.py +0 -449
  1477. paddlex/ppdet/modeling/proposal_generator/__init__.py +0 -2
  1478. paddlex/ppdet/modeling/proposal_generator/anchor_generator.py +0 -135
  1479. paddlex/ppdet/modeling/proposal_generator/proposal_generator.py +0 -81
  1480. paddlex/ppdet/modeling/proposal_generator/rpn_head.py +0 -269
  1481. paddlex/ppdet/modeling/proposal_generator/target.py +0 -671
  1482. paddlex/ppdet/modeling/proposal_generator/target_layer.py +0 -476
  1483. paddlex/ppdet/modeling/reid/__init__.py +0 -23
  1484. paddlex/ppdet/modeling/reid/fairmot_embedding_head.py +0 -117
  1485. paddlex/ppdet/modeling/reid/jde_embedding_head.py +0 -189
  1486. paddlex/ppdet/modeling/reid/pyramidal_embedding.py +0 -151
  1487. paddlex/ppdet/modeling/reid/resnet.py +0 -320
  1488. paddlex/ppdet/modeling/shape_spec.py +0 -33
  1489. paddlex/ppdet/modeling/tests/__init__.py +0 -13
  1490. paddlex/ppdet/modeling/tests/test_architectures.py +0 -59
  1491. paddlex/ppdet/modeling/tests/test_base.py +0 -75
  1492. paddlex/ppdet/modeling/tests/test_ops.py +0 -839
  1493. paddlex/ppdet/modeling/tests/test_yolov3_loss.py +0 -420
  1494. paddlex/ppdet/optimizer.py +0 -285
  1495. paddlex/ppdet/slim/__init__.py +0 -62
  1496. paddlex/ppdet/slim/distill.py +0 -111
  1497. paddlex/ppdet/slim/prune.py +0 -85
  1498. paddlex/ppdet/slim/quant.py +0 -52
  1499. paddlex/ppdet/utils/__init__.py +0 -13
  1500. paddlex/ppdet/utils/check.py +0 -93
  1501. paddlex/ppdet/utils/checkpoint.py +0 -216
  1502. paddlex/ppdet/utils/cli.py +0 -151
  1503. paddlex/ppdet/utils/colormap.py +0 -56
  1504. paddlex/ppdet/utils/download.py +0 -477
  1505. paddlex/ppdet/utils/logger.py +0 -71
  1506. paddlex/ppdet/utils/stats.py +0 -95
  1507. paddlex/ppdet/utils/visualizer.py +0 -292
  1508. paddlex/ppdet/utils/voc_utils.py +0 -87
  1509. paddlex/seg.py +0 -38
  1510. paddlex/tools/__init__.py +0 -16
  1511. paddlex/tools/convert.py +0 -52
  1512. paddlex/tools/dataset_conversion/__init__.py +0 -24
  1513. paddlex/tools/dataset_conversion/x2coco.py +0 -379
  1514. paddlex/tools/dataset_conversion/x2imagenet.py +0 -82
  1515. paddlex/tools/dataset_conversion/x2seg.py +0 -343
  1516. paddlex/tools/dataset_conversion/x2voc.py +0 -230
  1517. paddlex/tools/dataset_split/__init__.py +0 -23
  1518. paddlex/tools/dataset_split/coco_split.py +0 -69
  1519. paddlex/tools/dataset_split/imagenet_split.py +0 -75
  1520. paddlex/tools/dataset_split/seg_split.py +0 -96
  1521. paddlex/tools/dataset_split/utils.py +0 -75
  1522. paddlex/tools/dataset_split/voc_split.py +0 -91
  1523. paddlex/tools/split.py +0 -41
  1524. paddlex/utils/checkpoint.py +0 -439
  1525. paddlex/utils/shm.py +0 -67
  1526. paddlex/utils/stats.py +0 -68
  1527. paddlex/utils/utils.py +0 -140
  1528. paddlex-2.0.0rc4.dist-info/LICENSE +0 -201
  1529. paddlex-2.0.0rc4.dist-info/METADATA +0 -29
  1530. paddlex-2.0.0rc4.dist-info/RECORD +0 -445
  1531. paddlex-2.0.0rc4.dist-info/WHEEL +0 -5
  1532. paddlex-2.0.0rc4.dist-info/entry_points.txt +0 -3
  1533. paddlex-2.0.0rc4.dist-info/top_level.txt +0 -2
@@ -0,0 +1,1606 @@
1
+ # Copyright (c) 2024 PaddlePaddle Authors. All Rights Reserved.
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+
15
+ import math
16
+ from functools import partial
17
+ from typing import List, Optional, Tuple, Union
18
+
19
+ import paddle
20
+ import paddle.distributed.fleet.meta_parallel as mpu
21
+ import paddle.nn as nn
22
+ import paddle.nn.functional as F
23
+ from paddle import Tensor
24
+ from paddle.distributed import fleet
25
+ from paddle.distributed.fleet.utils import sequence_parallel_utils
26
+
27
+ from .....utils import logging
28
+ from .....utils.env import get_device_type
29
+ from ...common.vlm import fusion_ops
30
+ from ...common.vlm.activations import ACT2FN
31
+ from ...common.vlm.transformers import PretrainedConfig, PretrainedModel
32
+ from ...common.vlm.transformers.model_outputs import (
33
+ BaseModelOutputWithPast,
34
+ CausalLMOutputWithPast,
35
+ )
36
+
37
# Optional Paddle features. Each import is attempted on a best-effort basis so
# that the module can still be imported on Paddle builds that lack the feature.
try:
    from paddle.incubate.nn.functional import fused_rotary_position_embedding
except ImportError:
    # Callers check for None before using the fused kernel.
    fused_rotary_position_embedding = None

try:
    from paddle.distributed.fleet.utils.sequence_parallel_utils import (
        GatherOp,
        ScatterOp,
        mark_as_sequence_parallel_parameter,
    )
except Exception:
    # Best effort: the names simply stay undefined when the helpers are
    # unavailable. `Exception` (rather than a bare `except`) keeps
    # KeyboardInterrupt/SystemExit propagating.
    pass

try:
    from paddle.nn.functional.flash_attention import flash_attention
except Exception:
    # Same reasoning as above; None marks the kernel as unavailable.
    flash_attention = None
55
+
56
+
57
# Module-level aliases for the linear layer classes referenced by the model
# definitions below: the plain dense layer, the tensor-parallel column/row
# variants from `paddle.distributed.fleet.meta_parallel`, and the
# sequence-parallel column/row variants from `sequence_parallel_utils`.
Linear = nn.Linear
ColumnParallelLinear = mpu.ColumnParallelLinear
RowParallelLinear = mpu.RowParallelLinear
ColumnSequenceParallelLinear = sequence_parallel_utils.ColumnSequenceParallelLinear
RowSequenceParallelLinear = sequence_parallel_utils.RowSequenceParallelLinear
62
+
63
+
64
class Qwen2Config(PretrainedConfig):
    r"""
    Configuration container for a [`Qwen2Model`].

    The arguments below define the model architecture. Every argument is stored
    as an attribute of the same name; the token ids and `tie_word_embeddings`
    are additionally forwarded to [`PretrainedConfig`], together with any extra
    keyword arguments.

    Args:
        vocab_size (`int`, *optional*, defaults to 151936):
            Vocabulary size of the Qwen2 model, i.e. the number of different tokens that can be
            represented by the `inputs_ids` passed when calling [`Qwen2Model`].
        hidden_size (`int`, *optional*, defaults to 4096):
            Dimension of the hidden representations.
        intermediate_size (`int`, *optional*, defaults to 22016):
            Dimension of the MLP representations.
        num_hidden_layers (`int`, *optional*, defaults to 32):
            Number of hidden layers in the Transformer encoder.
        num_attention_heads (`int`, *optional*, defaults to 32):
            Number of attention heads for each attention layer in the Transformer encoder.
        num_key_value_heads (`int`, *optional*, defaults to 32):
            Number of key/value heads used to implement Grouped Query Attention. If
            `num_key_value_heads=num_attention_heads`, the model uses Multi Head Attention (MHA); if
            `num_key_value_heads=1`, the model uses Multi Query Attention (MQA); otherwise GQA is used.
            When converting a multi-head checkpoint to a GQA checkpoint, each group key and value head
            should be constructed by mean-pooling all the original heads within that group. For more
            details see [this paper](https://arxiv.org/pdf/2305.13245.pdf). Passing `None` falls back
            to `num_attention_heads`.
        hidden_act (`str` or `function`, *optional*, defaults to `"silu"`):
            The non-linear activation function (function or string) in the decoder.
        max_position_embeddings (`int`, *optional*, defaults to 32768):
            The maximum sequence length that this model might ever be used with.
        seq_length (`int`, *optional*, defaults to 32768):
            Stored as `self.seq_length`; presumably the working sequence length, confirm against the
            code that consumes it.
        initializer_range (`float`, *optional*, defaults to 0.02):
            The standard deviation of the truncated_normal_initializer for initializing all weight matrices.
        rms_norm_eps (`float`, *optional*, defaults to 1e-06):
            The epsilon used by the rms normalization layers.
        use_cache (`bool`, *optional*, defaults to `True`):
            Whether or not the model should return the last key/values attentions (not used by all
            models). Only relevant if `config.is_decoder=True`.
        tie_word_embeddings (`bool`, *optional*, defaults to `False`):
            Whether the model's input and output word embeddings should be tied.
        rope_theta (`float`, *optional*, defaults to 10000.0):
            The base period of the RoPE embeddings.
        pad_token_id (`int`, *optional*, defaults to 0):
            Id of the padding token.
        bos_token_id (`int`, *optional*, defaults to 151643):
            Id of the beginning-of-sequence token.
        eos_token_id (`int`, *optional*, defaults to 151643):
            Id of the end-of-sequence token.
        use_sliding_window (`bool`, *optional*, defaults to `False`):
            Whether to use sliding window attention.
        sliding_window (`int`, *optional*, defaults to 4096):
            Sliding window attention (SWA) window size.
        max_window_layers (`int`, *optional*, defaults to 28):
            The number of layers that use SWA (Sliding Window Attention). The bottom layers use SWA
            while the top use full attention.
        attention_dropout (`float`, *optional*, defaults to 0.0):
            The dropout ratio for the attention probabilities.
        rope_scaling_factor (`float`, *optional*, defaults to 1.0):
            Stored as `self.rope_scaling_factor`; its consumer is not part of this class.
        rope_scaling_type (*optional*, defaults to `None`):
            Stored as `self.rope_scaling_type`; its consumer is not part of this class.
        dpo_config (*optional*, defaults to `None`):
            Stored as `self.dpo_config`; its consumer is not part of this class.
    """

    model_type = "qwen2"
    keys_to_ignore_at_inference = ["past_key_values"]

    def __init__(
        self,
        vocab_size=151936,
        hidden_size=4096,
        intermediate_size=22016,
        num_hidden_layers=32,
        num_attention_heads=32,
        num_key_value_heads=32,
        hidden_act="silu",
        max_position_embeddings=32768,
        seq_length=32768,
        initializer_range=0.02,
        rms_norm_eps=1e-6,
        use_cache=True,
        tie_word_embeddings=False,
        rope_theta=10000.0,
        pad_token_id=0,
        bos_token_id=151643,
        eos_token_id=151643,
        use_sliding_window=False,
        sliding_window=4096,
        max_window_layers=28,
        attention_dropout=0.0,
        rope_scaling_factor=1.0,
        rope_scaling_type=None,
        dpo_config=None,
        **kwargs,
    ):
        self.vocab_size = vocab_size
        self.max_position_embeddings = max_position_embeddings
        self.seq_length = seq_length
        self.hidden_size = hidden_size
        self.intermediate_size = intermediate_size
        self.num_hidden_layers = num_hidden_layers
        self.num_attention_heads = num_attention_heads
        self.use_sliding_window = use_sliding_window
        self.sliding_window = sliding_window
        self.max_window_layers = max_window_layers

        # for backward compatibility
        if num_key_value_heads is None:
            num_key_value_heads = num_attention_heads

        self.num_key_value_heads = num_key_value_heads
        self.hidden_act = hidden_act
        self.initializer_range = initializer_range
        self.rms_norm_eps = rms_norm_eps
        self.use_cache = use_cache
        self.rope_theta = rope_theta
        self.attention_dropout = attention_dropout

        self.rope_scaling_factor = rope_scaling_factor
        self.rope_scaling_type = rope_scaling_type

        self.pad_token_id = pad_token_id
        self.bos_token_id = bos_token_id
        self.eos_token_id = eos_token_id
        self.dpo_config = dpo_config

        super().__init__(
            pad_token_id=pad_token_id,
            bos_token_id=bos_token_id,
            eos_token_id=eos_token_id,
            tie_word_embeddings=tie_word_embeddings,
            **kwargs,
        )
189
+
190
+
191
def get_triangle_upper_mask(x, mask=None):
    """
    Return `mask` unchanged when it is given; otherwise build an additive
    upper-triangular mask shaped like `x` with its second axis collapsed to 1.

    Entries strictly above the main diagonal hold the most negative finite
    value of `x.dtype`; all other entries are zero. The generated mask is
    excluded from gradient computation.
    """
    if mask is None:
        # [bsz, n_head, q_len, kv_seq_len] -> [bsz, 1, q_len, kv_seq_len]
        mask_shape = x.shape
        mask_shape[1] = 1
        lowest = paddle.finfo(x.dtype).min
        mask = paddle.triu(
            paddle.full(mask_shape, lowest, dtype=x.dtype), diagonal=1
        )
        mask.stop_gradient = True
    return mask
202
+
203
+
204
def parallel_matmul(
    x: Tensor, y: Tensor, transpose_y=True, tensor_parallel_output=True
):
    """
    Multiply `x` by `y`, using the model-parallel path when `y` is sharded.

    Args:
        x: Left operand.
        y: Right operand, transposed before the product when `transpose_y` is True.
        transpose_y: Forwarded to `paddle.matmul`.
        tensor_parallel_output: On the model-parallel path, return the local
            result as-is when True; otherwise concatenate the results across
            the model-parallel group.

    Returns:
        The matmul result.
    """
    is_fleet_init = True
    tensor_parallel_degree = 1
    model_parallel_group = None
    try:
        hcg = fleet.get_hybrid_communicate_group()
        model_parallel_group = hcg.get_model_parallel_group()
        tensor_parallel_degree = hcg.get_model_parallel_world_size()
    except Exception:
        # If not running under distributed.launch, fleet raises
        # AttributeError: 'Fleet' object has no attribute '_hcg'.
        # `Exception` (not a bare `except`) lets KeyboardInterrupt and
        # SystemExit propagate.
        is_fleet_init = False

    if paddle.in_dynamic_mode():
        y_is_distributed = y.is_distributed
    else:
        y_is_distributed = tensor_parallel_degree > 1

    if is_fleet_init and tensor_parallel_degree > 1 and y_is_distributed:
        input_parallel = paddle.distributed.collective._c_identity(
            x, group=model_parallel_group
        )
        logits = paddle.matmul(input_parallel, y, transpose_y=transpose_y)

        if tensor_parallel_output:
            return logits

        return paddle.distributed.collective._c_concat(
            logits, group=model_parallel_group
        )

    return paddle.matmul(x, y, transpose_y=transpose_y)
238
+
239
+
240
def scaled_dot_product_attention(
    query_states,
    config,
    key_states,
    value_states,
    attention_mask,
    output_attentions,
    attn_mask_startend_row_indices=None,
    training=True,
    sequence_parallel=False,
    skip_recompute=False,
):
    """
    Plain (non-fused) scaled dot-product attention.

    `query_states` is unpacked as [bsz, q_len, num_heads, head_dim] and
    `value_states` as [_, kv_seq_len, _, _]. When `attention_mask` is None an
    upper-triangular mask is generated. Dropout uses `config.attention_dropout`.
    `attn_mask_startend_row_indices` and `skip_recompute` are accepted but not
    read by this function.

    Returns:
        The attention output, reshaped to [bsz * q_len, num_heads * head_dim]
        when `sequence_parallel` is set and to [bsz, q_len, num_heads * head_dim]
        otherwise; a tuple `(attn_output, attn_weights)` when `output_attentions`
        is truthy.

    Raises:
        ValueError: If the attention weights or the mask do not have the
            expected shape.
    """
    bsz, q_len, num_heads, head_dim = query_states.shape
    _, kv_seq_len, _, _ = value_states.shape

    # [bs, seq_len, nhead, head_dim] -> [bs, nhead, seq_len, head_dim]
    heads_first = [0, 2, 1, 3]
    query_states = paddle.transpose(query_states, heads_first)
    key_states = paddle.transpose(key_states, heads_first)
    value_states = paddle.transpose(value_states, heads_first)

    # Extra pre-division avoids nan under float16; it is undone before softmax.
    needs_fp16_guard = (
        paddle.in_dynamic_mode() and query_states.dtype == paddle.float16
    )
    pre_divided_factor = 32 if needs_fp16_guard else 1

    scaled_query = query_states / (math.sqrt(head_dim) * pre_divided_factor)
    attn_weights = paddle.matmul(scaled_query, key_states.transpose([0, 1, 3, 2]))

    if attn_weights.shape != [bsz, num_heads, q_len, kv_seq_len]:
        raise ValueError(
            f"Attention weights should be of shape {(bsz, num_heads, q_len, kv_seq_len)}, but is"
            f" {attn_weights.shape}"
        )

    if attention_mask is None:
        attention_mask = get_triangle_upper_mask(attn_weights)

    attention_mask = attention_mask.reshape([bsz, 1, q_len, kv_seq_len])
    if attention_mask.shape != [bsz, 1, q_len, kv_seq_len]:
        raise ValueError(
            f"Attention mask should be of shape {(bsz, 1, q_len, kv_seq_len)}, but is {attention_mask.shape}"
        )

    attn_weights = attn_weights + attention_mask

    # Softmax is evaluated in float32 and cast back to the query dtype.
    if paddle.in_dynamic_mode():
        with paddle.amp.auto_cast(False):
            attn_weights = F.softmax(
                attn_weights.astype("float32") * pre_divided_factor,
                axis=-1,
                dtype="float32",
            ).astype(query_states.dtype)
    else:
        attn_weights = F.softmax(
            attn_weights * pre_divided_factor, axis=-1, dtype="float32"
        ).astype(query_states.dtype)

    attn_weights = F.dropout(
        attn_weights, p=config.attention_dropout, training=training
    )

    attn_output = paddle.matmul(attn_weights, value_states)
    attn_output = attn_output.transpose([0, 2, 1, 3])

    if sequence_parallel:
        output_shape = [bsz * q_len, head_dim * num_heads]
    else:
        output_shape = [bsz, q_len, head_dim * num_heads]
    attn_output = attn_output.reshape(output_shape)

    if output_attentions:
        return (attn_output, attn_weights)
    return attn_output
313
+
314
+
315
def is_casual_mask(attention_mask):
    """
    Report whether `attention_mask` equals its own upper-triangular part,
    which this module treats as the mask being causal.
    """
    upper_part = paddle.triu(attention_mask)
    matches = upper_part == attention_mask
    return matches.all().item()
320
+
321
+
322
def _make_causal_mask(input_ids_shape, past_key_values_length):
    """
    Build the boolean causal mask used for self-attention.

    `input_ids_shape` is unpacked as (batch_size, target_length). The result
    has shape [batch_size, 1, target_length, target_length + past_key_values_length];
    every past position is marked True, and the current positions follow a
    lower-triangular pattern.
    """
    batch_size, target_length = input_ids_shape  # target_length: seq_len

    causal = paddle.tril(paddle.ones((target_length, target_length), dtype="bool"))

    if past_key_values_length > 0:
        # Prepend the past columns: [tgt_len, tgt_len + past_len]
        past_columns = paddle.ones(
            [target_length, past_key_values_length], dtype="bool"
        )
        causal = paddle.concat([past_columns, causal], axis=-1)

    # [bs, 1, tgt_len, tgt_len + past_len]
    full_shape = [
        batch_size,
        1,
        target_length,
        target_length + past_key_values_length,
    ]
    return causal[None, None, :, :].expand(full_shape)
341
+
342
+
343
def _expand_2d_mask(mask, dtype, tgt_length):
    """
    Broadcast an attention mask from `[batch_size, src_length]` to a boolean
    mask of shape `[batch_size, 1, tgt_length, src_length]`.

    `tgt_length` falls back to `src_length` when it is None. `dtype` is
    accepted but not read by this function.
    """
    batch_size = mask.shape[0]
    src_length = mask.shape[-1]
    if tgt_length is None:
        tgt_length = src_length

    bool_mask = mask[:, None, None, :].astype("bool")
    bool_mask.stop_gradient = True
    return bool_mask.expand([batch_size, 1, tgt_length, src_length])
355
+
356
+
357
class Qwen2RMSNorm(nn.Layer):
    """RMS normalization with a learnable scale (equivalent to T5LayerNorm)."""

    def __init__(self, config: Qwen2Config):
        """
        Create the scale parameter (initialized to 1.0) of size
        `config.hidden_size` and read the epsilon from `config.rms_norm_eps`.
        When `config.sequence_parallel` is set, the weight is marked as a
        sequence-parallel parameter.
        """
        super().__init__()
        self.config = config
        self.hidden_size = config.hidden_size
        self.variance_epsilon = config.rms_norm_eps
        self.weight = paddle.create_parameter(
            shape=[self.hidden_size],
            dtype=paddle.get_default_dtype(),
            default_initializer=nn.initializer.Constant(1.0),
        )

        if config.sequence_parallel:
            mark_as_sequence_parallel_parameter(self.weight)

    def forward(self, hidden_states):
        """
        Normalize `hidden_states` over the last axis and scale by the weight.

        Uses the fused kernel when `config.use_fused_rms_norm` is set;
        otherwise the variance is computed in float32, with autocast disabled
        in dynamic mode.
        """
        if self.config.use_fused_rms_norm:
            return fusion_ops.fusion_rms_norm(
                hidden_states, self.weight, self.variance_epsilon, False
            )

        def _rms_normalize(states):
            # Mean of squares over the last axis, accumulated in float32.
            variance = states.astype("float32").pow(2).mean(-1, keepdim=True)
            return paddle.rsqrt(variance + self.variance_epsilon) * states

        if paddle.in_dynamic_mode():
            with paddle.amp.auto_cast(False):
                hidden_states = _rms_normalize(hidden_states)
        else:
            hidden_states = _rms_normalize(hidden_states)

        # Bring the result back to the weight's half-precision dtype if needed.
        if self.weight.dtype in [paddle.float16, paddle.bfloat16]:
            hidden_states = paddle.cast(hidden_states, self.weight.dtype)
        return hidden_states * self.weight
396
+
397
+
398
class Qwen2RotaryEmbedding(nn.Layer):
    """Cache of rotary position embedding cos/sin tables."""

    def __init__(self, dim, max_position_embeddings=2048, base=10000):
        """
        Args:
            dim: Rotary dimension; the inverse-frequency vector has `dim / 2` entries.
            max_position_embeddings: Number of positions cached up front.
            base: Base of the geometric frequency progression.
        """
        super().__init__()
        self.dim = dim
        self.max_position_embeddings = max_position_embeddings
        self.base = base
        # [dim / 2]
        self.inv_freq = 1.0 / (
            self.base
            ** (paddle.cast(paddle.arange(0, self.dim, 2), dtype="float32") / self.dim)
        )
        self._set_cos_sin_cache(seq_len=max_position_embeddings)

    def _set_cos_sin_cache(self, seq_len):
        """Rebuild the cos/sin tables so they cover `seq_len` positions."""
        self.max_seq_len_cached = seq_len
        # [seq_len]
        t = paddle.arange(seq_len, dtype="float32")
        # [seq_len, dim/2]
        freqs = paddle.einsum("i,j->ij", t, self.inv_freq)
        # Different from paper, but it uses a different permutation in order to obtain the same calculation
        # [seq_len, dim]
        emb = paddle.concat([freqs, freqs], axis=-1)
        # [1, seqlen, 1, dim]
        self.cos_cached = emb.cos()[None, :, None, :]
        self.sin_cached = emb.sin()[None, :, None, :]

    def forward(self, x, seq_len=None):
        """
        Return the `(cos, sin)` tables for the first `seq_len` positions.

        Args:
            x: Tensor whose dtype the returned tables are cast to; only
                `x.dtype` is read here.
            seq_len: Number of positions required. The cache is grown when
                this exceeds the cached length. When None, the whole cache is
                returned.

        Returns:
            Tuple `(cos, sin)`, each sliced from a `[1, seq_len, 1, dim]` table.
        """
        # Guard against the default None: comparing None with an int raises
        # TypeError, whereas slicing with `:None` simply yields the full cache.
        if seq_len is not None and seq_len > self.max_seq_len_cached:
            self._set_cos_sin_cache(seq_len)
        cos = self.cos_cached[:, :seq_len, :, :]
        sin = self.sin_cached[:, :seq_len, :, :]
        return (
            cos.cast(x.dtype) if cos.dtype != x.dtype else cos,
            sin.cast(x.dtype) if sin.dtype != x.dtype else sin,
        )
434
+
435
+
436
def rotate_half(x):
    """
    Split the last axis of `x` into two halves and return them swapped, with
    the second half negated: `[-x2, x1]`. The result has the same shape as `x`.
    """
    midpoint = x.shape[-1] // 2
    front = x[..., :midpoint]
    back = x[..., midpoint:]
    return paddle.concat([-back, front], axis=-1)
441
+
442
+
443
def apply_rotary_pos_emb(q, k, cos, sin, position_ids):
    """
    Apply rotary position embedding to the query and key tensors.

    With `position_ids`, the singleton axes 0 and 2 of the cos/sin tables are
    squeezed out, rows are gathered by position, and a head axis is re-added.
    Without them, the tables are truncated to `q.shape[1]` positions.

    Returns:
        Tuple `(q_embed, k_embed)`.
    """
    if position_ids is not None:
        # [seq_len, dim] -> gather -> [bs, seq_len, 1, dim]
        cos = cos.squeeze(axis=[0, 2])[position_ids].unsqueeze(2)
        sin = sin.squeeze(axis=[0, 2])[position_ids].unsqueeze(2)
    else:
        # Note: Only for Qwen2MoEForCausalLMPipe model pretraining
        query_len = q.shape[1]
        cos = cos[:, :query_len, :, :]  # [bs, seq_len, 1, dim]
        sin = sin[:, :query_len, :, :]  # [bs, seq_len, 1, dim]

    def _rotate(states):
        return (states * cos) + (rotate_half(states) * sin)

    return _rotate(q), _rotate(k)
456
+
457
+
458
class Qwen2MLP(nn.Layer):
    """Gated feed-forward block: `down_proj(act(gate) * up)`."""

    def __init__(self, config: Qwen2Config, is_shared=False, skip_recompute_ops=None):
        """
        Args:
            config: Supplies `hidden_size`, `intermediate_size`, `hidden_act`,
                `fuse_attention_ffn`, `tensor_parallel_degree` and
                `sequence_parallel`.
            is_shared: Accepted but not read by this class.
            skip_recompute_ops: Stored on the instance; defaults to an empty dict.
        """
        super().__init__()
        if skip_recompute_ops is None:
            skip_recompute_ops = {}
        self.skip_recompute_ops = skip_recompute_ops
        self.hidden_size = config.hidden_size
        self.intermediate_size = config.intermediate_size
        self.fuse_attention_ffn = config.fuse_attention_ffn

        self.tensor_parallel_degree = config.tensor_parallel_degree

        # Select the parallel linear classes under distinct local names.
        # Rebinding `ColumnParallelLinear`/`RowParallelLinear` in only one
        # branch would make them function-local and raise UnboundLocalError
        # whenever sequence parallelism is disabled.
        if config.sequence_parallel:
            column_linear_cls = ColumnSequenceParallelLinear
            row_linear_cls = RowSequenceParallelLinear
        else:
            column_linear_cls = ColumnParallelLinear
            row_linear_cls = RowParallelLinear

        if config.tensor_parallel_degree > 1:
            if self.fuse_attention_ffn:
                # Gate and up projections share one doubled-width weight.
                self.gate_up_fused_proj = column_linear_cls(
                    self.hidden_size,
                    self.intermediate_size * 2,
                    gather_output=False,
                    has_bias=False,
                )
            else:
                self.gate_proj = column_linear_cls(
                    self.hidden_size,
                    self.intermediate_size,
                    gather_output=False,
                    has_bias=False,
                )
                self.up_proj = column_linear_cls(
                    self.hidden_size,
                    self.intermediate_size,
                    gather_output=False,
                    has_bias=False,
                )
            self.down_proj = row_linear_cls(
                self.intermediate_size,
                self.hidden_size,
                input_is_parallel=True,
                has_bias=False,
            )
        else:
            if self.fuse_attention_ffn:
                self.gate_up_fused_proj = Linear(
                    self.hidden_size, self.intermediate_size * 2, bias_attr=False
                )
            else:
                self.gate_proj = Linear(
                    self.hidden_size, self.intermediate_size, bias_attr=False
                )  # w1
                self.up_proj = Linear(
                    self.hidden_size, self.intermediate_size, bias_attr=False
                )  # w3
            self.down_proj = Linear(
                self.intermediate_size, self.hidden_size, bias_attr=False
            )  # w2

        if config.hidden_act == "silu":
            self.act_fn = fusion_ops.swiglu
            self.fuse_swiglu = True
        else:
            self.act_fn = ACT2FN[config.hidden_act]
            self.fuse_swiglu = False

    def forward(self, x):
        """Run the gated MLP on `x` and return the down-projected result."""
        if self.fuse_attention_ffn:
            x = self.gate_up_fused_proj(x)
            if self.fuse_swiglu:
                # The fused projection output is handed to swiglu whole.
                y = None
            else:
                x, y = x.chunk(2, axis=-1)
        else:
            x, y = self.gate_proj(x), self.up_proj(x)

        if self.fuse_swiglu:
            x = self.act_fn(x, y)
        else:
            x = self.act_fn(x) * y

        return self.down_proj(x)
540
+
541
+
542
def repeat_kv(hidden_states: paddle.Tensor, n_rep: int) -> paddle.Tensor:
    """
    Repeat every key/value head `n_rep` times along the head axis.

    The input is unpacked as (batch, seqlen, num_key_value_heads, head_dim)
    and the result has shape (batch, seqlen, num_key_value_heads * n_rep,
    head_dim). The input is returned unchanged when `n_rep` is 1.
    """
    bsz, seq_len, kv_heads, dim = hidden_states.shape
    if n_rep != 1:
        # Insert a repeat axis after the head axis, tile it, then fold it in.
        tiled = hidden_states.unsqueeze(-2).tile([1, 1, 1, n_rep, 1])
        hidden_states = tiled.reshape([bsz, seq_len, kv_heads * n_rep, dim])
    return hidden_states
553
+
554
+
555
class Qwen2Attention(nn.Layer):
    """
    Multi-head self-attention for Qwen2 with grouped-query key/value heads and
    rotary position embeddings.

    Queries use ``config.num_attention_heads`` heads while keys and values use
    ``config.num_key_value_heads`` heads; every key/value head is shared by
    ``num_key_value_groups`` query heads (see ``repeat_kv``).
    """

    def __init__(
        self,
        config: Qwen2Config,
        layerwise_recompute: bool = True,
        skip_recompute_ops=None,
    ):
        """
        Args:
            config: model configuration; read for head counts, parallelism
                degrees, rope settings and the fused-QKV switch.
            layerwise_recompute: stored on the layer; recompute only happens
                when ``enable_recompute`` is also set (by the trainer).
            skip_recompute_ops: optional mapping stored on the layer; defaults
                to a fresh empty dict.
        """
        super().__init__()
        if skip_recompute_ops is None:
            skip_recompute_ops = {}
        self.config = config
        self.skip_recompute_ops = skip_recompute_ops
        self.hidden_size = config.hidden_size
        self.num_heads = config.num_attention_heads

        self.head_dim = self.hidden_size // config.num_attention_heads

        self.num_key_value_heads = config.num_key_value_heads
        # Grouped-query attention needs an integral number of query heads per
        # key/value head. The previous `//` check only rejected the case
        # num_attention_heads < num_key_value_heads.
        assert (
            config.num_attention_heads % config.num_key_value_heads == 0
        ), f"num_attention_heads: {config.num_attention_heads}, num_key_value_heads: {config.num_key_value_heads}"
        self.num_key_value_groups = (
            config.num_attention_heads // config.num_key_value_heads
        )
        self.gqa_or_mqa = config.num_attention_heads != config.num_key_value_heads
        self.max_position_embeddings = config.max_position_embeddings
        self.rope_theta = config.rope_theta
        self.is_causal = True
        self.attention_dropout = config.attention_dropout

        self.seq_length = config.seq_length
        self.sequence_parallel = config.sequence_parallel

        self.fuse_attention_qkv = config.fuse_attention_qkv

        # Note that we will actually perform a recompute only if both enable_recompute and layerwise_recompute are set to True
        # Enable_recompute defaults to False and is controlled by Trainer
        self.enable_recompute = False
        self.layerwise_recompute = layerwise_recompute
        self.recompute_granularity = config.recompute_granularity
        if config.tensor_parallel_degree > 1:
            # From here on the head counts are per tensor-parallel rank.
            assert (
                self.num_heads % config.tensor_parallel_degree == 0
            ), f"num_heads: {self.num_heads}, tensor_parallel_degree: {config.tensor_parallel_degree}"
            self.num_heads = self.num_heads // config.tensor_parallel_degree

            assert (
                self.num_key_value_heads % config.tensor_parallel_degree == 0
            ), f"num_key_value_heads: {self.num_key_value_heads}, tensor_parallel_degree: {config.tensor_parallel_degree}"
            self.num_key_value_heads = (
                self.num_key_value_heads // config.tensor_parallel_degree
            )

        self.use_fused_rope = config.use_fused_rope
        if self.use_fused_rope:
            if (
                get_device_type() not in ["gpu", "xpu"]
                or fused_rotary_position_embedding is None
            ):
                logging.warning(
                    "Enable fuse rope in the config, but fuse rope is not available. "
                    "Will disable fuse rope. Try using latest gpu version of Paddle."
                )
                self.use_fused_rope = False

        if config.tensor_parallel_degree > 1:
            # Choose the parallel linear classes for BOTH settings. Binding
            # them only when sequence_parallel is on left the names unbound
            # (UnboundLocalError) for plain tensor parallelism.
            if config.sequence_parallel:
                column_linear_cls = ColumnSequenceParallelLinear
                row_linear_cls = RowSequenceParallelLinear
            else:
                column_linear_cls = mpu.ColumnParallelLinear
                row_linear_cls = mpu.RowParallelLinear

            # Output sizes use the *global* key/value head count
            # (self.config.num_key_value_heads), not the per-rank one.
            kv_out_features = self.config.num_key_value_heads * self.head_dim
            if self.fuse_attention_qkv:
                self.qkv_proj = column_linear_cls(
                    self.hidden_size,
                    self.hidden_size + 2 * kv_out_features,
                    has_bias=True,
                    gather_output=False,
                )
            else:
                self.q_proj = column_linear_cls(
                    self.hidden_size,
                    self.hidden_size,
                    has_bias=True,
                    gather_output=False,
                )
                self.k_proj = column_linear_cls(
                    self.hidden_size,
                    kv_out_features,
                    has_bias=True,
                    gather_output=False,
                )
                self.v_proj = column_linear_cls(
                    self.hidden_size,
                    kv_out_features,
                    has_bias=True,
                    gather_output=False,
                )
            self.o_proj = row_linear_cls(
                self.hidden_size,
                self.hidden_size,
                has_bias=False,
                input_is_parallel=True,
            )
        else:
            if self.fuse_attention_qkv:
                self.qkv_proj = Linear(
                    self.hidden_size,
                    self.hidden_size
                    + 2 * self.config.num_key_value_heads * self.head_dim,
                )
            else:
                self.q_proj = Linear(self.hidden_size, self.hidden_size, bias_attr=True)
                self.k_proj = Linear(
                    self.hidden_size,
                    self.config.num_key_value_heads * self.head_dim,
                    bias_attr=True,
                )
                self.v_proj = Linear(
                    self.hidden_size,
                    self.config.num_key_value_heads * self.head_dim,
                    bias_attr=True,
                )
            self.o_proj = Linear(self.hidden_size, self.hidden_size, bias_attr=False)

        self.rotary_emb = Qwen2RotaryEmbedding(
            self.head_dim,
            max_position_embeddings=self.max_position_embeddings,
            base=self.rope_theta,
        )

        self.attn_func = scaled_dot_product_attention

    def forward(
        self,
        hidden_states,
        position_ids: Optional[Tuple[paddle.Tensor]] = None,
        past_key_value: Optional[Tuple[paddle.Tensor]] = None,
        attention_mask: Optional[paddle.Tensor] = None,
        output_attentions: bool = False,
        use_cache: bool = False,
        attn_mask_startend_row_indices: Optional[paddle.Tensor] = None,
        **kwargs,
    ) -> Tuple[paddle.Tensor, Optional[paddle.Tensor], Optional[Tuple[paddle.Tensor]]]:
        """
        Project to Q/K/V, apply rotary embeddings, extend the KV cache and run
        attention followed by the output projection.

        Input shape: Batch x Time x Channel.

        Returns:
            The attention output alone when neither ``output_attentions`` nor
            ``use_cache`` is set; otherwise a tuple
            ``(attn_output[, attn_weights][, (key_states, value_states)])``.
        """
        # [bs, seq_len, num_head * head_dim] -> [seq_len / n, bs, num_head * head_dim] (n is model parallelism)

        if self.fuse_attention_qkv:
            mix_layer = self.qkv_proj(hidden_states)
            # Per key/value head the fused projection holds that head's group
            # of query slices followed by one key and one value slice.
            fused_width = (self.num_key_value_groups + 2) * self.head_dim
            if self.sequence_parallel:
                target_shape = [
                    -1,
                    self.seq_length,
                    self.num_key_value_heads,
                    fused_width,
                ]
            else:
                # 0 keeps the corresponding input dimension.
                target_shape = [0, 0, self.num_key_value_heads, fused_width]
            mix_layer = paddle.reshape_(mix_layer, target_shape)
            query_states, key_states, value_states = paddle.split(
                mix_layer,
                num_or_sections=[
                    self.num_key_value_groups * self.head_dim,
                    self.head_dim,
                    self.head_dim,
                ],
                axis=-1,
            )
            if self.gqa_or_mqa:
                query_states = paddle.reshape_(
                    query_states, [0, 0, self.num_heads, self.head_dim]
                )
        else:
            query_states = self.q_proj(hidden_states)
            key_states = self.k_proj(hidden_states)
            value_states = self.v_proj(hidden_states)

            if self.sequence_parallel:
                target_query_shape = [
                    -1,
                    self.seq_length,
                    self.num_heads,
                    self.head_dim,
                ]
                target_key_value_shape = [
                    -1,
                    self.seq_length,
                    self.num_key_value_heads,
                    self.head_dim,
                ]
            else:
                target_query_shape = [0, 0, self.num_heads, self.head_dim]
                target_key_value_shape = [0, 0, self.num_key_value_heads, self.head_dim]
            query_states = query_states.reshape(shape=target_query_shape)
            key_states = key_states.reshape(shape=target_key_value_shape)
            value_states = value_states.reshape(shape=target_key_value_shape)

        # Rotary tables must cover the cached positions plus the new ones.
        kv_seq_len = key_states.shape[-3]
        if past_key_value is not None:
            kv_seq_len += past_key_value[0].shape[-3]
        if self.use_fused_rope:
            assert past_key_value is None, "fuse rotary not support cache kv for now"
            cos, sin = self.rotary_emb(value_states, seq_len=kv_seq_len)
            query_states, key_states, _ = fused_rotary_position_embedding(
                query_states,
                key_states,
                v=None,
                sin=sin,
                cos=cos,
                position_ids=position_ids,
                use_neox_rotary_style=False,
            )
        else:
            cos, sin = self.rotary_emb(value_states, seq_len=kv_seq_len)
            query_states, key_states = apply_rotary_pos_emb(
                query_states, key_states, cos, sin, position_ids
            )

        # [bs, seq_len, num_head, head_dim]
        if past_key_value is not None:
            key_states = paddle.concat([past_key_value[0], key_states], axis=1)
            value_states = paddle.concat([past_key_value[1], value_states], axis=1)
        past_key_value = (key_states, value_states) if use_cache else None

        # TODO(wj-Mcat): use broadcast strategy when n_kv_heads = 1
        # repeat k/v heads if n_kv_heads < n_heads
        # A parsed version of 0.0 is excluded from the "old Paddle" test, so it
        # is treated like a recent release.
        paddle_version = float(paddle.__version__[:3])
        if not self.config.use_flash_attention or (
            (paddle_version != 0.0) and (paddle_version <= 2.6)
        ):
            key_states = repeat_kv(key_states, self.num_key_value_groups)
            value_states = repeat_kv(value_states, self.num_key_value_groups)

        outputs = self.attn_func(
            query_states,
            self.config,
            key_states,
            value_states,
            attention_mask,
            output_attentions,
            attn_mask_startend_row_indices=attn_mask_startend_row_indices,
            training=self.training,
            sequence_parallel=self.sequence_parallel,
        )
        if output_attentions:
            attn_output, attn_weights = outputs
        else:
            attn_output = outputs
            attn_weights = None

        # if sequence_parallel is true, out shape are [q_len / n, bs, num_head * head_dim]
        # else their shape are [bs, q_len, num_head * head_dim], n is mp parallelism.
        attn_output = self.o_proj(attn_output)

        outputs = (attn_output,)

        if output_attentions:
            outputs += (attn_weights,)

        if use_cache:
            outputs += (past_key_value,)

        # Callers expect a bare tensor when nothing else was requested.
        if type(outputs) is tuple and len(outputs) == 1:
            outputs = outputs[0]

        return outputs
820
+
821
+
822
class Qwen2DecoderLayer(nn.Layer):
    """One Qwen2 decoder block: normalised self-attention and normalised MLP,
    each wrapped in a residual connection."""

    def __init__(
        self,
        config: Qwen2Config,
        layerwise_recompute: bool = False,
        skip_recompute_ops=None,
    ):
        """Build the attention, MLP and the two RMSNorm sub-layers from `config`."""
        super().__init__()
        recompute_skips = {} if skip_recompute_ops is None else skip_recompute_ops
        self.config = config
        self.skip_recompute_ops = recompute_skips
        self.hidden_size = config.hidden_size
        self.self_attn = Qwen2Attention(
            config, layerwise_recompute, skip_recompute_ops=recompute_skips
        )

        self.mlp = Qwen2MLP(config, skip_recompute_ops=recompute_skips)
        self.input_layernorm = Qwen2RMSNorm(config)
        self.post_attention_layernorm = Qwen2RMSNorm(config)

        # Recompute only runs when enable_recompute (off by default, switched
        # by the trainer) and layerwise_recompute are both true.
        self.enable_recompute = False
        self.layerwise_recompute = layerwise_recompute
        self.recompute_granularity = config.recompute_granularity

    def forward(
        self,
        hidden_states: paddle.Tensor,
        position_ids: Optional[paddle.Tensor] = None,
        attention_mask: Optional[paddle.Tensor] = None,
        output_attentions: Optional[bool] = False,
        past_key_value: Optional[Tuple[paddle.Tensor]] = None,
        use_cache: Optional[bool] = False,
        attn_mask_startend_row_indices: Optional[paddle.Tensor] = None,
        **kwargs,
    ) -> Tuple[paddle.Tensor, Optional[Tuple[paddle.Tensor, paddle.Tensor]]]:
        """
        Run the block on `hidden_states`.

        Args:
            hidden_states (`paddle.Tensor`): layer input.
            position_ids (`paddle.Tensor`, *optional*): forwarded to self-attention.
            attention_mask (`paddle.Tensor`, *optional*): forwarded to self-attention.
            output_attentions (`bool`, *optional*): also return the attention weights.
            past_key_value (`Tuple(paddle.Tensor)`, *optional*): cached key/value states.
            use_cache (`bool`, *optional*): also return the updated key/value states.
            attn_mask_startend_row_indices (`paddle.Tensor`, *optional*): forwarded to self-attention.

        Returns:
            The new hidden states alone, or a tuple
            `(hidden_states[, attn_weights][, present_key_value])` when extras
            were requested.
        """
        # --- self-attention sub-block ---
        attn_input = self.input_layernorm(hidden_states)
        attn_result = self.self_attn(
            attn_input,
            position_ids,
            past_key_value,
            attention_mask,
            output_attentions,
            use_cache,
            attn_mask_startend_row_indices=attn_mask_startend_row_indices,
        )

        # The attention layer returns a bare tensor when no extras were asked for.
        attn_hidden = attn_result[0] if type(attn_result) is tuple else attn_result

        if output_attentions:
            self_attn_weights = attn_result[1]

        if use_cache:
            cache_slot = 2 if output_attentions else 1
            present_key_value = attn_result[cache_slot]

        after_attention = hidden_states + attn_hidden

        # --- feed-forward sub-block ---
        mlp_hidden = self.mlp(self.post_attention_layernorm(after_attention))
        block_output = after_attention + mlp_hidden

        collected = [block_output]
        if output_attentions:
            collected.append(self_attn_weights)
        if use_cache:
            collected.append(present_key_value)

        if len(collected) == 1:
            return collected[0]
        return tuple(collected)
922
+
923
+
924
class Qwen2PretrainedModel(PretrainedModel):
    """Base class binding `Qwen2Config` and checkpoint-loading metadata to the Qwen2 models."""

    config_class = Qwen2Config
    base_model_prefix = "qwen2"
    _keys_to_ignore_on_load_unexpected = [r"self_attn.rotary_emb.inv_freq"]

    @classmethod
    def _get_fuse_or_split_param_mappings(cls, config: Qwen2Config, is_fuse=False):
        """
        Build the per-layer parameter fuse/split actions.

        Returns a dict whose keys are tuples of parameter names (the last name
        is the fused parameter, the preceding ones are its parts) and whose
        values are the callables that perform the fuse or split.
        """
        # return parameter fuse utils
        from ...common.vlm.conversion_utils import split_or_fuse_func

        fn = split_or_fuse_func(is_fuse=is_fuse)

        # Templates written for layer 0; last key is fused key, other keys are to be fused.
        qkv_templates = [
            (
                "layers.0.self_attn.q_proj.weight",
                "layers.0.self_attn.k_proj.weight",
                "layers.0.self_attn.v_proj.weight",
                "layers.0.self_attn.qkv_proj.weight",
            ),
            (
                "layers.0.self_attn.q_proj.bias",
                "layers.0.self_attn.k_proj.bias",
                "layers.0.self_attn.v_proj.bias",
                "layers.0.self_attn.qkv_proj.bias",
            ),
        ]
        gate_up_template = (
            "layers.0.mlp.gate_proj.weight",
            "layers.0.mlp.up_proj.weight",
            "layers.0.mlp.gate_up_fused_proj.weight",
        )

        num_heads = config.num_attention_heads
        num_key_value_heads = getattr(config, "num_key_value_heads", num_heads)
        fuse_attention_qkv = getattr(config, "fuse_attention_qkv", False)
        fuse_attention_ffn = getattr(config, "fuse_attention_ffn", False)

        def keys_for_layer(template, layer_idx):
            # Rewrite the layer-0 template names for the given layer.
            return tuple(
                name.replace("layers.0.", f"layers.{layer_idx}.") for name in template
            )

        if is_fuse:
            # Fusing: only act on what the target config wants fused.
            handle_qkv = fuse_attention_qkv
            handle_ffn = fuse_attention_ffn

            def make_qkv_action():
                return partial(
                    fn,
                    is_qkv=True,
                    num_heads=num_heads,
                    num_key_value_heads=num_key_value_heads,
                )

            def make_ffn_action():
                return fn

        else:
            # Splitting: only act on what the target config wants unfused.
            handle_qkv = not fuse_attention_qkv
            handle_ffn = not fuse_attention_ffn

            def make_qkv_action():
                return partial(
                    fn,
                    split_nums=3,
                    is_qkv=True,
                    num_heads=num_heads,
                    num_key_value_heads=num_key_value_heads,
                )

            def make_ffn_action():
                return partial(fn, split_nums=2)

        final_actions = {}
        if handle_qkv:
            for layer_idx in range(config.num_hidden_layers):
                for template in qkv_templates:
                    final_actions[keys_for_layer(template, layer_idx)] = make_qkv_action()
        if handle_ffn:
            for layer_idx in range(config.num_hidden_layers):
                final_actions[keys_for_layer(gate_up_template, layer_idx)] = make_ffn_action()
        return final_actions
1015
+
1016
+
1017
class Qwen2Model(Qwen2PretrainedModel):
    """
    Stack of *config.num_hidden_layers* [`Qwen2DecoderLayer`] blocks on top of a
    token embedding, followed by a final RMSNorm.

    Args:
        config: Qwen2Config
    """

    def __init__(self, config: Qwen2Config):
        super().__init__(config)
        self.padding_idx = config.pad_token_id
        self.vocab_size = config.vocab_size

        self.hidden_size = config.hidden_size
        self.sequence_parallel = config.sequence_parallel
        self.recompute_granularity = config.recompute_granularity
        configured_skips = config.no_recompute_layers
        self.no_recompute_layers = [] if configured_skips is None else configured_skips

        # Recompute defaults to False and is controlled by Trainer
        self.enable_recompute = False

        shard_vocab = (
            config.tensor_parallel_degree > 1
            and config.vocab_size % config.tensor_parallel_degree == 0
        )
        if shard_vocab:
            self.embed_tokens = mpu.VocabParallelEmbedding(
                self.vocab_size,
                self.hidden_size,
                weight_attr=paddle.ParamAttr(initializer=nn.initializer.XavierNormal()),
            )
        else:
            self.embed_tokens = nn.Embedding(
                self.vocab_size,
                self.hidden_size,
            )

        decoder_blocks = []
        for layer_idx in range(config.num_hidden_layers):
            decoder_blocks.append(
                Qwen2DecoderLayer(
                    config=config,
                    layerwise_recompute=layer_idx not in self.no_recompute_layers,
                )
            )
        self.layers = nn.LayerList(decoder_blocks)
        self.norm = Qwen2RMSNorm(config)

    def get_input_embeddings(self):
        """Return the token embedding layer."""
        return self.embed_tokens

    def set_input_embeddings(self, value):
        """Replace the token embedding layer."""
        self.embed_tokens = value

    @staticmethod
    def _prepare_decoder_attention_mask(
        attention_mask, input_shape, past_key_values_length, dtype
    ):
        """
        Turn a user mask (2-D, 3-D or 4-D) or no mask at all into the additive
        attention mask used by the decoder layers.
        """
        if attention_mask is None:
            expanded_attn_mask = _make_causal_mask(
                input_shape,
                past_key_values_length=past_key_values_length,
            )
        else:
            mask_rank = len(attention_mask.shape)
            if mask_rank == 2:
                # [bsz, seq_len] -> [bsz, 1, tgt_seq_len, src_seq_len]
                target_len = input_shape[-1]
                expanded_attn_mask = _expand_2d_mask(
                    attention_mask, dtype, tgt_length=target_len
                )
                # For decoding phase in generation, seq_length = 1, we don't need to add causal mask
                if target_len > 1:
                    causal_mask = _make_causal_mask(
                        input_shape,
                        past_key_values_length=past_key_values_length,
                    )
                    expanded_attn_mask = expanded_attn_mask & causal_mask
            elif mask_rank == 3:
                # [bsz, seq_len, seq_len] -> [bsz, 1, seq_len, seq_len]
                expanded_attn_mask = attention_mask.unsqueeze(1).astype("bool")
            else:
                # if attention_mask is already 4-D, do nothing
                expanded_attn_mask = attention_mask

        # Convert bool attention_mask to float attention mask, which will be added to attention_scores later
        if get_device_type() == "xpu":
            keep_value = paddle.to_tensor(0.0, dtype="float32")
            drop_value = paddle.to_tensor(-1.7005809656952787e38, dtype="float32")
            return paddle.where(expanded_attn_mask, keep_value, drop_value)

        float_mask = paddle.where(
            expanded_attn_mask.cast("bool"), 0.0, paddle.finfo(dtype).min
        )
        return float_mask.astype(dtype)

    def forward(
        self,
        input_ids: paddle.Tensor = None,
        position_ids: Optional[paddle.Tensor] = None,
        attention_mask: Optional[paddle.Tensor] = None,
        inputs_embeds: Optional[paddle.Tensor] = None,
        use_cache: Optional[bool] = None,
        past_key_values: Optional[List[paddle.Tensor]] = None,
        output_attentions: Optional[bool] = None,
        output_hidden_states: Optional[bool] = None,
        return_dict: Optional[bool] = None,
        attn_mask_startend_row_indices=None,
    ) -> Union[Tuple, BaseModelOutputWithPast]:
        """
        Embed the inputs (unless `inputs_embeds` is given), run every decoder
        layer and apply the final norm.

        Flags left as ``None`` fall back to the values stored on ``self.config``.
        Returns a `BaseModelOutputWithPast`, or a plain tuple of the non-``None``
        results when `return_dict` is false.
        """
        if output_attentions is None:
            output_attentions = self.config.output_attentions
        if output_hidden_states is None:
            output_hidden_states = self.config.output_hidden_states
        if use_cache is None:
            use_cache = self.config.use_cache
        if return_dict is None:
            return_dict = self.config.use_return_dict

        # retrieve input_ids and inputs_embeds
        if input_ids is not None and inputs_embeds is not None:
            raise ValueError(
                "You cannot specify both decoder_input_ids and decoder_inputs_embeds at the same time"
            )
        if input_ids is not None:
            batch_size, seq_length = input_ids.shape
        elif inputs_embeds is not None:
            batch_size, seq_length, _ = inputs_embeds.shape
        else:
            raise ValueError(
                "You have to specify either decoder_input_ids or decoder_inputs_embeds"
            )

        if past_key_values is None:
            past_key_values = tuple([None] * len(self.layers))
        # NOTE: to make cache can be clear in-time
        past_key_values = list(past_key_values)

        first_layer_cache = past_key_values[0]
        cache_length = 0 if first_layer_cache is None else first_layer_cache[0].shape[1]
        seq_length_with_past = seq_length + cache_length

        if inputs_embeds is None:
            # [bs, seq_len, dim]
            inputs_embeds = self.embed_tokens(input_ids)

        if self.sequence_parallel:
            # [bs, seq_len, num_head * head_dim] -> [bs * seq_len, num_head * head_dim]
            bs, seq_len, hidden_size = inputs_embeds.shape
            inputs_embeds = paddle.reshape_(inputs_embeds, [bs * seq_len, hidden_size])
            # [seq_len * bs / n, num_head * head_dim] (n is mp parallelism)
            inputs_embeds = ScatterOp.apply(inputs_embeds)

        # [bs, seq_len]
        if attention_mask is None:
            attention_mask = paddle.ones(
                (batch_size, seq_length_with_past), dtype=paddle.bool
            )
        attention_mask = self._prepare_decoder_attention_mask(
            attention_mask, (batch_size, seq_length), cache_length, inputs_embeds.dtype
        )  # [bs, 1, seq_len, seq_len]
        if self.config.use_flash_attention and is_casual_mask(attention_mask):
            # A purely causal mask is dropped on the flash-attention path.
            attention_mask = None

        if position_ids is None:
            position_ids = paddle.arange(seq_length, dtype="int64").expand(
                (batch_size, seq_length)
            )

        hidden_states = inputs_embeds

        # decoder layers
        hidden_trace = [] if output_hidden_states else None
        attention_trace = [] if output_attentions else None
        cache_trace = [] if use_cache else None

        for idx, decoder_layer in enumerate(self.layers):
            if output_hidden_states:
                hidden_trace.append(hidden_states)
            past_key_value = past_key_values[idx]

            has_gradient = not hidden_states.stop_gradient
            use_full_recompute = (
                self.enable_recompute
                and idx not in self.no_recompute_layers
                and has_gradient
                and self.recompute_granularity == "full"
            )
            if use_full_recompute:
                # NOTE(review): recompute_training_full is not defined in this
                # class body; presumably inherited or attached elsewhere - confirm.
                layer_outputs = self.recompute_training_full(
                    decoder_layer,
                    hidden_states,
                    position_ids,
                    attention_mask,
                    output_attentions,
                    past_key_value,
                    use_cache,
                    attn_mask_startend_row_indices=attn_mask_startend_row_indices,
                )
            else:
                layer_outputs = decoder_layer(
                    hidden_states,
                    position_ids,
                    attention_mask,
                    output_attentions,
                    past_key_value,
                    use_cache,
                    attn_mask_startend_row_indices=attn_mask_startend_row_indices,
                )

            # NOTE: clear outdate cache after it has been used for memory saving
            past_key_values[idx] = None
            past_key_value = None

            if type(layer_outputs) is tuple:
                hidden_states = layer_outputs[0]
            else:
                hidden_states = layer_outputs

            if output_attentions:
                attention_trace.append(layer_outputs[1])

            if use_cache:
                cache_trace.append(layer_outputs[2 if output_attentions else 1])

        hidden_states = self.norm(hidden_states)

        # add hidden states from the last decoder layer
        if output_hidden_states:
            hidden_trace.append(hidden_states)

        all_hidden_states = tuple(hidden_trace) if output_hidden_states else None
        all_self_attns = tuple(attention_trace) if output_attentions else None
        next_cache = tuple(cache_trace) if use_cache else None

        if not return_dict:
            candidates = [hidden_states, next_cache, all_hidden_states, all_self_attns]
            return tuple(item for item in candidates if item is not None)
        return BaseModelOutputWithPast(
            last_hidden_state=hidden_states,
            past_key_values=next_cache,
            hidden_states=all_hidden_states,
            attentions=all_self_attns,
        )
1262
+
1263
+
1264
class Qwen2PretrainingCriterion(nn.Layer):
    """
    Criterion for Qwen2.
    It calculates the final loss: the per-token cross entropy averaged over the
    tokens whose loss is strictly positive.
    """

    def __init__(self, config: Qwen2Config):
        super().__init__()
        self.ignore_index = getattr(config, "ignore_index", -100)
        self.config = config
        self.enable_parallel_cross_entropy = (
            config.tensor_parallel_degree > 1 and config.tensor_parallel_output
        )

        if not self.enable_parallel_cross_entropy:
            self.loss_func = paddle.nn.CrossEntropyLoss(
                reduction="none", ignore_index=self.ignore_index
            )
        else:
            self.loss_func = mpu.ParallelCrossEntropy(ignore_index=self.ignore_index)

    def forward(self, prediction_scores, masked_lm_labels):
        """Return the mean loss over positions with positive loss (or the plain sum if there are none)."""
        logits_cover_full_vocab = (
            self.enable_parallel_cross_entropy
            and prediction_scores.shape[-1] == self.config.vocab_size
        )
        if logits_cover_full_vocab:
            # The logits are not sharded, so switch (permanently) to the
            # non-parallel loss.
            logging.warning(
                f"enable_parallel_cross_entropy, the vocab_size should be splitted: {prediction_scores.shape[-1]}, {self.config.vocab_size}"
            )
            self.loss_func = paddle.nn.CrossEntropyLoss(
                reduction="none", ignore_index=self.ignore_index
            )

        with paddle.amp.auto_cast(False):
            token_loss = self.loss_func(
                prediction_scores.astype("float32"), masked_lm_labels.unsqueeze(2)
            )

            # Positions with zero loss (e.g. ignore_index) are left out of the
            # average: build a 0/1 selector instead of boolean indexing.
            selector = paddle.where(
                token_loss > 0,
                paddle.ones_like(token_loss),
                paddle.zeros_like(token_loss),
            )
            count = paddle.sum(selector)
            selected_total = paddle.sum(token_loss * selector)
            loss = selected_total if count == 0 else selected_total / count

        return loss
1317
+
1318
+
1319
class Qwen2LMHead(nn.Layer):
    """Projection from hidden states to vocabulary logits, optionally reusing the embedding weights."""

    def __init__(self, config: Qwen2Config, embedding_weights=None, transpose_y=False):
        """
        Args:
            config: model configuration.
            embedding_weights: parameter to reuse as the head weight; only
                consulted when `transpose_y` is true.
            transpose_y: whether the weight is stored as `[vocab, hidden]` and
                transposed in the matmul.
        """
        super().__init__()
        self.config = config

        tp_degree = config.tensor_parallel_degree
        vocab_is_sharded = tp_degree > 1 and config.vocab_size % tp_degree == 0
        vocab_size = config.vocab_size // tp_degree if vocab_is_sharded else config.vocab_size

        self.transpose_y = transpose_y
        if transpose_y and embedding_weights is not None:
            self.weight = embedding_weights
        else:
            # Layout follows transpose_y: [vocab, hidden] when the matmul
            # transposes the weight, [hidden, vocab] otherwise.
            if transpose_y:
                weight_shape = [vocab_size, config.hidden_size]
            else:
                weight_shape = [config.hidden_size, vocab_size]
            self.weight = self.create_parameter(
                shape=weight_shape,
                dtype=paddle.get_default_dtype(),
            )

        # Must set distributed attr for Tensor Parallel !
        self.weight.is_distributed = vocab_size != config.vocab_size
        if self.weight.is_distributed:
            # for tie_word_embeddings
            self.weight.split_axis = 0 if self.transpose_y else 1

    def forward(self, hidden_states, tensor_parallel_output=None):
        """Compute logits; `tensor_parallel_output=None` falls back to the config value."""
        cfg = self.config
        if cfg.sequence_parallel:
            gathered = GatherOp.apply(hidden_states)
            hidden_states = paddle.reshape_(
                gathered, [-1, cfg.seq_length, cfg.hidden_size]
            )

        if tensor_parallel_output is None:
            tensor_parallel_output = cfg.tensor_parallel_output

        return parallel_matmul(
            hidden_states,
            self.weight,
            transpose_y=self.transpose_y,
            tensor_parallel_output=tensor_parallel_output,
        )
1378
+
1379
+
1380
+ class Qwen2ForCausalLM(Qwen2PretrainedModel):
1381
+ enable_to_static_method = True
1382
+ _tied_weights_keys = ["lm_head.weight"]
1383
+
1384
def __init__(self, config: Qwen2Config):
    """Create the Qwen2 decoder, the LM head (tied to the embeddings if configured) and the loss criterion."""
    super().__init__(config)
    self.qwen2 = Qwen2Model(config)
    if not config.tie_word_embeddings:
        self.lm_head = Qwen2LMHead(config)
    else:
        # Share the embedding matrix with the head; it is stored
        # [vocab, hidden], hence transpose_y=True.
        shared_weight = self.qwen2.embed_tokens.weight
        self.lm_head = Qwen2LMHead(
            config,
            embedding_weights=shared_weight,
            transpose_y=True,
        )
        self.tie_weights()
    self.criterion = Qwen2PretrainingCriterion(config)
    self.vocab_size = config.vocab_size
1398
+
1399
def get_input_embeddings(self):
    """Return the token embedding layer of the wrapped decoder."""
    decoder = self.qwen2
    return decoder.embed_tokens
1401
+
1402
def set_input_embeddings(self, value):
    """Replace the token embedding layer of the wrapped decoder with `value`."""
    decoder = self.qwen2
    decoder.embed_tokens = value
1404
+
1405
def get_output_embeddings(self):
    """Return the language-model head."""
    head = self.lm_head
    return head
1407
+
1408
def set_output_embeddings(self, new_embeddings):
    """Replace the language-model head with `new_embeddings`."""
    replacement_head = new_embeddings
    self.lm_head = replacement_head
1410
+
1411
def set_decoder(self, decoder):
    """Replace the wrapped decoder model with `decoder`."""
    replacement_decoder = decoder
    self.qwen2 = replacement_decoder
1413
+
1414
def get_decoder(self):
    """Return the wrapped decoder model."""
    decoder = self.qwen2
    return decoder
1416
+
1417
def prepare_inputs_for_generation(
    self,
    input_ids,
    use_cache=False,
    past_key_values=None,
    attention_mask=None,
    inputs_embeds=None,
    **kwargs,
):
    """
    Assemble the keyword arguments for one generation step.

    With a non-empty cache only the last token id and last position are fed.
    `inputs_embeds` replaces `input_ids` only when `past_key_values` is None.
    """
    batch_size, seq_length = input_ids.shape
    default_positions = paddle.arange(seq_length).expand((batch_size, seq_length))
    position_ids = kwargs.get("position_ids", default_positions)

    if past_key_values:
        # Everything before the last token is already in the cache.
        input_ids = input_ids[:, -1].unsqueeze(axis=-1)
        position_ids = position_ids[:, -1].unsqueeze(-1)

    # if `inputs_embeds` are passed, we only want to use them in the 1st generation step
    first_step_with_embeds = inputs_embeds is not None and past_key_values is None
    if first_step_with_embeds:
        model_inputs = {"inputs_embeds": inputs_embeds}
    else:
        model_inputs = {"input_ids": input_ids}

    model_inputs["position_ids"] = position_ids
    model_inputs["past_key_values"] = past_key_values
    model_inputs["use_cache"] = use_cache
    model_inputs["attention_mask"] = attention_mask
    return model_inputs
1449
+
1450
def _get_model_inputs_spec(self, dtype: str):
    """Return static-graph input specs: three int64 inputs with two dynamic dimensions each.

    `dtype` is accepted but not used here.
    """

    def dynamic_int64_2d():
        return paddle.static.InputSpec(shape=[None, None], dtype="int64")

    input_spec = {}
    input_spec["input_ids"] = dynamic_int64_2d()
    input_spec["attention_mask"] = dynamic_int64_2d()
    input_spec["position_ids"] = dynamic_int64_2d()
    return input_spec
1458
+
1459
@staticmethod
def update_model_kwargs_for_generation(
    outputs, model_kwargs, is_encoder_decoder=False
):
    """
    Advance `model_kwargs` by one generated token (mutates and returns it).

    Stores the new cache, appends the next position id and extends the
    attention mask by one column.
    """
    # update cache
    tuple_carries_cache = (
        isinstance(outputs, tuple)
        and len(outputs) > 1
        and not isinstance(outputs[1], paddle.Tensor)
    )
    if tuple_carries_cache:
        model_kwargs["past_key_values"] = outputs[1]

    if isinstance(outputs, CausalLMOutputWithPast) and "past_key_values" in outputs:
        model_kwargs["past_key_values"] = outputs.past_key_values

    # update position_ids
    previous_positions = model_kwargs.get("position_ids")
    if previous_positions is not None:
        next_position = previous_positions[..., -1:] + 1
        model_kwargs["position_ids"] = paddle.concat(
            [previous_positions, next_position], axis=-1
        )

    if is_encoder_decoder or "attention_mask" not in model_kwargs:
        return model_kwargs

    # TODO: support attention mask for other models
    attention_mask = model_kwargs["attention_mask"]
    mask_rank = len(attention_mask.shape)
    if mask_rank == 2:
        new_column = paddle.ones(
            [attention_mask.shape[0], 1], dtype=attention_mask.dtype
        )
        model_kwargs["attention_mask"] = paddle.concat(
            [attention_mask, new_column], axis=-1
        )
    elif mask_rank == 4:
        new_column = paddle.ones(
            [*attention_mask.shape[:3], 1], dtype=attention_mask.dtype
        )
        widened = paddle.concat([attention_mask, new_column], axis=-1)
        # Keep only the last query row of the widened mask.
        model_kwargs["attention_mask"] = widened[:, :, -1:, :]

    return model_kwargs
1506
+
1507
def forward(
    self,
    input_ids: paddle.Tensor = None,
    position_ids: Optional[paddle.Tensor] = None,
    attention_mask: Optional[paddle.Tensor] = None,
    inputs_embeds: Optional[paddle.Tensor] = None,
    labels: Optional[paddle.Tensor] = None,
    use_cache: Optional[bool] = None,
    past_key_values: Optional[List[paddle.Tensor]] = None,
    output_attentions: Optional[bool] = None,
    output_hidden_states: Optional[bool] = None,
    return_dict: Optional[bool] = None,
    attn_mask_startend_row_indices=None,
) -> Union[Tuple, CausalLMOutputWithPast]:
    """Run the Qwen2 backbone and project its first output to logits.

    Args:
        input_ids: Forwarded unchanged to ``self.qwen2``.
        position_ids: Forwarded unchanged to ``self.qwen2``.
        attention_mask: Forwarded to ``self.qwen2``; replaced by ``None``
            (with a warning) when ``attn_mask_startend_row_indices`` is
            also provided.
        inputs_embeds: Forwarded unchanged to ``self.qwen2``.
        labels: Accepted for signature compatibility only. It is not
            read by this method, so no loss is computed here.
        use_cache: Forwarded unchanged to ``self.qwen2``.
        past_key_values: Forwarded unchanged to ``self.qwen2``.
        output_attentions: Falls back to ``self.config.output_attentions``
            when ``None``.
        output_hidden_states: Falls back to
            ``self.config.output_hidden_states`` when ``None``.
        return_dict: Falls back to ``self.config.use_return_dict`` when
            ``None``.
        attn_mask_startend_row_indices: Forwarded unchanged to
            ``self.qwen2``; takes precedence over ``attention_mask``.

    Returns:
        When ``return_dict`` is falsy, the tuple
        ``(logits,) + outputs[1:]`` where ``outputs`` is the backbone
        result. Otherwise a ``CausalLMOutputWithPast`` whose ``loss`` is
        ``None`` and whose ``past_key_values``, ``hidden_states`` and
        ``attentions`` are taken from the backbone result.
    """
    cfg = self.config

    # Explicit arguments win; the model config only supplies defaults.
    if output_attentions is None:
        output_attentions = cfg.output_attentions
    if output_hidden_states is None:
        output_hidden_states = cfg.output_hidden_states
    if return_dict is None:
        return_dict = cfg.use_return_dict

    # The two mask descriptions are mutually exclusive: keep the
    # start/end row indices and drop the dense mask.
    if attention_mask is not None and attn_mask_startend_row_indices is not None:
        logging.warning(
            "You have provided both attn_mask_startend_row_indices and attention_mask. "
            "The attn_mask_startend_row_indices will be used."
        )
        attention_mask = None

    backbone_out = self.qwen2(
        input_ids=input_ids,
        position_ids=position_ids,
        attention_mask=attention_mask,
        inputs_embeds=inputs_embeds,
        use_cache=use_cache,
        past_key_values=past_key_values,
        output_attentions=output_attentions,
        output_hidden_states=output_hidden_states,
        return_dict=return_dict,
        attn_mask_startend_row_indices=attn_mask_startend_row_indices,
    )

    # Ask the head for tensor-parallel output only when the config
    # requests it and the tensor-parallel degree is greater than one.
    keep_parallel_output = (
        cfg.tensor_parallel_output and cfg.tensor_parallel_degree > 1
    )

    # Element 0 of the backbone result is what the LM head consumes.
    logits = self.lm_head(
        backbone_out[0], tensor_parallel_output=keep_parallel_output
    )

    if not return_dict:
        # No loss is ever produced in this method, so the tuple form
        # never carries a leading loss entry.
        return (logits,) + backbone_out[1:]

    return CausalLMOutputWithPast(
        loss=None,
        logits=logits,
        past_key_values=backbone_out.past_key_values,
        hidden_states=backbone_out.hidden_states,
        attentions=backbone_out.attentions,
    )