paddlex: paddlex-3.0.0rc1-py3-none-any.whl → paddlex-3.0.2-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (240):
  1. paddlex/.version +1 -1
  2. paddlex/__init__.py +1 -1
  3. paddlex/configs/modules/chart_parsing/PP-Chart2Table.yaml +13 -0
  4. paddlex/configs/modules/doc_vlm/PP-DocBee2-3B.yaml +14 -0
  5. paddlex/configs/modules/formula_recognition/PP-FormulaNet_plus-L.yaml +40 -0
  6. paddlex/configs/modules/formula_recognition/PP-FormulaNet_plus-M.yaml +40 -0
  7. paddlex/configs/modules/formula_recognition/PP-FormulaNet_plus-S.yaml +40 -0
  8. paddlex/configs/modules/layout_detection/PP-DocBlockLayout.yaml +40 -0
  9. paddlex/configs/modules/layout_detection/PP-DocLayout-L.yaml +2 -2
  10. paddlex/configs/modules/layout_detection/PP-DocLayout-M.yaml +2 -2
  11. paddlex/configs/modules/layout_detection/PP-DocLayout-S.yaml +2 -2
  12. paddlex/configs/modules/layout_detection/PP-DocLayout_plus-L.yaml +40 -0
  13. paddlex/configs/modules/text_detection/PP-OCRv5_mobile_det.yaml +40 -0
  14. paddlex/configs/modules/text_detection/PP-OCRv5_server_det.yaml +40 -0
  15. paddlex/configs/modules/text_recognition/PP-OCRv5_mobile_rec.yaml +39 -0
  16. paddlex/configs/modules/text_recognition/PP-OCRv5_server_rec.yaml +39 -0
  17. paddlex/configs/modules/textline_orientation/PP-LCNet_x1_0_textline_ori.yaml +41 -0
  18. paddlex/configs/pipelines/OCR.yaml +7 -6
  19. paddlex/configs/pipelines/PP-ChatOCRv3-doc.yaml +3 -1
  20. paddlex/configs/pipelines/PP-ChatOCRv4-doc.yaml +91 -34
  21. paddlex/configs/pipelines/PP-StructureV3.yaml +72 -72
  22. paddlex/configs/pipelines/doc_understanding.yaml +1 -1
  23. paddlex/configs/pipelines/formula_recognition.yaml +2 -2
  24. paddlex/configs/pipelines/layout_parsing.yaml +3 -2
  25. paddlex/configs/pipelines/seal_recognition.yaml +1 -0
  26. paddlex/configs/pipelines/table_recognition.yaml +2 -1
  27. paddlex/configs/pipelines/table_recognition_v2.yaml +7 -1
  28. paddlex/hpip_links.html +20 -20
  29. paddlex/inference/common/batch_sampler/doc_vlm_batch_sampler.py +33 -10
  30. paddlex/inference/common/batch_sampler/image_batch_sampler.py +34 -25
  31. paddlex/inference/common/result/mixin.py +19 -12
  32. paddlex/inference/models/base/predictor/base_predictor.py +2 -8
  33. paddlex/inference/models/common/static_infer.py +29 -73
  34. paddlex/inference/models/common/tokenizer/__init__.py +2 -0
  35. paddlex/inference/models/common/tokenizer/clip_tokenizer.py +1 -1
  36. paddlex/inference/models/common/tokenizer/gpt_tokenizer.py +2 -2
  37. paddlex/inference/models/common/tokenizer/qwen2_5_tokenizer.py +112 -0
  38. paddlex/inference/models/common/tokenizer/qwen2_tokenizer.py +7 -1
  39. paddlex/inference/models/common/tokenizer/qwen_tokenizer.py +288 -0
  40. paddlex/inference/models/common/tokenizer/tokenizer_utils.py +13 -13
  41. paddlex/inference/models/common/tokenizer/tokenizer_utils_base.py +3 -3
  42. paddlex/inference/models/common/tokenizer/vocab.py +7 -7
  43. paddlex/inference/models/common/ts/funcs.py +19 -8
  44. paddlex/inference/models/common/vlm/conversion_utils.py +99 -0
  45. paddlex/inference/models/common/vlm/fusion_ops.py +205 -0
  46. paddlex/inference/models/common/vlm/generation/configuration_utils.py +1 -1
  47. paddlex/inference/models/common/vlm/generation/logits_process.py +1 -1
  48. paddlex/inference/models/common/vlm/generation/utils.py +1 -1
  49. paddlex/inference/models/common/vlm/transformers/configuration_utils.py +3 -3
  50. paddlex/inference/models/common/vlm/transformers/conversion_utils.py +3 -3
  51. paddlex/inference/models/common/vlm/transformers/model_outputs.py +2 -2
  52. paddlex/inference/models/common/vlm/transformers/model_utils.py +7 -31
  53. paddlex/inference/models/doc_vlm/modeling/GOT_ocr_2_0.py +830 -0
  54. paddlex/inference/models/doc_vlm/modeling/__init__.py +2 -0
  55. paddlex/inference/models/doc_vlm/modeling/qwen2.py +1606 -0
  56. paddlex/inference/models/doc_vlm/modeling/qwen2_5_vl.py +3006 -0
  57. paddlex/inference/models/doc_vlm/modeling/qwen2_vl.py +0 -105
  58. paddlex/inference/models/doc_vlm/predictor.py +79 -24
  59. paddlex/inference/models/doc_vlm/processors/GOT_ocr_2_0.py +97 -0
  60. paddlex/inference/models/doc_vlm/processors/__init__.py +2 -0
  61. paddlex/inference/models/doc_vlm/processors/common.py +189 -0
  62. paddlex/inference/models/doc_vlm/processors/qwen2_5_vl.py +548 -0
  63. paddlex/inference/models/doc_vlm/processors/qwen2_vl.py +21 -176
  64. paddlex/inference/models/formula_recognition/predictor.py +8 -2
  65. paddlex/inference/models/formula_recognition/processors.py +90 -77
  66. paddlex/inference/models/formula_recognition/result.py +28 -27
  67. paddlex/inference/models/image_feature/processors.py +3 -4
  68. paddlex/inference/models/keypoint_detection/predictor.py +3 -0
  69. paddlex/inference/models/object_detection/predictor.py +2 -0
  70. paddlex/inference/models/object_detection/processors.py +28 -3
  71. paddlex/inference/models/object_detection/utils.py +2 -0
  72. paddlex/inference/models/table_structure_recognition/result.py +0 -10
  73. paddlex/inference/models/text_detection/predictor.py +8 -0
  74. paddlex/inference/models/text_detection/processors.py +44 -10
  75. paddlex/inference/models/text_detection/result.py +0 -10
  76. paddlex/inference/models/text_recognition/result.py +1 -1
  77. paddlex/inference/pipelines/__init__.py +9 -5
  78. paddlex/inference/pipelines/_parallel.py +172 -0
  79. paddlex/inference/pipelines/anomaly_detection/pipeline.py +16 -6
  80. paddlex/inference/pipelines/attribute_recognition/pipeline.py +11 -1
  81. paddlex/inference/pipelines/base.py +14 -4
  82. paddlex/inference/pipelines/components/faisser.py +1 -1
  83. paddlex/inference/pipelines/doc_preprocessor/pipeline.py +53 -27
  84. paddlex/inference/pipelines/formula_recognition/pipeline.py +120 -82
  85. paddlex/inference/pipelines/formula_recognition/result.py +1 -11
  86. paddlex/inference/pipelines/image_classification/pipeline.py +16 -6
  87. paddlex/inference/pipelines/image_multilabel_classification/pipeline.py +16 -6
  88. paddlex/inference/pipelines/instance_segmentation/pipeline.py +16 -6
  89. paddlex/inference/pipelines/keypoint_detection/pipeline.py +16 -6
  90. paddlex/inference/pipelines/layout_parsing/layout_objects.py +859 -0
  91. paddlex/inference/pipelines/layout_parsing/pipeline.py +34 -47
  92. paddlex/inference/pipelines/layout_parsing/pipeline_v2.py +832 -260
  93. paddlex/inference/pipelines/layout_parsing/result.py +4 -17
  94. paddlex/inference/pipelines/layout_parsing/result_v2.py +259 -245
  95. paddlex/inference/pipelines/layout_parsing/setting.py +88 -0
  96. paddlex/inference/pipelines/layout_parsing/utils.py +391 -2028
  97. paddlex/inference/pipelines/layout_parsing/xycut_enhanced/__init__.py +16 -0
  98. paddlex/inference/pipelines/layout_parsing/xycut_enhanced/utils.py +1199 -0
  99. paddlex/inference/pipelines/layout_parsing/xycut_enhanced/xycuts.py +615 -0
  100. paddlex/inference/pipelines/m_3d_bev_detection/pipeline.py +2 -2
  101. paddlex/inference/pipelines/multilingual_speech_recognition/pipeline.py +2 -2
  102. paddlex/inference/pipelines/object_detection/pipeline.py +16 -6
  103. paddlex/inference/pipelines/ocr/pipeline.py +127 -70
  104. paddlex/inference/pipelines/ocr/result.py +21 -18
  105. paddlex/inference/pipelines/open_vocabulary_detection/pipeline.py +2 -2
  106. paddlex/inference/pipelines/open_vocabulary_segmentation/pipeline.py +2 -2
  107. paddlex/inference/pipelines/pp_chatocr/pipeline_base.py +2 -2
  108. paddlex/inference/pipelines/pp_chatocr/pipeline_v3.py +2 -5
  109. paddlex/inference/pipelines/pp_chatocr/pipeline_v4.py +6 -6
  110. paddlex/inference/pipelines/rotated_object_detection/pipeline.py +16 -6
  111. paddlex/inference/pipelines/seal_recognition/pipeline.py +109 -53
  112. paddlex/inference/pipelines/semantic_segmentation/pipeline.py +16 -6
  113. paddlex/inference/pipelines/small_object_detection/pipeline.py +16 -6
  114. paddlex/inference/pipelines/table_recognition/pipeline.py +26 -18
  115. paddlex/inference/pipelines/table_recognition/pipeline_v2.py +624 -53
  116. paddlex/inference/pipelines/table_recognition/result.py +1 -1
  117. paddlex/inference/pipelines/table_recognition/table_recognition_post_processing_v2.py +9 -5
  118. paddlex/inference/pipelines/ts_anomaly_detection/pipeline.py +2 -2
  119. paddlex/inference/pipelines/ts_classification/pipeline.py +2 -2
  120. paddlex/inference/pipelines/ts_forecasting/pipeline.py +2 -2
  121. paddlex/inference/pipelines/video_classification/pipeline.py +2 -2
  122. paddlex/inference/pipelines/video_detection/pipeline.py +2 -2
  123. paddlex/inference/serving/basic_serving/_app.py +46 -13
  124. paddlex/inference/serving/basic_serving/_pipeline_apps/_common/common.py +5 -1
  125. paddlex/inference/serving/basic_serving/_pipeline_apps/layout_parsing.py +0 -1
  126. paddlex/inference/serving/basic_serving/_pipeline_apps/pp_chatocrv3_doc.py +0 -1
  127. paddlex/inference/serving/basic_serving/_pipeline_apps/pp_chatocrv4_doc.py +1 -1
  128. paddlex/inference/serving/basic_serving/_pipeline_apps/pp_structurev3.py +6 -2
  129. paddlex/inference/serving/basic_serving/_pipeline_apps/table_recognition.py +1 -5
  130. paddlex/inference/serving/basic_serving/_pipeline_apps/table_recognition_v2.py +4 -5
  131. paddlex/inference/serving/infra/utils.py +20 -22
  132. paddlex/inference/serving/schemas/formula_recognition.py +1 -1
  133. paddlex/inference/serving/schemas/layout_parsing.py +1 -2
  134. paddlex/inference/serving/schemas/pp_chatocrv3_doc.py +1 -2
  135. paddlex/inference/serving/schemas/pp_chatocrv4_doc.py +2 -2
  136. paddlex/inference/serving/schemas/pp_structurev3.py +10 -6
  137. paddlex/inference/serving/schemas/seal_recognition.py +1 -1
  138. paddlex/inference/serving/schemas/table_recognition.py +2 -6
  139. paddlex/inference/serving/schemas/table_recognition_v2.py +5 -6
  140. paddlex/inference/utils/hpi.py +30 -16
  141. paddlex/inference/utils/hpi_model_info_collection.json +666 -162
  142. paddlex/inference/utils/io/readers.py +12 -12
  143. paddlex/inference/utils/misc.py +20 -0
  144. paddlex/inference/utils/mkldnn_blocklist.py +59 -0
  145. paddlex/inference/utils/official_models.py +140 -5
  146. paddlex/inference/utils/pp_option.py +74 -9
  147. paddlex/model.py +2 -2
  148. paddlex/modules/__init__.py +1 -1
  149. paddlex/modules/anomaly_detection/evaluator.py +2 -2
  150. paddlex/modules/base/__init__.py +1 -1
  151. paddlex/modules/base/evaluator.py +5 -5
  152. paddlex/modules/base/trainer.py +1 -1
  153. paddlex/modules/doc_vlm/dataset_checker.py +2 -2
  154. paddlex/modules/doc_vlm/evaluator.py +2 -2
  155. paddlex/modules/doc_vlm/exportor.py +2 -2
  156. paddlex/modules/doc_vlm/model_list.py +1 -1
  157. paddlex/modules/doc_vlm/trainer.py +2 -2
  158. paddlex/modules/face_recognition/evaluator.py +2 -2
  159. paddlex/modules/formula_recognition/evaluator.py +5 -2
  160. paddlex/modules/formula_recognition/model_list.py +3 -0
  161. paddlex/modules/formula_recognition/trainer.py +3 -0
  162. paddlex/modules/general_recognition/evaluator.py +1 -1
  163. paddlex/modules/image_classification/evaluator.py +2 -2
  164. paddlex/modules/image_classification/model_list.py +1 -0
  165. paddlex/modules/instance_segmentation/evaluator.py +1 -1
  166. paddlex/modules/keypoint_detection/evaluator.py +1 -1
  167. paddlex/modules/m_3d_bev_detection/evaluator.py +2 -2
  168. paddlex/modules/multilabel_classification/evaluator.py +2 -2
  169. paddlex/modules/object_detection/dataset_checker/dataset_src/convert_dataset.py +4 -4
  170. paddlex/modules/object_detection/evaluator.py +2 -2
  171. paddlex/modules/object_detection/model_list.py +2 -0
  172. paddlex/modules/semantic_segmentation/dataset_checker/__init__.py +12 -2
  173. paddlex/modules/semantic_segmentation/evaluator.py +2 -2
  174. paddlex/modules/table_recognition/evaluator.py +2 -2
  175. paddlex/modules/text_detection/evaluator.py +2 -2
  176. paddlex/modules/text_detection/model_list.py +2 -0
  177. paddlex/modules/text_recognition/evaluator.py +2 -2
  178. paddlex/modules/text_recognition/model_list.py +2 -0
  179. paddlex/modules/ts_anomaly_detection/evaluator.py +2 -2
  180. paddlex/modules/ts_classification/dataset_checker/dataset_src/split_dataset.py +1 -1
  181. paddlex/modules/ts_classification/evaluator.py +2 -2
  182. paddlex/modules/ts_forecast/evaluator.py +2 -2
  183. paddlex/modules/video_classification/evaluator.py +2 -2
  184. paddlex/modules/video_detection/evaluator.py +2 -2
  185. paddlex/ops/__init__.py +8 -5
  186. paddlex/paddlex_cli.py +19 -13
  187. paddlex/repo_apis/Paddle3D_api/bev_fusion/model.py +2 -2
  188. paddlex/repo_apis/PaddleClas_api/cls/config.py +1 -1
  189. paddlex/repo_apis/PaddleClas_api/cls/model.py +1 -1
  190. paddlex/repo_apis/PaddleClas_api/cls/register.py +10 -0
  191. paddlex/repo_apis/PaddleClas_api/cls/runner.py +1 -1
  192. paddlex/repo_apis/PaddleDetection_api/instance_seg/model.py +1 -1
  193. paddlex/repo_apis/PaddleDetection_api/instance_seg/runner.py +1 -1
  194. paddlex/repo_apis/PaddleDetection_api/object_det/config.py +1 -1
  195. paddlex/repo_apis/PaddleDetection_api/object_det/model.py +1 -1
  196. paddlex/repo_apis/PaddleDetection_api/object_det/official_categories.py +25 -0
  197. paddlex/repo_apis/PaddleDetection_api/object_det/register.py +30 -0
  198. paddlex/repo_apis/PaddleDetection_api/object_det/runner.py +1 -1
  199. paddlex/repo_apis/PaddleOCR_api/formula_rec/config.py +3 -3
  200. paddlex/repo_apis/PaddleOCR_api/formula_rec/model.py +5 -9
  201. paddlex/repo_apis/PaddleOCR_api/formula_rec/register.py +27 -0
  202. paddlex/repo_apis/PaddleOCR_api/formula_rec/runner.py +1 -1
  203. paddlex/repo_apis/PaddleOCR_api/table_rec/model.py +1 -1
  204. paddlex/repo_apis/PaddleOCR_api/table_rec/runner.py +1 -1
  205. paddlex/repo_apis/PaddleOCR_api/text_det/model.py +1 -1
  206. paddlex/repo_apis/PaddleOCR_api/text_det/register.py +18 -0
  207. paddlex/repo_apis/PaddleOCR_api/text_det/runner.py +1 -1
  208. paddlex/repo_apis/PaddleOCR_api/text_rec/config.py +3 -3
  209. paddlex/repo_apis/PaddleOCR_api/text_rec/model.py +5 -9
  210. paddlex/repo_apis/PaddleOCR_api/text_rec/register.py +18 -0
  211. paddlex/repo_apis/PaddleOCR_api/text_rec/runner.py +1 -1
  212. paddlex/repo_apis/PaddleSeg_api/seg/model.py +1 -1
  213. paddlex/repo_apis/PaddleSeg_api/seg/runner.py +1 -1
  214. paddlex/repo_apis/PaddleTS_api/ts_ad/config.py +3 -3
  215. paddlex/repo_apis/PaddleTS_api/ts_cls/config.py +2 -2
  216. paddlex/repo_apis/PaddleTS_api/ts_fc/config.py +4 -4
  217. paddlex/repo_apis/PaddleVideo_api/video_cls/config.py +1 -1
  218. paddlex/repo_apis/PaddleVideo_api/video_cls/model.py +1 -1
  219. paddlex/repo_apis/PaddleVideo_api/video_cls/runner.py +1 -1
  220. paddlex/repo_apis/PaddleVideo_api/video_det/config.py +1 -1
  221. paddlex/repo_apis/PaddleVideo_api/video_det/model.py +1 -1
  222. paddlex/repo_apis/PaddleVideo_api/video_det/runner.py +1 -1
  223. paddlex/repo_apis/base/config.py +1 -1
  224. paddlex/repo_manager/core.py +3 -3
  225. paddlex/repo_manager/meta.py +6 -2
  226. paddlex/repo_manager/repo.py +17 -16
  227. paddlex/utils/custom_device_list.py +26 -2
  228. paddlex/utils/deps.py +3 -3
  229. paddlex/utils/device.py +5 -13
  230. paddlex/utils/env.py +4 -0
  231. paddlex/utils/flags.py +11 -4
  232. paddlex/utils/fonts/__init__.py +34 -4
  233. paddlex/utils/misc.py +1 -1
  234. paddlex/utils/subclass_register.py +2 -2
  235. {paddlex-3.0.0rc1.dist-info → paddlex-3.0.2.dist-info}/METADATA +349 -208
  236. {paddlex-3.0.0rc1.dist-info → paddlex-3.0.2.dist-info}/RECORD +240 -211
  237. {paddlex-3.0.0rc1.dist-info → paddlex-3.0.2.dist-info}/WHEEL +1 -1
  238. {paddlex-3.0.0rc1.dist-info → paddlex-3.0.2.dist-info}/entry_points.txt +1 -0
  239. {paddlex-3.0.0rc1.dist-info/licenses → paddlex-3.0.2.dist-info}/LICENSE +0 -0
  240. {paddlex-3.0.0rc1.dist-info → paddlex-3.0.2.dist-info}/top_level.txt +0 -0
paddlex/.version CHANGED
@@ -1 +1 @@
1
- 3.0.0.rc1
1
+ 3.0.2
paddlex/__init__.py CHANGED
@@ -24,7 +24,7 @@ for mod in _SPECIAL_MODS:
24
24
  from . import version
25
25
  from .inference import create_pipeline, create_predictor
26
26
  from .model import create_model
27
- from .modules import build_dataset_checker, build_evaluater, build_trainer
27
+ from .modules import build_dataset_checker, build_evaluator, build_trainer
28
28
 
29
29
 
30
30
  def _initialize():
paddlex/configs/modules/chart_parsing/PP-Chart2Table.yaml ADDED
@@ -0,0 +1,13 @@
1
+ Global:
2
+ model: PP-Chart2Table
3
+ mode: predict # only support predict
4
+ device: gpu:0
5
+ output: "output"
6
+
7
+ Predict:
8
+ batch_size: 1
9
+ model_dir: "/path/to/PP-Chart2Table"
10
+ input:
11
+ image: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/chart_parsing_02.png"
12
+ kernel_option:
13
+ run_mode: paddle
paddlex/configs/modules/doc_vlm/PP-DocBee2-3B.yaml ADDED
@@ -0,0 +1,14 @@
1
+ Global:
2
+ model: PP-DocBee2-3B
3
+ mode: predict # only support predict
4
+ device: gpu:0
5
+ output: "output"
6
+
7
+ Predict:
8
+ batch_size: 1
9
+ model_dir: "/path/to/PP-DocBee2-3B"
10
+ input:
11
+ image: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/medal_table.png"
12
+ query: "识别这份表格的内容, 以markdown格式输出"
13
+ kernel_option:
14
+ run_mode: paddle
paddlex/configs/modules/formula_recognition/PP-FormulaNet_plus-L.yaml ADDED
@@ -0,0 +1,40 @@
1
+ Global:
2
+ model: PP-FormulaNet_plus-L
3
+ mode: check_dataset # check_dataset/train/evaluate/predict
4
+ dataset_dir: "./dataset/ocr_rec_latexocr_dataset_example"
5
+ device: gpu:0,1,2,3
6
+ output: "output"
7
+
8
+ CheckDataset:
9
+ convert:
10
+ enable: False
11
+ src_dataset_type: FormulaRecDataset
12
+ split:
13
+ enable: False
14
+ train_percent: null
15
+ val_percent: null
16
+
17
+ Train:
18
+ epochs_iters: 20
19
+ batch_size: 3
20
+ learning_rate: 0.0001
21
+ pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-FormulaNet_plus-L_pretrained.pdparams
22
+ resume_path: null
23
+ log_interval: 20
24
+ eval_interval: 1
25
+ save_interval: 1
26
+
27
+ Evaluate:
28
+ batch_size: 3
29
+ weight_path: output/best_accuracy/best_accuracy.pdparams
30
+ log_interval: 1
31
+
32
+ Export:
33
+ weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-FormulaNet_plus-L_pretrained.pdparams
34
+
35
+ Predict:
36
+ batch_size: 1
37
+ model_dir: "output/best_accuracy/inference"
38
+ input: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/general_formula_rec_001.png"
39
+ kernel_option:
40
+ run_mode: paddle
paddlex/configs/modules/formula_recognition/PP-FormulaNet_plus-M.yaml ADDED
@@ -0,0 +1,40 @@
1
+ Global:
2
+ model: PP-FormulaNet_plus-M
3
+ mode: check_dataset # check_dataset/train/evaluate/predict
4
+ dataset_dir: "./dataset/ocr_rec_latexocr_dataset_example"
5
+ device: gpu:0,1,2,3
6
+ output: "output"
7
+
8
+ CheckDataset:
9
+ convert:
10
+ enable: False
11
+ src_dataset_type: FormulaRecDataset
12
+ split:
13
+ enable: False
14
+ train_percent: null
15
+ val_percent: null
16
+
17
+ Train:
18
+ epochs_iters: 20
19
+ batch_size: 14
20
+ learning_rate: 0.0001
21
+ pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-FormulaNet_plus-M_pretrained.pdparams
22
+ resume_path: null
23
+ log_interval: 20
24
+ eval_interval: 1
25
+ save_interval: 1
26
+
27
+ Evaluate:
28
+ batch_size: 20
29
+ weight_path: output/best_accuracy/best_accuracy.pdparams
30
+ log_interval: 1
31
+
32
+ Export:
33
+ weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-FormulaNet_plus-M_pretrained.pdparams
34
+
35
+ Predict:
36
+ batch_size: 1
37
+ model_dir: "output/best_accuracy/inference"
38
+ input: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/general_formula_rec_001.png"
39
+ kernel_option:
40
+ run_mode: paddle
paddlex/configs/modules/formula_recognition/PP-FormulaNet_plus-S.yaml ADDED
@@ -0,0 +1,40 @@
1
+ Global:
2
+ model: PP-FormulaNet_plus-S
3
+ mode: check_dataset # check_dataset/train/evaluate/predict
4
+ dataset_dir: "./dataset/ocr_rec_latexocr_dataset_example"
5
+ device: gpu:0,1,2,3
6
+ output: "output"
7
+
8
+ CheckDataset:
9
+ convert:
10
+ enable: False
11
+ src_dataset_type: FormulaRecDataset
12
+ split:
13
+ enable: False
14
+ train_percent: null
15
+ val_percent: null
16
+
17
+ Train:
18
+ epochs_iters: 20
19
+ batch_size: 14
20
+ learning_rate: 0.0001
21
+ pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-FormulaNet_plus-S_pretrained.pdparams
22
+ resume_path: null
23
+ log_interval: 20
24
+ eval_interval: 1
25
+ save_interval: 1
26
+
27
+ Evaluate:
28
+ batch_size: 20
29
+ weight_path: output/best_accuracy/best_accuracy.pdparams
30
+ log_interval: 1
31
+
32
+ Export:
33
+ weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-FormulaNet_plus-S_pretrained.pdparams
34
+
35
+ Predict:
36
+ batch_size: 1
37
+ model_dir: "output/best_accuracy/inference"
38
+ input: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/general_formula_rec_001.png"
39
+ kernel_option:
40
+ run_mode: paddle
paddlex/configs/modules/layout_detection/PP-DocBlockLayout.yaml ADDED
@@ -0,0 +1,40 @@
1
+ Global:
2
+ model: PP-DocBlockLayout
3
+ mode: check_dataset # check_dataset/train/evaluate/predict
4
+ dataset_dir: "/paddle/dataset/paddlex/layout/det_layout_examples"
5
+ device: gpu:0,1,2,3
6
+ output: "output"
7
+
8
+ CheckDataset:
9
+ convert:
10
+ enable: False
11
+ src_dataset_type: null
12
+ split:
13
+ enable: False
14
+ train_percent: null
15
+ val_percent: null
16
+
17
+ Train:
18
+ num_classes: 11
19
+ epochs_iters: 100
20
+ batch_size: 1
21
+ learning_rate: 0.0001
22
+ pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocBlockLayout_pretrained.pdparams
23
+ warmup_steps: 100
24
+ resume_path: null
25
+ log_interval: 10
26
+ eval_interval: 1
27
+
28
+ Evaluate:
29
+ weight_path: "output/best_model/best_model.pdparams"
30
+ log_interval: 10
31
+
32
+ Export:
33
+ weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocBlockLayout_pretrained.pdparams
34
+
35
+ Predict:
36
+ batch_size: 1
37
+ model_dir: "output/best_model/inference"
38
+ input: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/layout.jpg"
39
+ kernel_option:
40
+ run_mode: paddle
paddlex/configs/modules/layout_detection/PP-DocLayout-L.yaml CHANGED
@@ -19,7 +19,7 @@ Train:
19
19
  epochs_iters: 100
20
20
  batch_size: 1
21
21
  learning_rate: 0.0001
22
- pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-L_pretrain.pdparams
22
+ pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-L_pretrained.pdparams
23
23
  warmup_steps: 100
24
24
  resume_path: null
25
25
  log_interval: 10
@@ -30,7 +30,7 @@ Evaluate:
30
30
  log_interval: 10
31
31
 
32
32
  Export:
33
- weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-L_pretrain.pdparams
33
+ weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-L_pretrained.pdparams
34
34
 
35
35
  Predict:
36
36
  batch_size: 1
paddlex/configs/modules/layout_detection/PP-DocLayout-M.yaml CHANGED
@@ -19,7 +19,7 @@ Train:
19
19
  epochs_iters: 100
20
20
  batch_size: 1
21
21
  learning_rate: 0.0001
22
- pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-M_pretrain.pdparams
22
+ pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-M_pretrained.pdparams
23
23
  warmup_steps: 100
24
24
  resume_path: null
25
25
  log_interval: 10
@@ -30,7 +30,7 @@ Evaluate:
30
30
  log_interval: 10
31
31
 
32
32
  Export:
33
- weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-M_pretrain.pdparams
33
+ weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-M_pretrained.pdparams
34
34
 
35
35
  Predict:
36
36
  batch_size: 1
paddlex/configs/modules/layout_detection/PP-DocLayout-S.yaml CHANGED
@@ -19,7 +19,7 @@ Train:
19
19
  epochs_iters: 100
20
20
  batch_size: 1
21
21
  learning_rate: 0.0001
22
- pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-S_pretrain.pdparams
22
+ pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-S_pretrained.pdparams
23
23
  warmup_steps: 100
24
24
  resume_path: null
25
25
  log_interval: 10
@@ -30,7 +30,7 @@ Evaluate:
30
30
  log_interval: 10
31
31
 
32
32
  Export:
33
- weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-S_pretrain.pdparams
33
+ weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-S_pretrained.pdparams
34
34
 
35
35
  Predict:
36
36
  batch_size: 1
paddlex/configs/modules/layout_detection/PP-DocLayout_plus-L.yaml ADDED
@@ -0,0 +1,40 @@
1
+ Global:
2
+ model: PP-DocLayout_plus-L
3
+ mode: check_dataset # check_dataset/train/evaluate/predict
4
+ dataset_dir: "/paddle/dataset/paddlex/layout/det_layout_examples"
5
+ device: gpu:0,1,2,3
6
+ output: "output"
7
+
8
+ CheckDataset:
9
+ convert:
10
+ enable: False
11
+ src_dataset_type: null
12
+ split:
13
+ enable: False
14
+ train_percent: null
15
+ val_percent: null
16
+
17
+ Train:
18
+ num_classes: 11
19
+ epochs_iters: 100
20
+ batch_size: 1
21
+ learning_rate: 0.0001
22
+ pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout_plus-L_pretrained.pdparams
23
+ warmup_steps: 100
24
+ resume_path: null
25
+ log_interval: 10
26
+ eval_interval: 1
27
+
28
+ Evaluate:
29
+ weight_path: "output/best_model/best_model.pdparams"
30
+ log_interval: 10
31
+
32
+ Export:
33
+ weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout_plus-L_pretrained.pdparams
34
+
35
+ Predict:
36
+ batch_size: 1
37
+ model_dir: "output/best_model/inference"
38
+ input: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/layout.jpg"
39
+ kernel_option:
40
+ run_mode: paddle
paddlex/configs/modules/text_detection/PP-OCRv5_mobile_det.yaml ADDED
@@ -0,0 +1,40 @@
1
+ Global:
2
+ model: PP-OCRv5_mobile_det
3
+ mode: check_dataset # check_dataset/train/evaluate/predict
4
+ module: text_det
5
+ dataset_dir: "/paddle/dataset/paddlex/ocr_det/ocr_det_dataset_examples"
6
+ device: gpu:0,1,2,3
7
+ output: "output"
8
+
9
+ CheckDataset:
10
+ convert:
11
+ enable: False
12
+ src_dataset_type: null
13
+ split:
14
+ enable: False
15
+ train_percent: null
16
+ val_percent: null
17
+
18
+ Train:
19
+ epochs_iters: 100
20
+ batch_size: 4
21
+ learning_rate: 0.001
22
+ pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-OCRv5_mobile_det_pretrained.pdparams
23
+ resume_path: null
24
+ log_interval: 10
25
+ eval_interval: 1
26
+ save_interval: 1
27
+
28
+ Evaluate:
29
+ weight_path: "output/best_accuracy/best_accuracy.pdparams"
30
+ log_interval: 1
31
+
32
+ Export:
33
+ weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-OCRv5_mobile_det_pretrained.pdparams
34
+
35
+ Predict:
36
+ batch_size: 1
37
+ model_dir: "output/best_accuracy/inference"
38
+ input: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/general_ocr_001.png"
39
+ kernel_option:
40
+ run_mode: paddle
paddlex/configs/modules/text_detection/PP-OCRv5_server_det.yaml ADDED
@@ -0,0 +1,40 @@
1
+ Global:
2
+ model: PP-OCRv5_server_det
3
+ mode: check_dataset # check_dataset/train/evaluate/predict
4
+ module: text_det
5
+ dataset_dir: "/paddle/dataset/paddlex/ocr_det/ocr_det_dataset_examples"
6
+ device: gpu:0,1,2,3
7
+ output: "output"
8
+
9
+ CheckDataset:
10
+ convert:
11
+ enable: False
12
+ src_dataset_type: null
13
+ split:
14
+ enable: False
15
+ train_percent: null
16
+ val_percent: null
17
+
18
+ Train:
19
+ epochs_iters: 100
20
+ batch_size: 4
21
+ learning_rate: 0.001
22
+ pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-OCRv5_server_det_pretrained.pdparams
23
+ resume_path: null
24
+ log_interval: 10
25
+ eval_interval: 1
26
+ save_interval: 1
27
+
28
+ Evaluate:
29
+ weight_path: "output/best_accuracy/best_accuracy.pdparams"
30
+ log_interval: 1
31
+
32
+ Export:
33
+ weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-OCRv5_server_det_pretrained.pdparams
34
+
35
+ Predict:
36
+ batch_size: 1
37
+ model_dir: "output/best_accuracy/inference"
38
+ input: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/general_ocr_001.png"
39
+ kernel_option:
40
+ run_mode: paddle
paddlex/configs/modules/text_recognition/PP-OCRv5_mobile_rec.yaml ADDED
@@ -0,0 +1,39 @@
1
+ Global:
2
+ model: PP-OCRv5_mobile_rec
3
+ mode: check_dataset # check_dataset/train/evaluate/predict
4
+ dataset_dir: "/paddle/dataset/paddlex/ocr_rec/ocr_rec_dataset_examples"
5
+ device: gpu:0,1,2,3
6
+ output: "output"
7
+
8
+ CheckDataset:
9
+ convert:
10
+ enable: False
11
+ src_dataset_type: null
12
+ split:
13
+ enable: False
14
+ train_percent: null
15
+ val_percent: null
16
+
17
+ Train:
18
+ epochs_iters: 20
19
+ batch_size: 8
20
+ learning_rate: 0.001
21
+ pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-OCRv5_mobile_rec_pretrained.pdparams
22
+ resume_path: null
23
+ log_interval: 20
24
+ eval_interval: 1
25
+ save_interval: 1
26
+
27
+ Evaluate:
28
+ weight_path: "output/best_accuracy/best_accuracy.pdparams"
29
+ log_interval: 1
30
+
31
+ Export:
32
+ weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-OCRv5_mobile_rec_pretrained.pdparams
33
+
34
+ Predict:
35
+ batch_size: 1
36
+ model_dir: "output/best_accuracy/inference"
37
+ input: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/general_ocr_rec_001.png"
38
+ kernel_option:
39
+ run_mode: paddle
paddlex/configs/modules/text_recognition/PP-OCRv5_server_rec.yaml ADDED
@@ -0,0 +1,39 @@
1
+ Global:
2
+ model: PP-OCRv5_server_rec
3
+ mode: check_dataset # check_dataset/train/evaluate/predict
4
+ dataset_dir: "/paddle/dataset/paddlex/ocr_rec/ocr_rec_dataset_examples"
5
+ device: gpu:0,1,2,3
6
+ output: "output"
7
+
8
+ CheckDataset:
9
+ convert:
10
+ enable: False
11
+ src_dataset_type: null
12
+ split:
13
+ enable: False
14
+ train_percent: null
15
+ val_percent: null
16
+
17
+ Train:
18
+ epochs_iters: 20
19
+ batch_size: 8
20
+ learning_rate: 0.001
21
+ pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-OCRv5_server_rec_pretrained.pdparams
22
+ resume_path: null
23
+ log_interval: 20
24
+ eval_interval: 1
25
+ save_interval: 1
26
+
27
+ Evaluate:
28
+ weight_path: "output/best_accuracy/best_accuracy.pdparams"
29
+ log_interval: 1
30
+
31
+ Export:
32
+ weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-OCRv5_server_rec_pretrained.pdparams
33
+
34
+ Predict:
35
+ batch_size: 1
36
+ model_dir: "output/best_accuracy/inference"
37
+ input: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/general_ocr_rec_001.png"
38
+ kernel_option:
39
+ run_mode: paddle
paddlex/configs/modules/textline_orientation/PP-LCNet_x1_0_textline_ori.yaml ADDED
@@ -0,0 +1,41 @@
1
+ Global:
2
+ model: PP-LCNet_x1_0_textline_ori
3
+ mode: check_dataset # check_dataset/train/evaluate/predict
4
+ dataset_dir: "/paddle/dataset/paddlex/cls/textline_orientation_example_data"
5
+ device: gpu:0,1,2,3
6
+ output: "output"
7
+
8
+ CheckDataset:
9
+ convert:
10
+ enable: False
11
+ src_dataset_type: null
12
+ split:
13
+ enable: False
14
+ train_percent: null
15
+ val_percent: null
16
+
17
+ Train:
18
+ num_classes: 2
19
+ epochs_iters: 20
20
+ batch_size: 32
21
+ learning_rate: 0.8
22
+ pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-LCNet_x1_0_textline_ori_pretrained.pdparams
23
+ warmup_steps: 100
24
+ resume_path: null
25
+ log_interval: 10
26
+ eval_interval: 1
27
+ save_interval: 1
28
+
29
+ Evaluate:
30
+ weight_path: "output/best_model/best_model.pdparams"
31
+ log_interval: 10
32
+
33
+ Export:
34
+ weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-LCNet_x1_0_textline_ori_pretrained.pdparams
35
+
36
+ Predict:
37
+ batch_size: 1
38
+ model_dir: "output/best_model/inference"
39
+ input: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/img_textline180_demo.jpg"
40
+ kernel_option:
41
+ run_mode: paddle
paddlex/configs/pipelines/OCR.yaml CHANGED
@@ -24,21 +24,22 @@ SubPipelines:
24
24
  SubModules:
25
25
  TextDetection:
26
26
  module_name: text_detection
27
- model_name: PP-OCRv4_mobile_det
27
+ model_name: PP-OCRv5_server_det
28
28
  model_dir: null
29
- limit_side_len: 960
30
- limit_type: max
29
+ limit_side_len: 64
30
+ limit_type: min
31
+ max_side_limit: 4000
31
32
  thresh: 0.3
32
33
  box_thresh: 0.6
33
- unclip_ratio: 2.0
34
+ unclip_ratio: 1.5
34
35
  TextLineOrientation:
35
36
  module_name: textline_orientation
36
- model_name: PP-LCNet_x0_25_textline_ori
37
+ model_name: PP-LCNet_x1_0_textline_ori
37
38
  model_dir: null
38
39
  batch_size: 6
39
40
  TextRecognition:
40
41
  module_name: text_recognition
41
- model_name: PP-OCRv4_mobile_rec
42
+ model_name: PP-OCRv5_server_rec
42
43
  model_dir: null
43
44
  batch_size: 6
44
45
  score_thresh: 0.0
paddlex/configs/pipelines/PP-ChatOCRv3-doc.yaml CHANGED
@@ -99,9 +99,10 @@ SubPipelines:
99
99
  model_dir: null
100
100
  limit_side_len: 960
101
101
  limit_type: max
102
+ max_side_limit: 4000
102
103
  thresh: 0.3
103
104
  box_thresh: 0.6
104
- unclip_ratio: 2.0
105
+ unclip_ratio: 1.5
105
106
 
106
107
  TextRecognition:
107
108
  module_name: text_recognition
@@ -138,6 +139,7 @@ SubPipelines:
138
139
  model_dir: null
139
140
  limit_side_len: 736
140
141
  limit_type: min
142
+ max_side_limit: 4000
141
143
  thresh: 0.2
142
144
  box_thresh: 0.6
143
145
  unclip_ratio: 0.5