paddlex 3.0.0rc1__py3-none-any.whl → 3.0.1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- paddlex/.version +1 -1
- paddlex/__init__.py +1 -1
- paddlex/configs/modules/chart_parsing/PP-Chart2Table.yaml +13 -0
- paddlex/configs/modules/doc_vlm/PP-DocBee2-3B.yaml +14 -0
- paddlex/configs/modules/formula_recognition/PP-FormulaNet_plus-L.yaml +40 -0
- paddlex/configs/modules/formula_recognition/PP-FormulaNet_plus-M.yaml +40 -0
- paddlex/configs/modules/formula_recognition/PP-FormulaNet_plus-S.yaml +40 -0
- paddlex/configs/modules/layout_detection/PP-DocBlockLayout.yaml +40 -0
- paddlex/configs/modules/layout_detection/PP-DocLayout-L.yaml +2 -2
- paddlex/configs/modules/layout_detection/PP-DocLayout-M.yaml +2 -2
- paddlex/configs/modules/layout_detection/PP-DocLayout-S.yaml +2 -2
- paddlex/configs/modules/layout_detection/PP-DocLayout_plus-L.yaml +40 -0
- paddlex/configs/modules/text_detection/PP-OCRv5_mobile_det.yaml +40 -0
- paddlex/configs/modules/text_detection/PP-OCRv5_server_det.yaml +40 -0
- paddlex/configs/modules/text_recognition/PP-OCRv5_mobile_rec.yaml +39 -0
- paddlex/configs/modules/text_recognition/PP-OCRv5_server_rec.yaml +39 -0
- paddlex/configs/modules/textline_orientation/PP-LCNet_x1_0_textline_ori.yaml +41 -0
- paddlex/configs/pipelines/OCR.yaml +7 -6
- paddlex/configs/pipelines/PP-ChatOCRv3-doc.yaml +3 -1
- paddlex/configs/pipelines/PP-ChatOCRv4-doc.yaml +91 -34
- paddlex/configs/pipelines/PP-StructureV3.yaml +72 -72
- paddlex/configs/pipelines/doc_understanding.yaml +1 -1
- paddlex/configs/pipelines/formula_recognition.yaml +2 -2
- paddlex/configs/pipelines/layout_parsing.yaml +3 -2
- paddlex/configs/pipelines/seal_recognition.yaml +1 -0
- paddlex/configs/pipelines/table_recognition.yaml +2 -1
- paddlex/configs/pipelines/table_recognition_v2.yaml +7 -1
- paddlex/hpip_links.html +20 -20
- paddlex/inference/common/batch_sampler/doc_vlm_batch_sampler.py +33 -10
- paddlex/inference/common/batch_sampler/image_batch_sampler.py +34 -25
- paddlex/inference/common/result/mixin.py +19 -12
- paddlex/inference/models/base/predictor/base_predictor.py +2 -8
- paddlex/inference/models/common/static_infer.py +11 -59
- paddlex/inference/models/common/tokenizer/__init__.py +2 -0
- paddlex/inference/models/common/tokenizer/clip_tokenizer.py +1 -1
- paddlex/inference/models/common/tokenizer/gpt_tokenizer.py +2 -2
- paddlex/inference/models/common/tokenizer/qwen2_5_tokenizer.py +112 -0
- paddlex/inference/models/common/tokenizer/qwen2_tokenizer.py +7 -1
- paddlex/inference/models/common/tokenizer/qwen_tokenizer.py +288 -0
- paddlex/inference/models/common/tokenizer/tokenizer_utils.py +13 -13
- paddlex/inference/models/common/tokenizer/tokenizer_utils_base.py +3 -3
- paddlex/inference/models/common/tokenizer/vocab.py +7 -7
- paddlex/inference/models/common/vlm/conversion_utils.py +99 -0
- paddlex/inference/models/common/vlm/fusion_ops.py +205 -0
- paddlex/inference/models/common/vlm/generation/configuration_utils.py +1 -1
- paddlex/inference/models/common/vlm/generation/logits_process.py +1 -1
- paddlex/inference/models/common/vlm/generation/utils.py +1 -1
- paddlex/inference/models/common/vlm/transformers/configuration_utils.py +3 -3
- paddlex/inference/models/common/vlm/transformers/conversion_utils.py +3 -3
- paddlex/inference/models/common/vlm/transformers/model_outputs.py +2 -2
- paddlex/inference/models/common/vlm/transformers/model_utils.py +7 -31
- paddlex/inference/models/doc_vlm/modeling/GOT_ocr_2_0.py +830 -0
- paddlex/inference/models/doc_vlm/modeling/__init__.py +2 -0
- paddlex/inference/models/doc_vlm/modeling/qwen2.py +1606 -0
- paddlex/inference/models/doc_vlm/modeling/qwen2_5_vl.py +3006 -0
- paddlex/inference/models/doc_vlm/modeling/qwen2_vl.py +0 -105
- paddlex/inference/models/doc_vlm/predictor.py +79 -24
- paddlex/inference/models/doc_vlm/processors/GOT_ocr_2_0.py +97 -0
- paddlex/inference/models/doc_vlm/processors/__init__.py +2 -0
- paddlex/inference/models/doc_vlm/processors/common.py +189 -0
- paddlex/inference/models/doc_vlm/processors/qwen2_5_vl.py +548 -0
- paddlex/inference/models/doc_vlm/processors/qwen2_vl.py +21 -176
- paddlex/inference/models/formula_recognition/predictor.py +7 -1
- paddlex/inference/models/formula_recognition/processors.py +92 -79
- paddlex/inference/models/formula_recognition/result.py +28 -27
- paddlex/inference/models/image_feature/processors.py +3 -4
- paddlex/inference/models/keypoint_detection/predictor.py +3 -0
- paddlex/inference/models/object_detection/predictor.py +2 -0
- paddlex/inference/models/object_detection/processors.py +28 -3
- paddlex/inference/models/object_detection/utils.py +2 -0
- paddlex/inference/models/table_structure_recognition/result.py +0 -10
- paddlex/inference/models/text_detection/predictor.py +8 -0
- paddlex/inference/models/text_detection/processors.py +44 -10
- paddlex/inference/models/text_detection/result.py +0 -10
- paddlex/inference/pipelines/__init__.py +9 -5
- paddlex/inference/pipelines/_parallel.py +172 -0
- paddlex/inference/pipelines/anomaly_detection/pipeline.py +16 -6
- paddlex/inference/pipelines/attribute_recognition/pipeline.py +11 -1
- paddlex/inference/pipelines/base.py +14 -4
- paddlex/inference/pipelines/components/faisser.py +1 -1
- paddlex/inference/pipelines/doc_preprocessor/pipeline.py +53 -27
- paddlex/inference/pipelines/formula_recognition/pipeline.py +120 -82
- paddlex/inference/pipelines/formula_recognition/result.py +1 -11
- paddlex/inference/pipelines/image_classification/pipeline.py +16 -6
- paddlex/inference/pipelines/image_multilabel_classification/pipeline.py +16 -6
- paddlex/inference/pipelines/instance_segmentation/pipeline.py +16 -6
- paddlex/inference/pipelines/keypoint_detection/pipeline.py +16 -6
- paddlex/inference/pipelines/layout_parsing/pipeline.py +34 -47
- paddlex/inference/pipelines/layout_parsing/pipeline_v2.py +893 -260
- paddlex/inference/pipelines/layout_parsing/result.py +4 -17
- paddlex/inference/pipelines/layout_parsing/result_v2.py +523 -245
- paddlex/inference/pipelines/layout_parsing/setting.py +87 -0
- paddlex/inference/pipelines/layout_parsing/utils.py +565 -1998
- paddlex/inference/pipelines/layout_parsing/xycut_enhanced/__init__.py +16 -0
- paddlex/inference/pipelines/layout_parsing/xycut_enhanced/utils.py +1144 -0
- paddlex/inference/pipelines/layout_parsing/xycut_enhanced/xycuts.py +563 -0
- paddlex/inference/pipelines/m_3d_bev_detection/pipeline.py +2 -2
- paddlex/inference/pipelines/multilingual_speech_recognition/pipeline.py +2 -2
- paddlex/inference/pipelines/object_detection/pipeline.py +16 -6
- paddlex/inference/pipelines/ocr/pipeline.py +127 -70
- paddlex/inference/pipelines/ocr/result.py +19 -16
- paddlex/inference/pipelines/open_vocabulary_detection/pipeline.py +2 -2
- paddlex/inference/pipelines/open_vocabulary_segmentation/pipeline.py +2 -2
- paddlex/inference/pipelines/pp_chatocr/pipeline_base.py +2 -2
- paddlex/inference/pipelines/pp_chatocr/pipeline_v3.py +2 -5
- paddlex/inference/pipelines/pp_chatocr/pipeline_v4.py +5 -5
- paddlex/inference/pipelines/rotated_object_detection/pipeline.py +16 -6
- paddlex/inference/pipelines/seal_recognition/pipeline.py +109 -53
- paddlex/inference/pipelines/semantic_segmentation/pipeline.py +16 -6
- paddlex/inference/pipelines/small_object_detection/pipeline.py +16 -6
- paddlex/inference/pipelines/table_recognition/pipeline.py +26 -18
- paddlex/inference/pipelines/table_recognition/pipeline_v2.py +624 -53
- paddlex/inference/pipelines/table_recognition/result.py +1 -1
- paddlex/inference/pipelines/table_recognition/table_recognition_post_processing_v2.py +9 -5
- paddlex/inference/pipelines/ts_anomaly_detection/pipeline.py +2 -2
- paddlex/inference/pipelines/ts_classification/pipeline.py +2 -2
- paddlex/inference/pipelines/ts_forecasting/pipeline.py +2 -2
- paddlex/inference/pipelines/video_classification/pipeline.py +2 -2
- paddlex/inference/pipelines/video_detection/pipeline.py +2 -2
- paddlex/inference/serving/basic_serving/_pipeline_apps/_common/common.py +5 -1
- paddlex/inference/serving/basic_serving/_pipeline_apps/layout_parsing.py +0 -1
- paddlex/inference/serving/basic_serving/_pipeline_apps/pp_chatocrv3_doc.py +0 -1
- paddlex/inference/serving/basic_serving/_pipeline_apps/pp_chatocrv4_doc.py +1 -1
- paddlex/inference/serving/basic_serving/_pipeline_apps/pp_structurev3.py +6 -2
- paddlex/inference/serving/basic_serving/_pipeline_apps/table_recognition.py +1 -5
- paddlex/inference/serving/basic_serving/_pipeline_apps/table_recognition_v2.py +4 -5
- paddlex/inference/serving/infra/utils.py +20 -22
- paddlex/inference/serving/schemas/formula_recognition.py +1 -1
- paddlex/inference/serving/schemas/layout_parsing.py +1 -2
- paddlex/inference/serving/schemas/pp_chatocrv3_doc.py +1 -2
- paddlex/inference/serving/schemas/pp_chatocrv4_doc.py +2 -2
- paddlex/inference/serving/schemas/pp_structurev3.py +10 -6
- paddlex/inference/serving/schemas/seal_recognition.py +1 -1
- paddlex/inference/serving/schemas/table_recognition.py +2 -6
- paddlex/inference/serving/schemas/table_recognition_v2.py +5 -6
- paddlex/inference/utils/hpi.py +8 -1
- paddlex/inference/utils/hpi_model_info_collection.json +81 -2
- paddlex/inference/utils/io/readers.py +12 -12
- paddlex/inference/utils/mkldnn_blocklist.py +25 -0
- paddlex/inference/utils/official_models.py +14 -0
- paddlex/inference/utils/pp_option.py +29 -8
- paddlex/model.py +2 -2
- paddlex/modules/__init__.py +1 -1
- paddlex/modules/anomaly_detection/evaluator.py +2 -2
- paddlex/modules/base/__init__.py +1 -1
- paddlex/modules/base/evaluator.py +5 -5
- paddlex/modules/base/trainer.py +1 -1
- paddlex/modules/doc_vlm/dataset_checker.py +2 -2
- paddlex/modules/doc_vlm/evaluator.py +2 -2
- paddlex/modules/doc_vlm/exportor.py +2 -2
- paddlex/modules/doc_vlm/model_list.py +1 -1
- paddlex/modules/doc_vlm/trainer.py +2 -2
- paddlex/modules/face_recognition/evaluator.py +2 -2
- paddlex/modules/formula_recognition/evaluator.py +5 -2
- paddlex/modules/formula_recognition/model_list.py +3 -0
- paddlex/modules/formula_recognition/trainer.py +3 -0
- paddlex/modules/general_recognition/evaluator.py +1 -1
- paddlex/modules/image_classification/evaluator.py +2 -2
- paddlex/modules/image_classification/model_list.py +1 -0
- paddlex/modules/instance_segmentation/evaluator.py +1 -1
- paddlex/modules/keypoint_detection/evaluator.py +1 -1
- paddlex/modules/m_3d_bev_detection/evaluator.py +2 -2
- paddlex/modules/multilabel_classification/evaluator.py +2 -2
- paddlex/modules/object_detection/dataset_checker/dataset_src/convert_dataset.py +4 -4
- paddlex/modules/object_detection/evaluator.py +2 -2
- paddlex/modules/object_detection/model_list.py +2 -0
- paddlex/modules/semantic_segmentation/evaluator.py +2 -2
- paddlex/modules/table_recognition/evaluator.py +2 -2
- paddlex/modules/text_detection/evaluator.py +2 -2
- paddlex/modules/text_detection/model_list.py +2 -0
- paddlex/modules/text_recognition/evaluator.py +2 -2
- paddlex/modules/text_recognition/model_list.py +2 -0
- paddlex/modules/ts_anomaly_detection/evaluator.py +2 -2
- paddlex/modules/ts_classification/dataset_checker/dataset_src/split_dataset.py +1 -1
- paddlex/modules/ts_classification/evaluator.py +2 -2
- paddlex/modules/ts_forecast/evaluator.py +2 -2
- paddlex/modules/video_classification/evaluator.py +2 -2
- paddlex/modules/video_detection/evaluator.py +2 -2
- paddlex/ops/__init__.py +2 -2
- paddlex/paddlex_cli.py +19 -13
- paddlex/repo_apis/Paddle3D_api/bev_fusion/model.py +2 -2
- paddlex/repo_apis/PaddleClas_api/cls/config.py +1 -1
- paddlex/repo_apis/PaddleClas_api/cls/model.py +1 -1
- paddlex/repo_apis/PaddleClas_api/cls/register.py +10 -0
- paddlex/repo_apis/PaddleClas_api/cls/runner.py +1 -1
- paddlex/repo_apis/PaddleDetection_api/instance_seg/model.py +1 -1
- paddlex/repo_apis/PaddleDetection_api/instance_seg/runner.py +1 -1
- paddlex/repo_apis/PaddleDetection_api/object_det/config.py +1 -1
- paddlex/repo_apis/PaddleDetection_api/object_det/model.py +1 -1
- paddlex/repo_apis/PaddleDetection_api/object_det/official_categories.py +25 -0
- paddlex/repo_apis/PaddleDetection_api/object_det/register.py +30 -0
- paddlex/repo_apis/PaddleDetection_api/object_det/runner.py +1 -1
- paddlex/repo_apis/PaddleOCR_api/formula_rec/config.py +3 -3
- paddlex/repo_apis/PaddleOCR_api/formula_rec/model.py +5 -9
- paddlex/repo_apis/PaddleOCR_api/formula_rec/register.py +27 -0
- paddlex/repo_apis/PaddleOCR_api/formula_rec/runner.py +1 -1
- paddlex/repo_apis/PaddleOCR_api/table_rec/model.py +1 -1
- paddlex/repo_apis/PaddleOCR_api/table_rec/runner.py +1 -1
- paddlex/repo_apis/PaddleOCR_api/text_det/model.py +1 -1
- paddlex/repo_apis/PaddleOCR_api/text_det/register.py +18 -0
- paddlex/repo_apis/PaddleOCR_api/text_det/runner.py +1 -1
- paddlex/repo_apis/PaddleOCR_api/text_rec/config.py +3 -3
- paddlex/repo_apis/PaddleOCR_api/text_rec/model.py +5 -9
- paddlex/repo_apis/PaddleOCR_api/text_rec/register.py +18 -0
- paddlex/repo_apis/PaddleOCR_api/text_rec/runner.py +1 -1
- paddlex/repo_apis/PaddleSeg_api/seg/model.py +1 -1
- paddlex/repo_apis/PaddleSeg_api/seg/runner.py +1 -1
- paddlex/repo_apis/PaddleTS_api/ts_ad/config.py +3 -3
- paddlex/repo_apis/PaddleTS_api/ts_cls/config.py +2 -2
- paddlex/repo_apis/PaddleTS_api/ts_fc/config.py +4 -4
- paddlex/repo_apis/PaddleVideo_api/video_cls/config.py +1 -1
- paddlex/repo_apis/PaddleVideo_api/video_cls/model.py +1 -1
- paddlex/repo_apis/PaddleVideo_api/video_cls/runner.py +1 -1
- paddlex/repo_apis/PaddleVideo_api/video_det/config.py +1 -1
- paddlex/repo_apis/PaddleVideo_api/video_det/model.py +1 -1
- paddlex/repo_apis/PaddleVideo_api/video_det/runner.py +1 -1
- paddlex/repo_apis/base/config.py +1 -1
- paddlex/repo_manager/core.py +3 -3
- paddlex/repo_manager/meta.py +6 -2
- paddlex/repo_manager/repo.py +17 -16
- paddlex/utils/custom_device_list.py +26 -2
- paddlex/utils/deps.py +1 -1
- paddlex/utils/device.py +15 -8
- paddlex/utils/env.py +4 -0
- paddlex/utils/flags.py +2 -4
- paddlex/utils/fonts/__init__.py +34 -4
- paddlex/utils/misc.py +1 -1
- {paddlex-3.0.0rc1.dist-info → paddlex-3.0.1.dist-info}/METADATA +52 -56
- {paddlex-3.0.0rc1.dist-info → paddlex-3.0.1.dist-info}/RECORD +233 -206
- {paddlex-3.0.0rc1.dist-info → paddlex-3.0.1.dist-info}/WHEEL +1 -1
- {paddlex-3.0.0rc1.dist-info → paddlex-3.0.1.dist-info}/entry_points.txt +0 -0
- {paddlex-3.0.0rc1.dist-info → paddlex-3.0.1.dist-info}/licenses/LICENSE +0 -0
- {paddlex-3.0.0rc1.dist-info → paddlex-3.0.1.dist-info}/top_level.txt +0 -0
paddlex/.version
CHANGED
@@ -1 +1 @@
|
|
1
|
-
3.0.0rc1
|
1
|
+
3.0.1
|
paddlex/__init__.py
CHANGED
@@ -24,7 +24,7 @@ for mod in _SPECIAL_MODS:
|
|
24
24
|
from . import version
|
25
25
|
from .inference import create_pipeline, create_predictor
|
26
26
|
from .model import create_model
|
27
|
-
from .modules import build_dataset_checker,
|
27
|
+
from .modules import build_dataset_checker, build_evaluator, build_trainer
|
28
28
|
|
29
29
|
|
30
30
|
def _initialize():
|
@@ -0,0 +1,13 @@
|
|
1
|
+
Global:
|
2
|
+
model: PP-Chart2Table
|
3
|
+
mode: predict # only support predict
|
4
|
+
device: gpu:0
|
5
|
+
output: "output"
|
6
|
+
|
7
|
+
Predict:
|
8
|
+
batch_size: 1
|
9
|
+
model_dir: "/path/to/PP-Chart2Table"
|
10
|
+
input:
|
11
|
+
image: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/chart_parsing_02.png"
|
12
|
+
kernel_option:
|
13
|
+
run_mode: paddle
|
@@ -0,0 +1,14 @@
|
|
1
|
+
Global:
|
2
|
+
model: PP-DocBee2-3B
|
3
|
+
mode: predict # only support predict
|
4
|
+
device: gpu:0
|
5
|
+
output: "output"
|
6
|
+
|
7
|
+
Predict:
|
8
|
+
batch_size: 1
|
9
|
+
model_dir: "/path/to/PP-DocBee2-3B"
|
10
|
+
input:
|
11
|
+
image: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/medal_table.png"
|
12
|
+
query: "识别这份表格的内容, 以markdown格式输出"
|
13
|
+
kernel_option:
|
14
|
+
run_mode: paddle
|
@@ -0,0 +1,40 @@
|
|
1
|
+
Global:
|
2
|
+
model: PP-FormulaNet_plus-L
|
3
|
+
mode: check_dataset # check_dataset/train/evaluate/predict
|
4
|
+
dataset_dir: "./dataset/ocr_rec_latexocr_dataset_example"
|
5
|
+
device: gpu:0,1,2,3
|
6
|
+
output: "output"
|
7
|
+
|
8
|
+
CheckDataset:
|
9
|
+
convert:
|
10
|
+
enable: False
|
11
|
+
src_dataset_type: FormulaRecDataset
|
12
|
+
split:
|
13
|
+
enable: False
|
14
|
+
train_percent: null
|
15
|
+
val_percent: null
|
16
|
+
|
17
|
+
Train:
|
18
|
+
epochs_iters: 20
|
19
|
+
batch_size: 3
|
20
|
+
learning_rate: 0.0001
|
21
|
+
pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-FormulaNet_plus-L_pretrained.pdparams
|
22
|
+
resume_path: null
|
23
|
+
log_interval: 20
|
24
|
+
eval_interval: 1
|
25
|
+
save_interval: 1
|
26
|
+
|
27
|
+
Evaluate:
|
28
|
+
batch_size: 3
|
29
|
+
weight_path: output/best_accuracy/best_accuracy.pdparams
|
30
|
+
log_interval: 1
|
31
|
+
|
32
|
+
Export:
|
33
|
+
weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-FormulaNet_plus-L_pretrained.pdparams
|
34
|
+
|
35
|
+
Predict:
|
36
|
+
batch_size: 1
|
37
|
+
model_dir: "output/best_accuracy/inference"
|
38
|
+
input: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/general_formula_rec_001.png"
|
39
|
+
kernel_option:
|
40
|
+
run_mode: paddle
|
@@ -0,0 +1,40 @@
|
|
1
|
+
Global:
|
2
|
+
model: PP-FormulaNet_plus-M
|
3
|
+
mode: check_dataset # check_dataset/train/evaluate/predict
|
4
|
+
dataset_dir: "./dataset/ocr_rec_latexocr_dataset_example"
|
5
|
+
device: gpu:0,1,2,3
|
6
|
+
output: "output"
|
7
|
+
|
8
|
+
CheckDataset:
|
9
|
+
convert:
|
10
|
+
enable: False
|
11
|
+
src_dataset_type: FormulaRecDataset
|
12
|
+
split:
|
13
|
+
enable: False
|
14
|
+
train_percent: null
|
15
|
+
val_percent: null
|
16
|
+
|
17
|
+
Train:
|
18
|
+
epochs_iters: 20
|
19
|
+
batch_size: 14
|
20
|
+
learning_rate: 0.0001
|
21
|
+
pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-FormulaNet_plus-M_pretrained.pdparams
|
22
|
+
resume_path: null
|
23
|
+
log_interval: 20
|
24
|
+
eval_interval: 1
|
25
|
+
save_interval: 1
|
26
|
+
|
27
|
+
Evaluate:
|
28
|
+
batch_size: 20
|
29
|
+
weight_path: output/best_accuracy/best_accuracy.pdparams
|
30
|
+
log_interval: 1
|
31
|
+
|
32
|
+
Export:
|
33
|
+
weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-FormulaNet_plus-M_pretrained.pdparams
|
34
|
+
|
35
|
+
Predict:
|
36
|
+
batch_size: 1
|
37
|
+
model_dir: "output/best_accuracy/inference"
|
38
|
+
input: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/general_formula_rec_001.png"
|
39
|
+
kernel_option:
|
40
|
+
run_mode: paddle
|
@@ -0,0 +1,40 @@
|
|
1
|
+
Global:
|
2
|
+
model: PP-FormulaNet_plus-S
|
3
|
+
mode: check_dataset # check_dataset/train/evaluate/predict
|
4
|
+
dataset_dir: "./dataset/ocr_rec_latexocr_dataset_example"
|
5
|
+
device: gpu:0,1,2,3
|
6
|
+
output: "output"
|
7
|
+
|
8
|
+
CheckDataset:
|
9
|
+
convert:
|
10
|
+
enable: False
|
11
|
+
src_dataset_type: FormulaRecDataset
|
12
|
+
split:
|
13
|
+
enable: False
|
14
|
+
train_percent: null
|
15
|
+
val_percent: null
|
16
|
+
|
17
|
+
Train:
|
18
|
+
epochs_iters: 20
|
19
|
+
batch_size: 14
|
20
|
+
learning_rate: 0.0001
|
21
|
+
pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-FormulaNet_plus-S_pretrained.pdparams
|
22
|
+
resume_path: null
|
23
|
+
log_interval: 20
|
24
|
+
eval_interval: 1
|
25
|
+
save_interval: 1
|
26
|
+
|
27
|
+
Evaluate:
|
28
|
+
batch_size: 20
|
29
|
+
weight_path: output/best_accuracy/best_accuracy.pdparams
|
30
|
+
log_interval: 1
|
31
|
+
|
32
|
+
Export:
|
33
|
+
weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-FormulaNet_plus-S_pretrained.pdparams
|
34
|
+
|
35
|
+
Predict:
|
36
|
+
batch_size: 1
|
37
|
+
model_dir: "output/best_accuracy/inference"
|
38
|
+
input: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/general_formula_rec_001.png"
|
39
|
+
kernel_option:
|
40
|
+
run_mode: paddle
|
@@ -0,0 +1,40 @@
|
|
1
|
+
Global:
|
2
|
+
model: PP-DocBlockLayout
|
3
|
+
mode: check_dataset # check_dataset/train/evaluate/predict
|
4
|
+
dataset_dir: "/paddle/dataset/paddlex/layout/det_layout_examples"
|
5
|
+
device: gpu:0,1,2,3
|
6
|
+
output: "output"
|
7
|
+
|
8
|
+
CheckDataset:
|
9
|
+
convert:
|
10
|
+
enable: False
|
11
|
+
src_dataset_type: null
|
12
|
+
split:
|
13
|
+
enable: False
|
14
|
+
train_percent: null
|
15
|
+
val_percent: null
|
16
|
+
|
17
|
+
Train:
|
18
|
+
num_classes: 11
|
19
|
+
epochs_iters: 100
|
20
|
+
batch_size: 1
|
21
|
+
learning_rate: 0.0001
|
22
|
+
pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocBlockLayout_pretrained.pdparams
|
23
|
+
warmup_steps: 100
|
24
|
+
resume_path: null
|
25
|
+
log_interval: 10
|
26
|
+
eval_interval: 1
|
27
|
+
|
28
|
+
Evaluate:
|
29
|
+
weight_path: "output/best_model/best_model.pdparams"
|
30
|
+
log_interval: 10
|
31
|
+
|
32
|
+
Export:
|
33
|
+
weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocBlockLayout_pretrained.pdparams
|
34
|
+
|
35
|
+
Predict:
|
36
|
+
batch_size: 1
|
37
|
+
model_dir: "output/best_model/inference"
|
38
|
+
input: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/layout.jpg"
|
39
|
+
kernel_option:
|
40
|
+
run_mode: paddle
|
@@ -19,7 +19,7 @@ Train:
|
|
19
19
|
epochs_iters: 100
|
20
20
|
batch_size: 1
|
21
21
|
learning_rate: 0.0001
|
22
|
-
pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-
|
22
|
+
pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-L_pretrained.pdparams
|
23
23
|
warmup_steps: 100
|
24
24
|
resume_path: null
|
25
25
|
log_interval: 10
|
@@ -30,7 +30,7 @@ Evaluate:
|
|
30
30
|
log_interval: 10
|
31
31
|
|
32
32
|
Export:
|
33
|
-
weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-
|
33
|
+
weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-L_pretrained.pdparams
|
34
34
|
|
35
35
|
Predict:
|
36
36
|
batch_size: 1
|
@@ -19,7 +19,7 @@ Train:
|
|
19
19
|
epochs_iters: 100
|
20
20
|
batch_size: 1
|
21
21
|
learning_rate: 0.0001
|
22
|
-
pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-
|
22
|
+
pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-M_pretrained.pdparams
|
23
23
|
warmup_steps: 100
|
24
24
|
resume_path: null
|
25
25
|
log_interval: 10
|
@@ -30,7 +30,7 @@ Evaluate:
|
|
30
30
|
log_interval: 10
|
31
31
|
|
32
32
|
Export:
|
33
|
-
weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-
|
33
|
+
weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-M_pretrained.pdparams
|
34
34
|
|
35
35
|
Predict:
|
36
36
|
batch_size: 1
|
@@ -19,7 +19,7 @@ Train:
|
|
19
19
|
epochs_iters: 100
|
20
20
|
batch_size: 1
|
21
21
|
learning_rate: 0.0001
|
22
|
-
pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-
|
22
|
+
pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-S_pretrained.pdparams
|
23
23
|
warmup_steps: 100
|
24
24
|
resume_path: null
|
25
25
|
log_interval: 10
|
@@ -30,7 +30,7 @@ Evaluate:
|
|
30
30
|
log_interval: 10
|
31
31
|
|
32
32
|
Export:
|
33
|
-
weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-
|
33
|
+
weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout-S_pretrained.pdparams
|
34
34
|
|
35
35
|
Predict:
|
36
36
|
batch_size: 1
|
@@ -0,0 +1,40 @@
|
|
1
|
+
Global:
|
2
|
+
model: PP-DocLayout_plus-L
|
3
|
+
mode: check_dataset # check_dataset/train/evaluate/predict
|
4
|
+
dataset_dir: "/paddle/dataset/paddlex/layout/det_layout_examples"
|
5
|
+
device: gpu:0,1,2,3
|
6
|
+
output: "output"
|
7
|
+
|
8
|
+
CheckDataset:
|
9
|
+
convert:
|
10
|
+
enable: False
|
11
|
+
src_dataset_type: null
|
12
|
+
split:
|
13
|
+
enable: False
|
14
|
+
train_percent: null
|
15
|
+
val_percent: null
|
16
|
+
|
17
|
+
Train:
|
18
|
+
num_classes: 11
|
19
|
+
epochs_iters: 100
|
20
|
+
batch_size: 1
|
21
|
+
learning_rate: 0.0001
|
22
|
+
pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout_plus-L_pretrained.pdparams
|
23
|
+
warmup_steps: 100
|
24
|
+
resume_path: null
|
25
|
+
log_interval: 10
|
26
|
+
eval_interval: 1
|
27
|
+
|
28
|
+
Evaluate:
|
29
|
+
weight_path: "output/best_model/best_model.pdparams"
|
30
|
+
log_interval: 10
|
31
|
+
|
32
|
+
Export:
|
33
|
+
weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayout_plus-L_pretrained.pdparams
|
34
|
+
|
35
|
+
Predict:
|
36
|
+
batch_size: 1
|
37
|
+
model_dir: "output/best_model/inference"
|
38
|
+
input: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/layout.jpg"
|
39
|
+
kernel_option:
|
40
|
+
run_mode: paddle
|
@@ -0,0 +1,40 @@
|
|
1
|
+
Global:
|
2
|
+
model: PP-OCRv5_mobile_det
|
3
|
+
mode: check_dataset # check_dataset/train/evaluate/predict
|
4
|
+
module: text_det
|
5
|
+
dataset_dir: "/paddle/dataset/paddlex/ocr_det/ocr_det_dataset_examples"
|
6
|
+
device: gpu:0,1,2,3
|
7
|
+
output: "output"
|
8
|
+
|
9
|
+
CheckDataset:
|
10
|
+
convert:
|
11
|
+
enable: False
|
12
|
+
src_dataset_type: null
|
13
|
+
split:
|
14
|
+
enable: False
|
15
|
+
train_percent: null
|
16
|
+
val_percent: null
|
17
|
+
|
18
|
+
Train:
|
19
|
+
epochs_iters: 100
|
20
|
+
batch_size: 4
|
21
|
+
learning_rate: 0.001
|
22
|
+
pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-OCRv5_mobile_det_pretrained.pdparams
|
23
|
+
resume_path: null
|
24
|
+
log_interval: 10
|
25
|
+
eval_interval: 1
|
26
|
+
save_interval: 1
|
27
|
+
|
28
|
+
Evaluate:
|
29
|
+
weight_path: "output/best_accuracy/best_accuracy.pdparams"
|
30
|
+
log_interval: 1
|
31
|
+
|
32
|
+
Export:
|
33
|
+
weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-OCRv5_mobile_det_pretrained.pdparams
|
34
|
+
|
35
|
+
Predict:
|
36
|
+
batch_size: 1
|
37
|
+
model_dir: "output/best_accuracy/inference"
|
38
|
+
input: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/general_ocr_001.png"
|
39
|
+
kernel_option:
|
40
|
+
run_mode: paddle
|
@@ -0,0 +1,40 @@
|
|
1
|
+
Global:
|
2
|
+
model: PP-OCRv5_server_det
|
3
|
+
mode: check_dataset # check_dataset/train/evaluate/predict
|
4
|
+
module: text_det
|
5
|
+
dataset_dir: "/paddle/dataset/paddlex/ocr_det/ocr_det_dataset_examples"
|
6
|
+
device: gpu:0,1,2,3
|
7
|
+
output: "output"
|
8
|
+
|
9
|
+
CheckDataset:
|
10
|
+
convert:
|
11
|
+
enable: False
|
12
|
+
src_dataset_type: null
|
13
|
+
split:
|
14
|
+
enable: False
|
15
|
+
train_percent: null
|
16
|
+
val_percent: null
|
17
|
+
|
18
|
+
Train:
|
19
|
+
epochs_iters: 100
|
20
|
+
batch_size: 4
|
21
|
+
learning_rate: 0.001
|
22
|
+
pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-OCRv5_server_det_pretrained.pdparams
|
23
|
+
resume_path: null
|
24
|
+
log_interval: 10
|
25
|
+
eval_interval: 1
|
26
|
+
save_interval: 1
|
27
|
+
|
28
|
+
Evaluate:
|
29
|
+
weight_path: "output/best_accuracy/best_accuracy.pdparams"
|
30
|
+
log_interval: 1
|
31
|
+
|
32
|
+
Export:
|
33
|
+
weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-OCRv5_server_det_pretrained.pdparams
|
34
|
+
|
35
|
+
Predict:
|
36
|
+
batch_size: 1
|
37
|
+
model_dir: "output/best_accuracy/inference"
|
38
|
+
input: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/general_ocr_001.png"
|
39
|
+
kernel_option:
|
40
|
+
run_mode: paddle
|
@@ -0,0 +1,39 @@
|
|
1
|
+
Global:
|
2
|
+
model: PP-OCRv5_mobile_rec
|
3
|
+
mode: check_dataset # check_dataset/train/evaluate/predict
|
4
|
+
dataset_dir: "/paddle/dataset/paddlex/ocr_rec/ocr_rec_dataset_examples"
|
5
|
+
device: gpu:0,1,2,3
|
6
|
+
output: "output"
|
7
|
+
|
8
|
+
CheckDataset:
|
9
|
+
convert:
|
10
|
+
enable: False
|
11
|
+
src_dataset_type: null
|
12
|
+
split:
|
13
|
+
enable: False
|
14
|
+
train_percent: null
|
15
|
+
val_percent: null
|
16
|
+
|
17
|
+
Train:
|
18
|
+
epochs_iters: 20
|
19
|
+
batch_size: 8
|
20
|
+
learning_rate: 0.001
|
21
|
+
pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-OCRv5_mobile_rec_pretrained.pdparams
|
22
|
+
resume_path: null
|
23
|
+
log_interval: 20
|
24
|
+
eval_interval: 1
|
25
|
+
save_interval: 1
|
26
|
+
|
27
|
+
Evaluate:
|
28
|
+
weight_path: "output/best_accuracy/best_accuracy.pdparams"
|
29
|
+
log_interval: 1
|
30
|
+
|
31
|
+
Export:
|
32
|
+
weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-OCRv5_mobile_rec_pretrained.pdparams
|
33
|
+
|
34
|
+
Predict:
|
35
|
+
batch_size: 1
|
36
|
+
model_dir: "output/best_accuracy/inference"
|
37
|
+
input: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/general_ocr_rec_001.png"
|
38
|
+
kernel_option:
|
39
|
+
run_mode: paddle
|
@@ -0,0 +1,39 @@
|
|
1
|
+
Global:
|
2
|
+
model: PP-OCRv5_server_rec
|
3
|
+
mode: check_dataset # check_dataset/train/evaluate/predict
|
4
|
+
dataset_dir: "/paddle/dataset/paddlex/ocr_rec/ocr_rec_dataset_examples"
|
5
|
+
device: gpu:0,1,2,3
|
6
|
+
output: "output"
|
7
|
+
|
8
|
+
CheckDataset:
|
9
|
+
convert:
|
10
|
+
enable: False
|
11
|
+
src_dataset_type: null
|
12
|
+
split:
|
13
|
+
enable: False
|
14
|
+
train_percent: null
|
15
|
+
val_percent: null
|
16
|
+
|
17
|
+
Train:
|
18
|
+
epochs_iters: 20
|
19
|
+
batch_size: 8
|
20
|
+
learning_rate: 0.001
|
21
|
+
pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-OCRv5_server_rec_pretrained.pdparams
|
22
|
+
resume_path: null
|
23
|
+
log_interval: 20
|
24
|
+
eval_interval: 1
|
25
|
+
save_interval: 1
|
26
|
+
|
27
|
+
Evaluate:
|
28
|
+
weight_path: "output/best_accuracy/best_accuracy.pdparams"
|
29
|
+
log_interval: 1
|
30
|
+
|
31
|
+
Export:
|
32
|
+
weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-OCRv5_server_rec_pretrained.pdparams
|
33
|
+
|
34
|
+
Predict:
|
35
|
+
batch_size: 1
|
36
|
+
model_dir: "output/best_accuracy/inference"
|
37
|
+
input: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/general_ocr_rec_001.png"
|
38
|
+
kernel_option:
|
39
|
+
run_mode: paddle
|
@@ -0,0 +1,41 @@
|
|
1
|
+
Global:
|
2
|
+
model: PP-LCNet_x1_0_textline_ori
|
3
|
+
mode: check_dataset # check_dataset/train/evaluate/predict
|
4
|
+
dataset_dir: "/paddle/dataset/paddlex/cls/textline_orientation_example_data"
|
5
|
+
device: gpu:0,1,2,3
|
6
|
+
output: "output"
|
7
|
+
|
8
|
+
CheckDataset:
|
9
|
+
convert:
|
10
|
+
enable: False
|
11
|
+
src_dataset_type: null
|
12
|
+
split:
|
13
|
+
enable: False
|
14
|
+
train_percent: null
|
15
|
+
val_percent: null
|
16
|
+
|
17
|
+
Train:
|
18
|
+
num_classes: 2
|
19
|
+
epochs_iters: 20
|
20
|
+
batch_size: 32
|
21
|
+
learning_rate: 0.8
|
22
|
+
pretrain_weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-LCNet_x1_0_textline_ori_pretrained.pdparams
|
23
|
+
warmup_steps: 100
|
24
|
+
resume_path: null
|
25
|
+
log_interval: 10
|
26
|
+
eval_interval: 1
|
27
|
+
save_interval: 1
|
28
|
+
|
29
|
+
Evaluate:
|
30
|
+
weight_path: "output/best_model/best_model.pdparams"
|
31
|
+
log_interval: 10
|
32
|
+
|
33
|
+
Export:
|
34
|
+
weight_path: https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-LCNet_x1_0_textline_ori_pretrained.pdparams
|
35
|
+
|
36
|
+
Predict:
|
37
|
+
batch_size: 1
|
38
|
+
model_dir: "output/best_model/inference"
|
39
|
+
input: "https://paddle-model-ecology.bj.bcebos.com/paddlex/imgs/demo_image/img_textline180_demo.jpg"
|
40
|
+
kernel_option:
|
41
|
+
run_mode: paddle
|
@@ -24,21 +24,22 @@ SubPipelines:
|
|
24
24
|
SubModules:
|
25
25
|
TextDetection:
|
26
26
|
module_name: text_detection
|
27
|
-
model_name: PP-
|
27
|
+
model_name: PP-OCRv5_server_det
|
28
28
|
model_dir: null
|
29
|
-
limit_side_len:
|
30
|
-
limit_type:
|
29
|
+
limit_side_len: 64
|
30
|
+
limit_type: min
|
31
|
+
max_side_limit: 4000
|
31
32
|
thresh: 0.3
|
32
33
|
box_thresh: 0.6
|
33
|
-
unclip_ratio:
|
34
|
+
unclip_ratio: 1.5
|
34
35
|
TextLineOrientation:
|
35
36
|
module_name: textline_orientation
|
36
|
-
model_name: PP-
|
37
|
+
model_name: PP-LCNet_x1_0_textline_ori
|
37
38
|
model_dir: null
|
38
39
|
batch_size: 6
|
39
40
|
TextRecognition:
|
40
41
|
module_name: text_recognition
|
41
|
-
model_name: PP-
|
42
|
+
model_name: PP-OCRv5_server_rec
|
42
43
|
model_dir: null
|
43
44
|
batch_size: 6
|
44
45
|
score_thresh: 0.0
|
@@ -99,9 +99,10 @@ SubPipelines:
|
|
99
99
|
model_dir: null
|
100
100
|
limit_side_len: 960
|
101
101
|
limit_type: max
|
102
|
+
max_side_limit: 4000
|
102
103
|
thresh: 0.3
|
103
104
|
box_thresh: 0.6
|
104
|
-
unclip_ratio:
|
105
|
+
unclip_ratio: 1.5
|
105
106
|
|
106
107
|
TextRecognition:
|
107
108
|
module_name: text_recognition
|
@@ -138,6 +139,7 @@ SubPipelines:
|
|
138
139
|
model_dir: null
|
139
140
|
limit_side_len: 736
|
140
141
|
limit_type: min
|
142
|
+
max_side_limit: 4000
|
141
143
|
thresh: 0.2
|
142
144
|
box_thresh: 0.6
|
143
145
|
unclip_ratio: 0.5
|