mineru 2.6.1__py3-none-any.whl → 2.6.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (36) hide show
  1. mineru/backend/pipeline/batch_analyze.py +20 -43
  2. mineru/backend/pipeline/model_init.py +1 -1
  3. mineru/backend/pipeline/model_json_to_middle_json.py +1 -1
  4. mineru/backend/pipeline/pipeline_middle_json_mkcontent.py +17 -4
  5. mineru/backend/vlm/vlm_analyze.py +11 -1
  6. mineru/backend/vlm/vlm_middle_json_mkcontent.py +6 -3
  7. mineru/cli/client.py +24 -14
  8. mineru/cli/gradio_app.py +4 -1
  9. mineru/cli/models_download.py +1 -1
  10. mineru/model/ocr/{paddleocr2pytorch/pytorch_paddle.py → pytorch_paddle.py} +1 -1
  11. mineru/model/table/rec/RapidTable.py +1 -1
  12. mineru/model/utils/pytorchocr/utils/resources/arch_config.yaml +1 -317
  13. mineru/model/utils/pytorchocr/utils/resources/dict/ppocrv5_latin_dict.txt +545 -211
  14. mineru/model/utils/pytorchocr/utils/resources/models_config.yml +0 -12
  15. mineru/utils/block_sort.py +3 -2
  16. mineru/utils/check_mac_env.py +30 -0
  17. mineru/utils/llm_aided.py +13 -8
  18. mineru/version.py +1 -1
  19. {mineru-2.6.1.dist-info → mineru-2.6.3.dist-info}/METADATA +75 -39
  20. {mineru-2.6.1.dist-info → mineru-2.6.3.dist-info}/RECORD +24 -35
  21. mineru/model/ocr/paddleocr2pytorch/__init__.py +0 -1
  22. mineru/model/utils/pytorchocr/utils/resources/dict/arabic_dict.txt +0 -162
  23. mineru/model/utils/pytorchocr/utils/resources/dict/chinese_cht_dict.txt +0 -8421
  24. mineru/model/utils/pytorchocr/utils/resources/dict/cyrillic_dict.txt +0 -163
  25. mineru/model/utils/pytorchocr/utils/resources/dict/devanagari_dict.txt +0 -167
  26. mineru/model/utils/pytorchocr/utils/resources/dict/en_dict.txt +0 -95
  27. mineru/model/utils/pytorchocr/utils/resources/dict/japan_dict.txt +0 -4399
  28. mineru/model/utils/pytorchocr/utils/resources/dict/korean_dict.txt +0 -3688
  29. mineru/model/utils/pytorchocr/utils/resources/dict/latin_dict.txt +0 -185
  30. mineru/model/utils/pytorchocr/utils/resources/dict/ppocr_keys_v1.txt +0 -6623
  31. mineru/model/utils/pytorchocr/utils/resources/dict/ta_dict.txt +0 -128
  32. mineru/model/utils/pytorchocr/utils/resources/dict/te_dict.txt +0 -151
  33. {mineru-2.6.1.dist-info → mineru-2.6.3.dist-info}/WHEEL +0 -0
  34. {mineru-2.6.1.dist-info → mineru-2.6.3.dist-info}/entry_points.txt +0 -0
  35. {mineru-2.6.1.dist-info → mineru-2.6.3.dist-info}/licenses/LICENSE.md +0 -0
  36. {mineru-2.6.1.dist-info → mineru-2.6.3.dist-info}/top_level.txt +0 -0
@@ -28,82 +28,6 @@ Multilingual_PP-OCRv3_det_infer:
28
28
  name: DBHead
29
29
  k: 50
30
30
 
31
- en_PP-OCRv3_det_infer:
32
- model_type: det
33
- algorithm: DB
34
- Transform:
35
- Backbone:
36
- name: MobileNetV3
37
- scale: 0.5
38
- model_name: large
39
- disable_se: True
40
- Neck:
41
- name: RSEFPN
42
- out_channels: 96
43
- shortcut: True
44
- Head:
45
- name: DBHead
46
- k: 50
47
-
48
- ch_PP-OCRv3_det_infer:
49
- model_type: det
50
- algorithm: DB
51
- Transform:
52
- Backbone:
53
- name: MobileNetV3
54
- scale: 0.5
55
- model_name: large
56
- disable_se: True
57
- Neck:
58
- name: RSEFPN
59
- out_channels: 96
60
- shortcut: True
61
- Head:
62
- name: DBHead
63
- k: 50
64
-
65
- en_PP-OCRv4_rec_infer:
66
- model_type: rec
67
- algorithm: SVTR_LCNet
68
- Transform:
69
- Backbone:
70
- name: PPLCNetV3
71
- scale: 0.95
72
- Head:
73
- name: MultiHead
74
- out_channels_list:
75
- CTCLabelDecode: 97 #'blank' + ...(62) + ' '
76
- head_list:
77
- - CTCHead:
78
- Neck:
79
- name: svtr
80
- dims: 120
81
- depth: 2
82
- hidden_dims: 120
83
- kernel_size: [ 1, 3 ]
84
- use_guide: True
85
- Head:
86
- fc_decay: 0.00001
87
- - NRTRHead:
88
- nrtr_dim: 384
89
- max_text_length: 25
90
-
91
- ch_PP-OCRv4_det_infer:
92
- model_type: det
93
- algorithm: DB
94
- Transform: null
95
- Backbone:
96
- name: PPLCNetV3
97
- scale: 0.75
98
- det: True
99
- Neck:
100
- name: RSEFPN
101
- out_channels: 96
102
- shortcut: True
103
- Head:
104
- name: DBHead
105
- k: 50
106
-
107
31
  ch_PP-OCRv5_det_infer:
108
32
  model_type: det
109
33
  algorithm: DB
@@ -152,57 +76,6 @@ ch_PP-OCRv4_det_server_infer:
152
76
  k: 50
153
77
  mode: "large"
154
78
 
155
- ch_PP-OCRv4_rec_infer:
156
- model_type: rec
157
- algorithm: SVTR_LCNet
158
- Transform:
159
- Backbone:
160
- name: PPLCNetV3
161
- scale: 0.95
162
- Head:
163
- name: MultiHead
164
- out_channels_list:
165
- CTCLabelDecode: 6625 #'blank' + ...(6623) + ' '
166
- head_list:
167
- - CTCHead:
168
- Neck:
169
- name: svtr
170
- dims: 120
171
- depth: 2
172
- hidden_dims: 120
173
- kernel_size: [ 1, 3 ]
174
- use_guide: True
175
- Head:
176
- fc_decay: 0.00001
177
- - NRTRHead:
178
- nrtr_dim: 384
179
- max_text_length: 25
180
-
181
- ch_PP-OCRv4_rec_server_infer:
182
- model_type: rec
183
- algorithm: SVTR_HGNet
184
- Transform:
185
- Backbone:
186
- name: PPHGNet_small
187
- Head:
188
- name: MultiHead
189
- out_channels_list:
190
- CTCLabelDecode: 6625 #'blank' + ...(6623) + ' '
191
- head_list:
192
- - CTCHead:
193
- Neck:
194
- name: svtr
195
- dims: 120
196
- depth: 2
197
- hidden_dims: 120
198
- kernel_size: [ 1, 3 ]
199
- use_guide: True
200
- Head:
201
- fc_decay: 0.00001
202
- - NRTRHead:
203
- nrtr_dim: 384
204
- max_text_length: 25
205
-
206
79
  ch_PP-OCRv4_rec_server_doc_infer:
207
80
  model_type: rec
208
81
  algorithm: SVTR_HGNet
@@ -280,174 +153,6 @@ ch_PP-OCRv5_rec_infer:
280
153
  nrtr_dim: 384
281
154
  max_text_length: 25
282
155
 
283
- chinese_cht_PP-OCRv3_rec_infer:
284
- model_type: rec
285
- algorithm: SVTR
286
- Transform:
287
- Backbone:
288
- name: MobileNetV1Enhance
289
- scale: 0.5
290
- last_conv_stride: [1, 2]
291
- last_pool_type: avg
292
- Neck:
293
- name: SequenceEncoder
294
- encoder_type: svtr
295
- dims: 64
296
- depth: 2
297
- hidden_dims: 120
298
- use_guide: True
299
- Head:
300
- name: CTCHead
301
- # out_channels: 8423
302
- fc_decay: 0.00001
303
-
304
- latin_PP-OCRv3_rec_infer:
305
- model_type: rec
306
- algorithm: SVTR
307
- Transform:
308
- Backbone:
309
- name: MobileNetV1Enhance
310
- scale: 0.5
311
- last_conv_stride: [ 1, 2 ]
312
- last_pool_type: avg
313
- Neck:
314
- name: SequenceEncoder
315
- encoder_type: svtr
316
- dims: 64
317
- depth: 2
318
- hidden_dims: 120
319
- use_guide: True
320
- Head:
321
- name: CTCHead
322
- # out_channels: 187
323
- fc_decay: 0.00001
324
-
325
- cyrillic_PP-OCRv3_rec_infer:
326
- model_type: rec
327
- algorithm: SVTR
328
- Transform:
329
- Backbone:
330
- name: MobileNetV1Enhance
331
- scale: 0.5
332
- last_conv_stride: [ 1, 2 ]
333
- last_pool_type: avg
334
- Neck:
335
- name: SequenceEncoder
336
- encoder_type: svtr
337
- dims: 64
338
- depth: 2
339
- hidden_dims: 120
340
- use_guide: True
341
- Head:
342
- name: CTCHead
343
- # out_channels: 165
344
- fc_decay: 0.00001
345
-
346
- arabic_PP-OCRv3_rec_infer:
347
- model_type: rec
348
- algorithm: SVTR
349
- Transform:
350
- Backbone:
351
- name: MobileNetV1Enhance
352
- scale: 0.5
353
- last_conv_stride: [ 1, 2 ]
354
- last_pool_type: avg
355
- Neck:
356
- name: SequenceEncoder
357
- encoder_type: svtr
358
- dims: 64
359
- depth: 2
360
- hidden_dims: 120
361
- use_guide: True
362
- Head:
363
- name: CTCHead
364
- # out_channels: 164
365
- fc_decay: 0.00001
366
-
367
- korean_PP-OCRv3_rec_infer:
368
- model_type: rec
369
- algorithm: SVTR
370
- Transform:
371
- Backbone:
372
- name: MobileNetV1Enhance
373
- scale: 0.5
374
- last_conv_stride: [ 1, 2 ]
375
- last_pool_type: avg
376
- Neck:
377
- name: SequenceEncoder
378
- encoder_type: svtr
379
- dims: 64
380
- depth: 2
381
- hidden_dims: 120
382
- use_guide: True
383
- Head:
384
- name: CTCHead
385
- # out_channels: 3690
386
- fc_decay: 0.00001
387
-
388
- japan_PP-OCRv3_rec_infer:
389
- model_type: rec
390
- algorithm: SVTR
391
- Transform:
392
- Backbone:
393
- name: MobileNetV1Enhance
394
- scale: 0.5
395
- last_conv_stride: [ 1, 2 ]
396
- last_pool_type: avg
397
- Neck:
398
- name: SequenceEncoder
399
- encoder_type: svtr
400
- dims: 64
401
- depth: 2
402
- hidden_dims: 120
403
- use_guide: True
404
- Head:
405
- name: CTCHead
406
- # out_channels: 4401
407
- fc_decay: 0.00001
408
-
409
- ta_PP-OCRv3_rec_infer:
410
- model_type: rec
411
- algorithm: SVTR
412
- Transform:
413
- Backbone:
414
- name: MobileNetV1Enhance
415
- scale: 0.5
416
- last_conv_stride: [ 1, 2 ]
417
- last_pool_type: avg
418
- Neck:
419
- name: SequenceEncoder
420
- encoder_type: svtr
421
- dims: 64
422
- depth: 2
423
- hidden_dims: 120
424
- use_guide: True
425
- Head:
426
- name: CTCHead
427
- # out_channels: 130
428
- fc_decay: 0.00001
429
-
430
- te_PP-OCRv3_rec_infer:
431
- model_type: rec
432
- algorithm: SVTR
433
- Transform:
434
- Backbone:
435
- name: MobileNetV1Enhance
436
- scale: 0.5
437
- last_conv_stride: [ 1, 2 ]
438
- last_pool_type: avg
439
- Neck:
440
- name: SequenceEncoder
441
- encoder_type: svtr
442
- dims: 64
443
- depth: 2
444
- hidden_dims: 120
445
- use_guide: True
446
- Head:
447
- name: CTCHead
448
- # out_channels: 153
449
- fc_decay: 0.00001
450
-
451
156
  ka_PP-OCRv3_rec_infer:
452
157
  model_type: rec
453
158
  algorithm: SVTR
@@ -469,27 +174,6 @@ ka_PP-OCRv3_rec_infer:
469
174
  # out_channels: 155
470
175
  fc_decay: 0.00001
471
176
 
472
- devanagari_PP-OCRv3_rec_infer:
473
- model_type: rec
474
- algorithm: SVTR
475
- Transform:
476
- Backbone:
477
- name: MobileNetV1Enhance
478
- scale: 0.5
479
- last_conv_stride: [ 1, 2 ]
480
- last_pool_type: avg
481
- Neck:
482
- name: SequenceEncoder
483
- encoder_type: svtr
484
- dims: 64
485
- depth: 2
486
- hidden_dims: 120
487
- use_guide: True
488
- Head:
489
- name: CTCHead
490
- # out_channels: 169
491
- fc_decay: 0.00001
492
-
493
177
  korean_PP-OCRv5_rec_infer:
494
178
  model_type: rec
495
179
  algorithm: SVTR_HGNet
@@ -526,7 +210,7 @@ latin_PP-OCRv5_rec_infer:
526
210
  Head:
527
211
  name: MultiHead
528
212
  out_channels_list:
529
- CTCLabelDecode: 504
213
+ CTCLabelDecode: 838
530
214
  head_list:
531
215
  - CTCHead:
532
216
  Neck: