natural-pdf 0.1.5__py3-none-any.whl → 0.1.6__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (54) hide show
  1. docs/ocr/index.md +34 -47
  2. docs/tutorials/01-loading-and-extraction.ipynb +60 -46
  3. docs/tutorials/02-finding-elements.ipynb +42 -42
  4. docs/tutorials/03-extracting-blocks.ipynb +17 -17
  5. docs/tutorials/04-table-extraction.ipynb +12 -12
  6. docs/tutorials/05-excluding-content.ipynb +30 -30
  7. docs/tutorials/06-document-qa.ipynb +28 -28
  8. docs/tutorials/07-layout-analysis.ipynb +63 -35
  9. docs/tutorials/07-working-with-regions.ipynb +55 -51
  10. docs/tutorials/07-working-with-regions.md +2 -2
  11. docs/tutorials/08-spatial-navigation.ipynb +60 -60
  12. docs/tutorials/09-section-extraction.ipynb +113 -113
  13. docs/tutorials/10-form-field-extraction.ipynb +78 -50
  14. docs/tutorials/11-enhanced-table-processing.ipynb +6 -6
  15. docs/tutorials/12-ocr-integration.ipynb +149 -131
  16. docs/tutorials/12-ocr-integration.md +0 -13
  17. docs/tutorials/13-semantic-search.ipynb +313 -873
  18. natural_pdf/__init__.py +21 -23
  19. natural_pdf/analyzers/layout/gemini.py +264 -0
  20. natural_pdf/analyzers/layout/layout_manager.py +28 -1
  21. natural_pdf/analyzers/layout/layout_options.py +11 -0
  22. natural_pdf/analyzers/layout/yolo.py +6 -2
  23. natural_pdf/collections/pdf_collection.py +21 -0
  24. natural_pdf/core/element_manager.py +16 -13
  25. natural_pdf/core/page.py +165 -36
  26. natural_pdf/core/pdf.py +146 -41
  27. natural_pdf/elements/base.py +11 -17
  28. natural_pdf/elements/collections.py +100 -38
  29. natural_pdf/elements/region.py +77 -38
  30. natural_pdf/elements/text.py +5 -0
  31. natural_pdf/ocr/__init__.py +49 -36
  32. natural_pdf/ocr/engine.py +146 -51
  33. natural_pdf/ocr/engine_easyocr.py +141 -161
  34. natural_pdf/ocr/engine_paddle.py +107 -193
  35. natural_pdf/ocr/engine_surya.py +75 -148
  36. natural_pdf/ocr/ocr_factory.py +114 -0
  37. natural_pdf/ocr/ocr_manager.py +65 -93
  38. natural_pdf/ocr/ocr_options.py +7 -17
  39. natural_pdf/ocr/utils.py +98 -0
  40. natural_pdf/templates/spa/css/style.css +334 -0
  41. natural_pdf/templates/spa/index.html +31 -0
  42. natural_pdf/templates/spa/js/app.js +472 -0
  43. natural_pdf/templates/spa/words.txt +235976 -0
  44. natural_pdf/utils/debug.py +32 -0
  45. natural_pdf/utils/identifiers.py +29 -0
  46. natural_pdf/utils/packaging.py +418 -0
  47. {natural_pdf-0.1.5.dist-info → natural_pdf-0.1.6.dist-info}/METADATA +41 -19
  48. {natural_pdf-0.1.5.dist-info → natural_pdf-0.1.6.dist-info}/RECORD +51 -44
  49. {natural_pdf-0.1.5.dist-info → natural_pdf-0.1.6.dist-info}/WHEEL +1 -1
  50. {natural_pdf-0.1.5.dist-info → natural_pdf-0.1.6.dist-info}/top_level.txt +0 -1
  51. natural_pdf/templates/ocr_debug.html +0 -517
  52. tests/test_loading.py +0 -50
  53. tests/test_optional_deps.py +0 -298
  54. {natural_pdf-0.1.5.dist-info → natural_pdf-0.1.6.dist-info}/licenses/LICENSE +0 -0
@@ -17,7 +17,7 @@ docs/interactive-widget/index.ipynb,sha256=zY1rz5N34OUW-OtgcbI6iiOjlIJqXjVcx9OoN
17
17
  docs/interactive-widget/index.md,sha256=tZbq0uYI7Zwo9mLbhXpqeBriuAjazkIyEJeP-jasJ-Q,259
18
18
  docs/layout-analysis/index.ipynb,sha256=dkS_-cu-KGir5G2LGRcxBThKnW0dfA5nPPnwpoYGFtU,1869093
19
19
  docs/layout-analysis/index.md,sha256=ZnH5yd7B_eOLgGxW_4rNlzQs4Tn3Xx1cK3jX43CSpSM,5390
20
- docs/ocr/index.md,sha256=e5E9wqY6ehX7sJtrrie6gr6HtQb2neiYEoDKu4Qcjs4,8931
20
+ docs/ocr/index.md,sha256=uuzTqcAgUmMN7jZVq8VkVcbRDHn8Yg2nJVvHJ-bDK-Y,8177
21
21
  docs/pdf-navigation/index.ipynb,sha256=h6yew0HePXK1_c5FmETqzjBQceUBT0MU-vnXx_y91mo,8018
22
22
  docs/pdf-navigation/index.md,sha256=P3b3tsmOcmRtnfRxpsMeTgwm7vApnH_4le_QIwJd51M,2391
23
23
  docs/regions/index.ipynb,sha256=5A-N5A4v4lcXNptOAeI4i7i9Gx66To-Yus8B816dHBk,1303347
@@ -28,38 +28,38 @@ docs/text-analysis/index.ipynb,sha256=iaup8pcQXGp0ZK3IWi-HHssQLdIzWYGYfvZK5i8yjj
28
28
  docs/text-analysis/index.md,sha256=02pfZemOgV37izV7H-XzKmHu7AedDKLidQ-sKhYaMVw,3527
29
29
  docs/text-extraction/index.ipynb,sha256=809y9ZamXT3bc3GhwwFyoDnlyEpO-kUZ3tIsZZWyrj8,2537087
30
30
  docs/text-extraction/index.md,sha256=b1KfQpvIEelc8cPbFETUnK92az7iB4b7-LqK2DRH8vw,6985
31
- docs/tutorials/01-loading-and-extraction.ipynb,sha256=tB1TLios1FaieMUE4RuY_H6fVYpmDwFiMMxW6sillbs,541071
31
+ docs/tutorials/01-loading-and-extraction.ipynb,sha256=-9hFAVQtHmuXsR9Ge3A80wKr-t9wxouAAlW4_Iotdwo,544610
32
32
  docs/tutorials/01-loading-and-extraction.md,sha256=g40J8GhKz-ikM2URj5MqIatKKj4l5kTFozHeVjxDJQA,2191
33
- docs/tutorials/02-finding-elements.ipynb,sha256=oEdkN20PXGM1oH9p0QnSsq8yjQJJ9SU9eQhKO_g4RVQ,524374
33
+ docs/tutorials/02-finding-elements.ipynb,sha256=k1CSz47_atA9D6DXfQzVS64t5-L-KjssU2VuFvdy7oU,524374
34
34
  docs/tutorials/02-finding-elements.md,sha256=qOkjcWUzem05of54aKzKvy-MMzRX_S4CyZisVV-73QM,4162
35
- docs/tutorials/03-extracting-blocks.ipynb,sha256=2e7fc9t_46x0DM5RLI9aUUfLeVzfFZzzzKphBA8G5lY,260729
35
+ docs/tutorials/03-extracting-blocks.ipynb,sha256=1UjdP0j3kPCE3aU8p1jBCBqflG-xRLli2Ltx80DhOVk,260729
36
36
  docs/tutorials/03-extracting-blocks.md,sha256=_kqvhk6rSL7cGp2MSwTJk8LYlJGbK_r_umnCSBdR8XU,1665
37
- docs/tutorials/04-table-extraction.ipynb,sha256=o0LdALyko01oHJbMuuqZkVnoF2pfFnMNgtg1IgpSnRI,3973
37
+ docs/tutorials/04-table-extraction.ipynb,sha256=u92Wppw1qHG__Mx3ZKtETm4AWuGF8X-Ln3kvmF8zCSo,3973
38
38
  docs/tutorials/04-table-extraction.md,sha256=4q4v17VX8K-ZBtWYy0nbWPccyqB_ybd5Vl_IROmxz6Q,2130
39
- docs/tutorials/05-excluding-content.ipynb,sha256=6ZLFm3L_Odr4NJD2iW6mL81y5e3xymQvEVyv-VY5O6U,336197
39
+ docs/tutorials/05-excluding-content.ipynb,sha256=oSg8ll_nuWOfQHGLp0fNKVeyYyn_L8a-F7HJADjjdq8,336857
40
40
  docs/tutorials/05-excluding-content.md,sha256=U52SPlc5knqxiyhRokmxrj06T54r2ENyTfP7BMGykhY,3907
41
- docs/tutorials/06-document-qa.ipynb,sha256=BdFQNRqg6U4trACM8lmYSs9RYHJlxcd6DafXdw5mWR8,10303
41
+ docs/tutorials/06-document-qa.ipynb,sha256=Facyqns8jw2bTvsOSbNnsLskFH8kg1JTz4kmJ16dpcE,10303
42
42
  docs/tutorials/06-document-qa.md,sha256=PzPPgw0Rkkfe6sfz3XyKD9S9JbQ40qf4bDzCBvwH1P0,3026
43
- docs/tutorials/07-layout-analysis.ipynb,sha256=A5HMljUq7AaDSg_-vFywIQCyjKW2tjMmSPyPdaKFAE4,554523
43
+ docs/tutorials/07-layout-analysis.ipynb,sha256=tdNnMro1V66YPx0h96HZnujSm-zDpy7o78euQix4lyU,559517
44
44
  docs/tutorials/07-layout-analysis.md,sha256=NAYVzJTecDnXjo_isbPCSUBSn3c-xM1tELct1Zn5GmI,2533
45
- docs/tutorials/07-working-with-regions.ipynb,sha256=cRkr9VRho7J-dx9aIINO253Uz8io3PhD2mjNrASxql4,69510
46
- docs/tutorials/07-working-with-regions.md,sha256=Hi18sZhiHV1NDYE-EQ82OPMwrz-j1Krjw_ipT9cTkSI,4379
47
- docs/tutorials/08-spatial-navigation.ipynb,sha256=7HAAaK80R82Fy09heZ9WKwijY50DS89qGt_Xf2lB0Vo,193515
45
+ docs/tutorials/07-working-with-regions.ipynb,sha256=s4BFKKbKUemmURCpg6j91rNI8eFFOJUgxY4QN4alK4I,69584
46
+ docs/tutorials/07-working-with-regions.md,sha256=oanbTFSQ-topAVd9kjfkaPiMjHcx6Y8cqyxVbmxLhgs,4365
47
+ docs/tutorials/08-spatial-navigation.ipynb,sha256=jfwF6OHLvrMvaaknp-9AfUvr-pPXjPljUyGnFKF9wsw,194523
48
48
  docs/tutorials/08-spatial-navigation.md,sha256=IMbOYBjayXKE7pHfBjApTxOoKRD8WYj7opf8fsJCtzA,4855
49
- docs/tutorials/09-section-extraction.ipynb,sha256=JqkcPDXaifJSYJjbBB3LxB8XCMhbrWs-y5GcuOIvoNA,1100632
49
+ docs/tutorials/09-section-extraction.ipynb,sha256=Aqcy08oXTJ1pkJCmVVumndje-4WXnbkl_QfJPhps7f8,1100736
50
50
  docs/tutorials/09-section-extraction.md,sha256=Jy_be8ftAl_VPBWl5nEv7_5sKSZPx22DLUcBVHMD3Nc,7832
51
- docs/tutorials/10-form-field-extraction.ipynb,sha256=azOE7nDz-rYm-AqXF1NvO41CthR9DTwA_rbXHtobDZ4,280125
51
+ docs/tutorials/10-form-field-extraction.ipynb,sha256=yyopvBoS5vkKKtUQ6rZ4Kyo5E0Olp2WYnmunhfzSQkQ,281491
52
52
  docs/tutorials/10-form-field-extraction.md,sha256=t9tPlW36vJEhDrKIsHGg_f3P_MK62DT4-ZK1thKFs4Y,5494
53
- docs/tutorials/11-enhanced-table-processing.ipynb,sha256=GWH3xn2LTQztOTvkqjbqsUc6IbmuA0hJVFEPZ_O7Jew,1278
53
+ docs/tutorials/11-enhanced-table-processing.ipynb,sha256=BWpVUhtjaAX7r4OOdiy5gQgrSqREaoB0L5TuHqoHEn8,1278
54
54
  docs/tutorials/11-enhanced-table-processing.md,sha256=2HK-r1UwU7FLn7zWr_pMG7iLk-i0L4U4-t6ubOEeduc,282
55
- docs/tutorials/12-ocr-integration.ipynb,sha256=HeahYziw6aEIzMdTCN8F3XPPBmyVmZ0NU11ZT9JiMy0,23897
56
- docs/tutorials/12-ocr-integration.md,sha256=8FYgRciCkAPFF-tW1rkl5CrMGmvCR6oVWT1-f_tJ5as,4831
57
- docs/tutorials/13-semantic-search.ipynb,sha256=LhqelW0jxcAW1hpvBrEcCeM6gb5AKD10PJ439ywlHrw,73920
55
+ docs/tutorials/12-ocr-integration.ipynb,sha256=xurkoPwgk2p6mhmPdCehy9ccuYHrAhBCb1zGnjRbZ7Y,26724
56
+ docs/tutorials/12-ocr-integration.md,sha256=wU90sfnm1R6BoMFq-orbGpl8OUVcm-wEBTlK0bLgJC4,4572
57
+ docs/tutorials/13-semantic-search.ipynb,sha256=5h806AIal3EwXPVuXJESbXwdUImCx7fo0mo5-f3Dj44,42817
58
58
  docs/tutorials/13-semantic-search.md,sha256=nsNjv0ipYUC3YPSqT5d6dga9ZjObEc04Mc8c0-gsRnU,2914
59
59
  docs/visual-debugging/index.ipynb,sha256=MJ92u3Q9sfRCyDAQM4KWmCrs4QhKwIagbn6ytPF83L4,2175800
60
60
  docs/visual-debugging/index.md,sha256=ueGD2kNFhEAgIHt7qxCfrLRLjHcR7NTD3AU9okBhX9k,4176
61
61
  docs/visual-debugging/region.png,sha256=ULAJs3ZTxMjpD9F4w1DKaZXmhxga3KRq3NrUsXgw28s,67835
62
- natural_pdf/__init__.py,sha256=A3Bc-K2F_LtG08IjkJGngZraLsAT2FSm35Yic7i4Tuk,2913
62
+ natural_pdf/__init__.py,sha256=IjeAfnDU9fpkVc9YvU2DltNtBtIsZm8_DUyXGuyHGB8,2669
63
63
  natural_pdf/analyzers/__init__.py,sha256=dIXjsMqoxKmd9OOnSBzn12wvdIz7D7YNQRAnXslpJSM,142
64
64
  natural_pdf/analyzers/text_options.py,sha256=nE2E1pp4psDPpxmtarvNtEQsgozPkyFRjv0TVP2HTyU,2865
65
65
  natural_pdf/analyzers/text_structure.py,sha256=9h8hKRz0JWnr13xQr3b4FFr_-hDIjue07WvG7LmT8nc,12827
@@ -67,35 +67,38 @@ natural_pdf/analyzers/utils.py,sha256=Lgub1kYSTOnNxeLO1klStHLwH-GIuT4vpdqyVRF-Mc
67
67
  natural_pdf/analyzers/layout/__init__.py,sha256=oq1uJ5UkGGMbBKGirV1aRKK3hxAUyjTLywYkPCQH1f0,33
68
68
  natural_pdf/analyzers/layout/base.py,sha256=9dCR758mAuz7ExlHJ-gwnPnETaM4GZV3W1IRei_t13s,6815
69
69
  natural_pdf/analyzers/layout/docling.py,sha256=4BJYyNVR6VegZGxyisvNIBBRvVk6YKPyDVs7ZdVfzEU,12676
70
+ natural_pdf/analyzers/layout/gemini.py,sha256=Dslt6rOar9S-QSahyjjXN7Z0KEp7CoVStAA4tvB06X8,10894
70
71
  natural_pdf/analyzers/layout/layout_analyzer.py,sha256=6aed1qz5jpndOiakXCBRZAcnyG_waeXi3WPuP5fRvh4,14046
71
- natural_pdf/analyzers/layout/layout_manager.py,sha256=kVBPQ8Ex33SYzzm1fhQOtP4qmHOc92dn4BEfff66Qx4,10053
72
- natural_pdf/analyzers/layout/layout_options.py,sha256=1u8RVdiRwaq5hhGUpVLIdYXCH6TqEq0UxCPdm6JrdTI,3369
72
+ natural_pdf/analyzers/layout/layout_manager.py,sha256=Vh8EKiszKqjELofxQ1eiVLKVjibyjBsZpLFzTf0_21E,11179
73
+ natural_pdf/analyzers/layout/layout_options.py,sha256=s7xr4brE3OutE6aYNAi2PniRy1p2w8a342C2xGpvX2s,3777
73
74
  natural_pdf/analyzers/layout/paddle.py,sha256=gTI9ZqNd5-t4H5IByGfL32WgcE6JrdchW6jRiGI6ulM,13375
74
75
  natural_pdf/analyzers/layout/surya.py,sha256=vhji6ynHPMyQLHuYRPQcplNi7m_lG4P4NYtWv6MzcME,13556
75
76
  natural_pdf/analyzers/layout/tatr.py,sha256=-GJhMy4d0yx6egkO9-ULAIdQkkQRyAKExoIta-b256U,12971
76
- natural_pdf/analyzers/layout/yolo.py,sha256=gy_1DY4sG7jU5rQ7Rb6FUGYI9FFMaozAWiWuxRH5yNw,8294
77
- natural_pdf/collections/pdf_collection.py,sha256=E9GVEgGjTBGpNkuSO_f4GMrSB7Tmi60wnkD7pgvBVOM,12175
77
+ natural_pdf/analyzers/layout/yolo.py,sha256=ANo2U4EZgeN2eYKM1bZIuysiuJLgwl4JeQchrRxOKwA,8388
78
+ natural_pdf/collections/pdf_collection.py,sha256=Qfauo7fskmw3MSzG0C_OjIGLskyFSQxWQkbHrPDYpno,13240
78
79
  natural_pdf/core/__init__.py,sha256=QC8H4M3KbXwMFiQORZ0pdPlzx1Ix6oKKQSS7Ib2KEaA,38
79
- natural_pdf/core/element_manager.py,sha256=R2vY7nYbqrtL1FLRbrJvpUyCpf97zUui-2CaEV2CFQc,21858
80
+ natural_pdf/core/element_manager.py,sha256=rPTkppvU5nQ6Q1_ZtTbcY-KpcRBZV_uBKuNwllHBks0,22100
80
81
  natural_pdf/core/highlighting_service.py,sha256=CTVd7y-fpIreFSe70cTpMu1Pwl6HKMtTHp0bh2U7VXk,32609
81
- natural_pdf/core/page.py,sha256=CQy3zgHT6VBmo7n6cZ5RITSUURIEPzPsWqWQAUGFOZc,78302
82
- natural_pdf/core/pdf.py,sha256=yaShN4vHJ1BXxWAj4lRk7udTcl6F9ddicBFCV6kd--w,41146
82
+ natural_pdf/core/page.py,sha256=Fw01hvK7ekj3iGpj9YbbsVygCmOtTC3qLNvzGBHS4iQ,84784
83
+ natural_pdf/core/pdf.py,sha256=dq2bcxbrbY0zS8t3NKkvqi63Oj2nNzaCHUyHz81OoBI,46383
83
84
  natural_pdf/elements/__init__.py,sha256=S8XeiNWJ1WcgnyYKdYV1yxQlAxCCO3FfITT8MQwNbyk,41
84
- natural_pdf/elements/base.py,sha256=vUga2Nm8DWoRfKMWVTt5N8UMh1q-YzUNbTfDouHzS2U,35698
85
- natural_pdf/elements/collections.py,sha256=2kwOF_-5TePvLbZLVyeEZRt4Im3KlmX8j46giVdxcUE,66000
85
+ natural_pdf/elements/base.py,sha256=hgXpcftlvyUOMGZ8EHEu0WhJz2weqcLrCOFgMEhfm-w,35171
86
+ natural_pdf/elements/collections.py,sha256=Fy5l1Rso-LMunZ6D6Y0n90Uk89h8dzJ2Js7r-8r8NSY,68885
86
87
  natural_pdf/elements/line.py,sha256=7cow3xMUKhAj7zoQz7OaB1eIH2_a8B__LB7iGJ4Mb0o,4612
87
88
  natural_pdf/elements/rect.py,sha256=kiVa3e377ZnqIOXc89d9ZSY4EcmDxtccdtUw-HOQzpw,3796
88
- natural_pdf/elements/region.py,sha256=GOHnq4j4GL-UUQyLdnCLPb0YhBq_YrHn6anecX03t30,67714
89
- natural_pdf/elements/text.py,sha256=Q4hKlXyGhz7njnr_-sON1p8Uqqc8qZBLAqu0VUkT-OE,10958
89
+ natural_pdf/elements/region.py,sha256=-mBZnWoYMB7cLm5RZhHWCnJkJjsfcgH-f2ESktl-lNk,69656
90
+ natural_pdf/elements/text.py,sha256=8PNKSLUgXUhEu9IFfbNbSSpuu0Slm11T6UH8jn4O6hQ,11078
90
91
  natural_pdf/exporters/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
91
92
  natural_pdf/exporters/searchable_pdf.py,sha256=qsaPsnbOOaZHA_aplfZbwQnBoK9KghWm-wzbyRRomeY,16859
92
- natural_pdf/ocr/__init__.py,sha256=8ytKCg4VmiX1LkehnCbBNnL-zLc95CmsLJKDfGFtklE,1916
93
- natural_pdf/ocr/engine.py,sha256=D8B8QHF_8E68JaklyHoNUA3hGn5ld7TGKHD7Ho6mJMg,4316
94
- natural_pdf/ocr/engine_easyocr.py,sha256=aE9alo9rKxZddQAt3liWvlGssH8b2jRtmLwpndttlRM,8617
95
- natural_pdf/ocr/engine_paddle.py,sha256=4ELH9P9-FOTYj_CbUOKiW2gf5U9v2Tscx0fX0nW8j84,9248
96
- natural_pdf/ocr/engine_surya.py,sha256=pzv4CKneXlRvCXsdImAEou81MOTwMYCNhNIVG6Fg3rU,7922
97
- natural_pdf/ocr/ocr_manager.py,sha256=S2ndzKdB-nmK9glbSmn7srotIgKweCByeGIX6SOoEY4,10465
98
- natural_pdf/ocr/ocr_options.py,sha256=JZXRxjsQuKf9GJMt56YikcOqsTQ7SvXOv2XZ7z1qnB8,3794
93
+ natural_pdf/ocr/__init__.py,sha256=8EvoA2poYbtkS8Jmbkgn4hFEwOHbN5fIXdJc9tT4NzI,2477
94
+ natural_pdf/ocr/engine.py,sha256=oTABzt20pEvKadTv1U7zOIv_jSTwv5dty2Q_6vf6HQs,8767
95
+ natural_pdf/ocr/engine_easyocr.py,sha256=zki3-fd-u01E9VPdaBD0Rkel18Nk9xYBg477MXY0C8w,8487
96
+ natural_pdf/ocr/engine_paddle.py,sha256=8OYbcYrjIaYop7h7W4R7bXWHKOCYhJQpqT2cVccNb5E,6209
97
+ natural_pdf/ocr/engine_surya.py,sha256=PtzvDOqxNzhAEeh0rIhTwPXDAbTHMR2IRs0tXb-4pag,4693
98
+ natural_pdf/ocr/ocr_factory.py,sha256=3fxIpgGi6NzxhfYpl5Kblufyx_-RRoT7dlRGktYjB_Y,4425
99
+ natural_pdf/ocr/ocr_manager.py,sha256=sMQrpvAaA4PbjhZOf7G_KGW3KBhXhx1l26ig_Xqf_0g,9190
100
+ natural_pdf/ocr/ocr_options.py,sha256=3njghlnnkcxOL4Td7l6mt-mTEFmL8Z-ryf_BX-EM3i4,3289
101
+ natural_pdf/ocr/utils.py,sha256=AIBkGQExetjl2wyuQLpWJSy0HSxaOBmuCo2QsKmY7Rc,3404
99
102
  natural_pdf/qa/__init__.py,sha256=Pjo62JTnUNEjGNsC437mvsS5KQ5m7X_BibGvavR9AW0,108
100
103
  natural_pdf/qa/document_qa.py,sha256=W4E4vS_Eox_IBsYpVb0ifQbJb0FP-PYEIG93CU3rUkE,15246
101
104
  natural_pdf/search/__init__.py,sha256=EB_HRwlktJn5WGPVtSaRbOQNjLAZTxujeYf_eN-zd2U,4191
@@ -107,16 +110,22 @@ natural_pdf/search/searchable_mixin.py,sha256=M2a6FaFVM0vcfh7FgjDH6BLhS-7ggeVpcf
107
110
  natural_pdf/selectors/__init__.py,sha256=oZGeqSv53EqmIZOhcnawuaGGlRg1h79vArXuZCWKm4A,123
108
111
  natural_pdf/selectors/parser.py,sha256=59_GSsTApM6MFvtqhrrmbKaBfODPbGXMluvvQJcrqhE,15754
109
112
  natural_pdf/templates/__init__.py,sha256=jYBxzfi73vew0f6yhIh1MlRxw4F_TVN2hKQR0YXOFe0,20
110
- natural_pdf/templates/ocr_debug.html,sha256=Zy9StzBeHFQU8ity6cjFSZLe3TY0QOabUux4c5WQUzs,19171
113
+ natural_pdf/templates/spa/index.html,sha256=6hLTp07OeV5Q4jUMp5Sgl-dwfBs3oPzBxqphG4kEs24,787
114
+ natural_pdf/templates/spa/words.txt,sha256=vkGtl5Y7-Nq-3Vhx1daRWWF1Jp1UCVaw-ZZaiFwrurk,2493885
115
+ natural_pdf/templates/spa/css/style.css,sha256=Qdl0U3L5HMyhBDNzyRPklfb3OxW6rMxCfQbzO8i8IW4,7643
116
+ natural_pdf/templates/spa/js/app.js,sha256=Efb7NmcTN9RLdLwKpDcU6CG5Ix0laHtzRHmfUlDMJXw,19679
111
117
  natural_pdf/utils/__init__.py,sha256=s3M8FggaK1P3EBYn6R_-HgSDjNc9C73gyKe1hihtNWg,43
118
+ natural_pdf/utils/debug.py,sha256=56dk0OcDUwjRbYU2g1k0_G_3hfHkAF9Z6vnMVt3myMU,992
112
119
  natural_pdf/utils/highlighting.py,sha256=EIY6ihVGtUTS_DjWyxpnr_UXpcR4btC1KhSGQ9VUfKg,698
120
+ natural_pdf/utils/identifiers.py,sha256=IvXj2q-NW1cmivWAedDOZBFPTRbVl0_J8BP4phREt9U,1092
121
+ natural_pdf/utils/packaging.py,sha256=mNPEqCtc0CVWjKg1RcSldYTgspUWQOLAR_ZEllyKxs4,20175
113
122
  natural_pdf/utils/reading_order.py,sha256=s3DsYq_3g_1YA07qhd4BGEjeIRTeyGtnwc_hNtSzwBY,7290
114
123
  natural_pdf/utils/text_extraction.py,sha256=VlbkXg14GlvwYTjRJWa8FVUigETY3Hq0v8NlIRnzYkM,8619
115
124
  natural_pdf/utils/visualization.py,sha256=ir5PgpptRuVuVeRT9IcdTsNeEpdOYD_69rByjHQ7JhI,8592
116
125
  natural_pdf/widgets/__init__.py,sha256=O2fSDo604wDAP6UwUkmBq3eT91RSqHwBpAOQXq92S8s,214
117
126
  natural_pdf/widgets/viewer.py,sha256=Aiw6kuBc0WkhcZrPNKyLNzzWbmtmU6rvOmHV0IuXCBk,40862
118
127
  natural_pdf/widgets/frontend/viewer.js,sha256=w8ywfz_IOAAv2nP_qaf2VBUkF1KhjT3zorhJxM1-CfU,4371
119
- natural_pdf-0.1.5.dist-info/licenses/LICENSE,sha256=9zfwINwJlarbDmdh6iJV4QUG54QSJlSAUcnC1YiC_Ns,1074
128
+ natural_pdf-0.1.6.dist-info/licenses/LICENSE,sha256=9zfwINwJlarbDmdh6iJV4QUG54QSJlSAUcnC1YiC_Ns,1074
120
129
  notebooks/Examples.ipynb,sha256=l4YMtMEx_DWBzWIjl9CmBkWTo0g_nK8l_XWOyzYooQM,4275170
121
130
  pdfs/.gitkeep,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
122
131
  pdfs/01-practice.pdf,sha256=dxWyJIa2cm7bALE3BWDJ2dg3inyFlo1n8ntVyy0hkTo,7906
@@ -126,9 +135,7 @@ pdfs/2014 Statistics.pdf,sha256=B-30OQVjqj_3718-G9cGUefNddnz-MosPdHAzfGfkcc,9559
126
135
  pdfs/2019 Statistics.pdf,sha256=reuSJxvAlx9_P-pW7IPqzox0jFCxSPbK1i1-WFu-uGA,511439
127
136
  pdfs/Atlanta_Public_Schools_GA_sample.pdf,sha256=PLBh_uWJQH0MnBaSm5ng5Ima63_m6Mi11CjdravB_S8,137689
128
137
  pdfs/needs-ocr.pdf,sha256=vusKiLxSOlELUTetfZfaotNU54RtMj9PCzGfLc2cuNs,139305
129
- tests/test_loading.py,sha256=AHjnIKqEAdtQa28kEAhFQTJ0Nnu49AmxnPM8YE8_EP0,1770
130
- tests/test_optional_deps.py,sha256=e9H3ylLsB4cnyC3TVMgUbBMzmSbq6MlH8jn_pqh4Hus,12111
131
- natural_pdf-0.1.5.dist-info/METADATA,sha256=7lBaQX1e1ibQibz2ZRYt0DsDy84k3sk6dGJqT9lQvWg,5466
132
- natural_pdf-0.1.5.dist-info/WHEEL,sha256=CmyFI0kx5cdEMTLiONQRbGQwjIoR1aIYB7eCAQ4KPJ0,91
133
- natural_pdf-0.1.5.dist-info/top_level.txt,sha256=N44f8aOLMpI6MzrNHsCD8MzElkir_H1nPUGZ4QToWqI,38
134
- natural_pdf-0.1.5.dist-info/RECORD,,
138
+ natural_pdf-0.1.6.dist-info/METADATA,sha256=Yd92-6FRKc6KdEuTpCOWyxBcewnhAoYTAhtbq6qIB0Q,6668
139
+ natural_pdf-0.1.6.dist-info/WHEEL,sha256=pxyMxgL8-pra_rKaQ4drOZAegBVuX-G_4nRHjjgWbmo,91
140
+ natural_pdf-0.1.6.dist-info/top_level.txt,sha256=7nDKUnpkN7B8cBI7DEpW5JM8S7OcOgHw3jXH-1iCX2o,32
141
+ natural_pdf-0.1.6.dist-info/RECORD,,
@@ -1,5 +1,5 @@
1
1
  Wheel-Version: 1.0
2
- Generator: setuptools (78.1.0)
2
+ Generator: setuptools (79.0.0)
3
3
  Root-Is-Purelib: true
4
4
  Tag: py3-none-any
5
5
 
@@ -2,4 +2,3 @@ docs
2
2
  natural_pdf
3
3
  notebooks
4
4
  pdfs
5
- tests