natural-pdf 0.1.32__tar.gz → 0.1.33__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/.gitignore +1 -0
- {natural_pdf-0.1.32/natural_pdf.egg-info → natural_pdf-0.1.33}/PKG-INFO +1 -1
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/core/element_manager.py +62 -42
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/core/page.py +27 -2
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/core/pdf.py +16 -3
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/elements/region.py +19 -6
- {natural_pdf-0.1.32 → natural_pdf-0.1.33/natural_pdf.egg-info}/PKG-INFO +1 -1
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf.egg-info/SOURCES.txt +1 -0
- natural_pdf-0.1.33/tests/test_core/test_text_layer.py +125 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/.cursor/rules/analysis_framework.mdc +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/.cursor/rules/coding-style.mdc +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/.cursor/rules/edit-md-instead-of-ipynb.mdc +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/.cursor/rules/minimal-comments.mdc +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/.cursor/rules/natural-pdf-overview.mdc +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/.cursor/rules/user-friendly-library-code.mdc +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/.github/workflows/docs.yml +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/.pre-commit-config.yaml +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/01-execute_notebooks.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/02-run_all_tutorials.sh +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/CLAUDE.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/LICENSE +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/MANIFEST.in +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/README.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/audit_packaging.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/1A4PPW1_The arabic text/1A4PPW1_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/1A4PPW1_The arabic text/analysis/1A4PPW1/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/1A4PPW1_The arabic text/analysis/1A4PPW1/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/1A4PPW1_The arabic text/analysis/1A4PPW1/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/1A4PPW1_The arabic text/analysis/1A4PPW1/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/1A4PPW1_The arabic text/analysis/1A4PPW1/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/1A4PPW1_The arabic text/analysis/1A4PPW1/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/1A4PPW1_The arabic text/analysis/1A4PPW1/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/1A4PPW1_The arabic text/analysis/1A4PPW1/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/1A4PPW1_The arabic text/detailed_analysis_final/1A4PPW1_The arabic text_detailed_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/1A4PPW1_The arabic text/detailed_analysis_final/detailed_analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/1A4PPW1_The arabic text/detailed_analysis_final/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/1A4PPW1_The arabic text/detailed_analysis_final/page_11.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/2EAOEvb_The text_ without beeing divided in 2 columns and /2EAOEvb_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/2EAOEvb_The text_ without beeing divided in 2 columns and /analysis/2EAOEvb/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/2EAOEvb_The text_ without beeing divided in 2 columns and /analysis/2EAOEvb/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/2EAOEvb_The text_ without beeing divided in 2 columns and /analysis/2EAOEvb/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/2EAOEvb_The text_ without beeing divided in 2 columns and /analysis/2EAOEvb/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/2EAOEvb_The text_ without beeing divided in 2 columns and /analysis/2EAOEvb/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/2EAOEvb_The text_ without beeing divided in 2 columns and /analysis/2EAOEvb/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/2EAOEvb_The text_ without beeing divided in 2 columns and /analysis/2EAOEvb/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/2EAOEvb_The text_ without beeing divided in 2 columns and /detailed_analysis_final/2EAOEvb_The text_ without beeing divided in 2 columns and _detailed_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/2EAOEvb_The text_ without beeing divided in 2 columns and /detailed_analysis_final/detailed_analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/2EAOEvb_The text_ without beeing divided in 2 columns and /detailed_analysis_final/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/2EAOEvb_The text_ without beeing divided in 2 columns and /detailed_analysis_final/page_98.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Focus/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Focus/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Focus/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Focus/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Focus/page_1_regions_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Focus/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Focus/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Gx9jayj_A CSV of all the complaints_ officers and details/Gx9jayj_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Gx9jayj_A CSV of all the complaints_ officers and details/analysis/Gx9jayj/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Gx9jayj_A CSV of all the complaints_ officers and details/analysis/Gx9jayj/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Gx9jayj_A CSV of all the complaints_ officers and details/analysis/Gx9jayj/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Gx9jayj_A CSV of all the complaints_ officers and details/analysis/Gx9jayj/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Gx9jayj_A CSV of all the complaints_ officers and details/analysis/Gx9jayj/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Gx9jayj_A CSV of all the complaints_ officers and details/analysis/Gx9jayj/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Gx9jayj_A CSV of all the complaints_ officers and details/analysis/Gx9jayj/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Gx9jayj_A CSV of all the complaints_ officers and details/analysis/Gx9jayj/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/GxpvezO_The table in Nepali on page 30 _in between the tex/GxpvezO_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/GxpvezO_The table in Nepali on page 30 _in between the tex/analysis/GxpvezO/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/GxpvezO_The table in Nepali on page 30 _in between the tex/analysis/GxpvezO/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/GxpvezO_The table in Nepali on page 30 _in between the tex/analysis/GxpvezO/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/GxpvezO_The table in Nepali on page 30 _in between the tex/analysis/GxpvezO/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/GxpvezO_The table in Nepali on page 30 _in between the tex/analysis/GxpvezO/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/GxpvezO_The table in Nepali on page 30 _in between the tex/analysis/GxpvezO/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/GxpvezO_The table in Nepali on page 30 _in between the tex/analysis/GxpvezO/page_1_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/GxpvezO_The table in Nepali on page 30 _in between the tex/analysis/GxpvezO/page_1_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/GxpvezO_The table in Nepali on page 30 _in between the tex/analysis/GxpvezO/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/GxpvezO_The table in Nepali on page 30 _in between the tex/analysis/GxpvezO/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/GxpvezO_The table in Nepali on page 30 _in between the tex/detailed_analysis_final/GxpvezO_The table in Nepali on page 30 _in between the tex_detailed_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/GxpvezO_The table in Nepali on page 30 _in between the tex/detailed_analysis_final/detailed_analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/GxpvezO_The table in Nepali on page 30 _in between the tex/detailed_analysis_final/page_30.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/GxpvezO_The table in Nepali on page 30 _in between the tex/enhanced_analysis_10/GxpvezO_The table in Nepali on page 30 _in between the tex_enhanced_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/GxpvezO_The table in Nepali on page 30 _in between the tex/enhanced_analysis_10/analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/GxpvezO_The table in Nepali on page 30 _in between the tex/enhanced_analysis_10/page_30.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9lKd7Y_Table in Slovenian _e.g. on page 80_./J9lKd7Y_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9lKd7Y_Table in Slovenian _e.g. on page 80_./analysis/J9lKd7Y/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9lKd7Y_Table in Slovenian _e.g. on page 80_./analysis/J9lKd7Y/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9lKd7Y_Table in Slovenian _e.g. on page 80_./analysis/J9lKd7Y/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9lKd7Y_Table in Slovenian _e.g. on page 80_./analysis/J9lKd7Y/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9lKd7Y_Table in Slovenian _e.g. on page 80_./analysis/J9lKd7Y/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9lKd7Y_Table in Slovenian _e.g. on page 80_./analysis/J9lKd7Y/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9lKd7Y_Table in Slovenian _e.g. on page 80_./analysis/J9lKd7Y/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9lKd7Y_Table in Slovenian _e.g. on page 80_./analysis/J9lKd7Y/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9lKd7Y_Table in Slovenian _e.g. on page 80_./detailed_analysis_final/J9lKd7Y_Table in Slovenian _e.g. on page 80_._detailed_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9lKd7Y_Table in Slovenian _e.g. on page 80_./detailed_analysis_final/detailed_analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9lKd7Y_Table in Slovenian _e.g. on page 80_./detailed_analysis_final/page_80.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9lKd7Y_Table in Slovenian _e.g. on page 80_./enhanced_analysis_10/J9lKd7Y_Table in Slovenian _e.g. on page 80_._enhanced_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9lKd7Y_Table in Slovenian _e.g. on page 80_./enhanced_analysis_10/analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9lKd7Y_Table in Slovenian _e.g. on page 80_./enhanced_analysis_10/page_80.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/J9px44R_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/analysis/J9px44R/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/analysis/J9px44R/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/analysis/J9px44R/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/analysis/J9px44R/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/analysis/J9px44R/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/analysis/J9px44R/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_10.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_10_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_10_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_10_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_10_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_10_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_2.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_2_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_2_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_2_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_2_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_2_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_3.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_3_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_3_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_3_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_3_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_3_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_3_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_3_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_4.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_4_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_4_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_4_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_4_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_4_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_5.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_5_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_5_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_5_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_5_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_5_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_5_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_6.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_6_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_6_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_6_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_6_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_6_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_6_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_6_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_6_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_7.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_7_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_7_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_7_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_7_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_7_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_7_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_7_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_7_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_8.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_8_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_8_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_8_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_8_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_8_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_8_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_8_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_8_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_9.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_9_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_9_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_9_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_9_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_9_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_9_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_9_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis/J9px44R/page_9_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis_final/J9px44R_Tables of Senate office expenditures_detailed_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis_final/detailed_analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis_final/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/J9px44R_Tables of Senate office expenditures/detailed_analysis_final/page_1489.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/NplKG2O_Try to see if natural-pdf can process non-standard/NplKG2O_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/NplKG2O_Try to see if natural-pdf can process non-standard/analysis/NplKG2O/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/NplKG2O_Try to see if natural-pdf can process non-standard/analysis/NplKG2O/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/NplKG2O_Try to see if natural-pdf can process non-standard/analysis/NplKG2O/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/NplKG2O_Try to see if natural-pdf can process non-standard/analysis/NplKG2O/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/NplKG2O_Try to see if natural-pdf can process non-standard/analysis/NplKG2O/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/NplKG2O_Try to see if natural-pdf can process non-standard/analysis/NplKG2O/page_1_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/NplKG2O_Try to see if natural-pdf can process non-standard/analysis/NplKG2O/page_1_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/NplKG2O_Try to see if natural-pdf can process non-standard/analysis/NplKG2O/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/NplKG2O_Try to see if natural-pdf can process non-standard/analysis/NplKG2O/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/NplKG2O_Try to see if natural-pdf can process non-standard/enhanced_analysis_10/NplKG2O_Try to see if natural-pdf can process non-standard_enhanced_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/NplKG2O_Try to see if natural-pdf can process non-standard/enhanced_analysis_10/analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/NplKG2O_Try to see if natural-pdf can process non-standard/enhanced_analysis_10/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/OD49rjM_Just being able to make sense of any of it. It_s b/OD49rjM_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/OD49rjM_Just being able to make sense of any of it. It_s b/analysis/OD49rjM/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/OD49rjM_Just being able to make sense of any of it. It_s b/analysis/OD49rjM/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/OD49rjM_Just being able to make sense of any of it. It_s b/analysis/OD49rjM/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/OD49rjM_Just being able to make sense of any of it. It_s b/analysis/OD49rjM/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/OD49rjM_Just being able to make sense of any of it. It_s b/analysis/OD49rjM/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/OD49rjM_Just being able to make sense of any of it. It_s b/analysis/OD49rjM/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/OD49rjM_Just being able to make sense of any of it. It_s b/analysis/OD49rjM/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/OD49rjM_Just being able to make sense of any of it. It_s b/analysis/OD49rjM/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/OD49rjM_Just being able to make sense of any of it. It_s b/detailed_analysis_final/OD49rjM_Just being able to make sense of any of it. It_s b_detailed_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/OD49rjM_Just being able to make sense of any of it. It_s b/detailed_analysis_final/detailed_analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/OD49rjM_Just being able to make sense of any of it. It_s b/detailed_analysis_final/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/OD49rjM_Just being able to make sense of any of it. It_s b/detailed_analysis_final/page_17303.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODX1DW8_The large table on page 179/ODX1DW8_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODX1DW8_The large table on page 179/analysis/ODX1DW8/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODX1DW8_The large table on page 179/analysis/ODX1DW8/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODX1DW8_The large table on page 179/analysis/ODX1DW8/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODX1DW8_The large table on page 179/analysis/ODX1DW8/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODX1DW8_The large table on page 179/analysis/ODX1DW8/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODX1DW8_The large table on page 179/analysis/ODX1DW8/page_1_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODX1DW8_The large table on page 179/analysis/ODX1DW8/page_1_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODX1DW8_The large table on page 179/analysis/ODX1DW8/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODX1DW8_The large table on page 179/enhanced_analysis/ODX1DW8_enhanced_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODX1DW8_The large table on page 179/enhanced_analysis/enhanced_analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODX1DW8_The large table on page 179/enhanced_analysis/page_178.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODX1DW8_The large table on page 179/enhanced_analysis/page_179.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODX1DW8_The large table on page 179/enhanced_analysis/page_180.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODXl8aR_0. ISO code of the business_ business name_ contac/ODXl8aR_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODXl8aR_0. ISO code of the business_ business name_ contac/analysis/ODXl8aR/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODXl8aR_0. ISO code of the business_ business name_ contac/analysis/ODXl8aR/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODXl8aR_0. ISO code of the business_ business name_ contac/analysis/ODXl8aR/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODXl8aR_0. ISO code of the business_ business name_ contac/analysis/ODXl8aR/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODXl8aR_0. ISO code of the business_ business name_ contac/analysis/ODXl8aR/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODXl8aR_0. ISO code of the business_ business name_ contac/analysis/ODXl8aR/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODXl8aR_0. ISO code of the business_ business name_ contac/analysis/ODXl8aR/page_1_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODXl8aR_0. ISO code of the business_ business name_ contac/analysis/ODXl8aR/page_1_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODXl8aR_0. ISO code of the business_ business name_ contac/analysis/ODXl8aR/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODXl8aR_0. ISO code of the business_ business name_ contac/analysis/ODXl8aR/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODXl8aR_0. ISO code of the business_ business name_ contac/detailed_analysis_final/ODXl8aR_0. ISO code of the business_ business name_ contac_detailed_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODXl8aR_0. ISO code of the business_ business name_ contac/detailed_analysis_final/detailed_analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODXl8aR_0. ISO code of the business_ business name_ contac/detailed_analysis_final/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ODXl8aR_0. ISO code of the business_ business name_ contac/detailed_analysis_final/page_55.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd1KBb1_the data table _of election results_/Pd1KBb1_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd1KBb1_the data table _of election results_/analysis/Pd1KBb1/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd1KBb1_the data table _of election results_/analysis/Pd1KBb1/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd1KBb1_the data table _of election results_/analysis/Pd1KBb1/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd1KBb1_the data table _of election results_/analysis/Pd1KBb1/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd1KBb1_the data table _of election results_/analysis/Pd1KBb1/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd1KBb1_the data table _of election results_/analysis/Pd1KBb1/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd1KBb1_the data table _of election results_/analysis/Pd1KBb1/page_1_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd1KBb1_the data table _of election results_/analysis/Pd1KBb1/page_1_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd1KBb1_the data table _of election results_/analysis/Pd1KBb1/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd1KBb1_the data table _of election results_/analysis/Pd1KBb1/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd1KBb1_the data table _of election results_/detailed_analysis_final/Pd1KBb1_the data table _of election results__detailed_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd1KBb1_the data table _of election results_/detailed_analysis_final/detailed_analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd1KBb1_the data table _of election results_/detailed_analysis_final/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd9WVDb_We want a spreadsheet showing all the columns sepa/Pd9WVDb_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd9WVDb_We want a spreadsheet showing all the columns sepa/analysis/Pd9WVDb/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd9WVDb_We want a spreadsheet showing all the columns sepa/analysis/Pd9WVDb/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd9WVDb_We want a spreadsheet showing all the columns sepa/analysis/Pd9WVDb/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd9WVDb_We want a spreadsheet showing all the columns sepa/analysis/Pd9WVDb/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd9WVDb_We want a spreadsheet showing all the columns sepa/analysis/Pd9WVDb/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd9WVDb_We want a spreadsheet showing all the columns sepa/analysis/Pd9WVDb/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd9WVDb_We want a spreadsheet showing all the columns sepa/analysis/Pd9WVDb/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd9WVDb_We want a spreadsheet showing all the columns sepa/analysis/Pd9WVDb/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd9WVDb_We want a spreadsheet showing all the columns sepa/detailed_analysis_final/Pd9WVDb_We want a spreadsheet showing all the columns sepa_detailed_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd9WVDb_We want a spreadsheet showing all the columns sepa/detailed_analysis_final/detailed_analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd9WVDb_We want a spreadsheet showing all the columns sepa/detailed_analysis_final/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Pd9WVDb_We want a spreadsheet showing all the columns sepa/detailed_analysis_final/page_12454.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Xxogz9j_This bad PDF is one of the pinnacles of Japanese F/Xxogz9j_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Xxogz9j_This bad PDF is one of the pinnacles of Japanese F/analysis/Xxogz9j/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Xxogz9j_This bad PDF is one of the pinnacles of Japanese F/analysis/Xxogz9j/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Xxogz9j_This bad PDF is one of the pinnacles of Japanese F/analysis/Xxogz9j/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Xxogz9j_This bad PDF is one of the pinnacles of Japanese F/analysis/Xxogz9j/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Xxogz9j_This bad PDF is one of the pinnacles of Japanese F/analysis/Xxogz9j/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Xxogz9j_This bad PDF is one of the pinnacles of Japanese F/analysis/Xxogz9j/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Y5G72LB_We are trying to get specific information such as /Y5G72LB_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Y5G72LB_We are trying to get specific information such as /analysis/Y5G72LB/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Y5G72LB_We are trying to get specific information such as /analysis/Y5G72LB/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Y5G72LB_We are trying to get specific information such as /analysis/Y5G72LB/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Y5G72LB_We are trying to get specific information such as /analysis/Y5G72LB/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Y5G72LB_We are trying to get specific information such as /analysis/Y5G72LB/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Y5G72LB_We are trying to get specific information such as /analysis/Y5G72LB/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Y5G72LB_We are trying to get specific information such as /analysis/Y5G72LB/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Y5G72LB_We are trying to get specific information such as /analysis/Y5G72LB/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Y5G72LB_We are trying to get specific information such as /detailed_analysis_final/Y5G72LB_We are trying to get specific information such as _detailed_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Y5G72LB_We are trying to get specific information such as /detailed_analysis_final/detailed_analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Y5G72LB_We are trying to get specific information such as /detailed_analysis_final/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Y5G72LB_We are trying to get specific information such as /detailed_analysis_final/page_11.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/b5eVqGg_Math formulas in Russian _e.g. on page 181__/analysis/b5eVqGg/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/b5eVqGg_Math formulas in Russian _e.g. on page 181__/analysis/b5eVqGg/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/b5eVqGg_Math formulas in Russian _e.g. on page 181__/analysis/b5eVqGg/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/b5eVqGg_Math formulas in Russian _e.g. on page 181__/analysis/b5eVqGg/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/b5eVqGg_Math formulas in Russian _e.g. on page 181__/analysis/b5eVqGg/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/b5eVqGg_Math formulas in Russian _e.g. on page 181__/analysis/b5eVqGg/page_1_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/b5eVqGg_Math formulas in Russian _e.g. on page 181__/analysis/b5eVqGg/page_1_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/b5eVqGg_Math formulas in Russian _e.g. on page 181__/analysis/b5eVqGg/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/b5eVqGg_Math formulas in Russian _e.g. on page 181__/analysis/b5eVqGg/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/b5eVqGg_Math formulas in Russian _e.g. on page 181__/b5eVqGg_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/b5eVqGg_Math formulas in Russian _e.g. on page 181__/detailed_analysis_final/b5eVqGg_Math formulas in Russian _e.g. on page 181___detailed_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/b5eVqGg_Math formulas in Russian _e.g. on page 181__/detailed_analysis_final/detailed_analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/b5eVqGg_Math formulas in Russian _e.g. on page 181__/detailed_analysis_final/page_181.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/b5eVqGg_Math formulas in Russian _e.g. on page 181__/enhanced_analysis_10/analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/b5eVqGg_Math formulas in Russian _e.g. on page 181__/enhanced_analysis_10/b5eVqGg_Math formulas in Russian _e.g. on page 181___enhanced_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/b5eVqGg_Math formulas in Russian _e.g. on page 181__/enhanced_analysis_10/page_181.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4N7q_election results data table/analysis/eqQ4N7q/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4N7q_election results data table/analysis/eqQ4N7q/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4N7q_election results data table/analysis/eqQ4N7q/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4N7q_election results data table/analysis/eqQ4N7q/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4N7q_election results data table/analysis/eqQ4N7q/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4N7q_election results data table/analysis/eqQ4N7q/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4N7q_election results data table/analysis/eqQ4N7q/page_1_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4N7q_election results data table/analysis/eqQ4N7q/page_1_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4N7q_election results data table/analysis/eqQ4N7q/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4N7q_election results data table/analysis/eqQ4N7q/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4N7q_election results data table/detailed_analysis_final/detailed_analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4N7q_election results data table/detailed_analysis_final/eqQ4N7q_election results data table_detailed_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4N7q_election results data table/detailed_analysis_final/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4N7q_election results data table/eqQ4N7q_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4NoQ_data table/analysis/eqQ4NoQ/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4NoQ_data table/analysis/eqQ4NoQ/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4NoQ_data table/analysis/eqQ4NoQ/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4NoQ_data table/analysis/eqQ4NoQ/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4NoQ_data table/analysis/eqQ4NoQ/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4NoQ_data table/analysis/eqQ4NoQ/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4NoQ_data table/analysis/eqQ4NoQ/page_1_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4NoQ_data table/analysis/eqQ4NoQ/page_1_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4NoQ_data table/analysis/eqQ4NoQ/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4NoQ_data table/analysis/eqQ4NoQ/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4NoQ_data table/detailed_analysis_final/detailed_analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4NoQ_data table/detailed_analysis_final/eqQ4NoQ_data table_detailed_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4NoQ_data table/detailed_analysis_final/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqQ4NoQ_data table/eqQ4NoQ_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZ5yq_The long table _Annex 6_ spanning across pages fro/analysis/eqrZ5yq/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZ5yq_The long table _Annex 6_ spanning across pages fro/analysis/eqrZ5yq/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZ5yq_The long table _Annex 6_ spanning across pages fro/analysis/eqrZ5yq/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZ5yq_The long table _Annex 6_ spanning across pages fro/analysis/eqrZ5yq/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZ5yq_The long table _Annex 6_ spanning across pages fro/analysis/eqrZ5yq/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZ5yq_The long table _Annex 6_ spanning across pages fro/analysis/eqrZ5yq/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZ5yq_The long table _Annex 6_ spanning across pages fro/analysis/eqrZ5yq/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZ5yq_The long table _Annex 6_ spanning across pages fro/analysis/eqrZ5yq/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZ5yq_The long table _Annex 6_ spanning across pages fro/enhanced_analysis/enhanced_analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZ5yq_The long table _Annex 6_ spanning across pages fro/enhanced_analysis/eqrZ5yq_enhanced_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZ5yq_The long table _Annex 6_ spanning across pages fro/enhanced_analysis/page_89.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZ5yq_The long table _Annex 6_ spanning across pages fro/enhanced_analysis/page_90.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZ5yq_The long table _Annex 6_ spanning across pages fro/enhanced_analysis/page_91.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZ5yq_The long table _Annex 6_ spanning across pages fro/enhanced_analysis/page_92.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZ5yq_The long table _Annex 6_ spanning across pages fro/eqrZ5yq_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZZbq_The categorize chart _E1_ on page 4_ The chart_tab/analysis/eqrZZbq/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZZbq_The categorize chart _E1_ on page 4_ The chart_tab/analysis/eqrZZbq/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZZbq_The categorize chart _E1_ on page 4_ The chart_tab/analysis/eqrZZbq/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZZbq_The categorize chart _E1_ on page 4_ The chart_tab/analysis/eqrZZbq/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZZbq_The categorize chart _E1_ on page 4_ The chart_tab/analysis/eqrZZbq/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZZbq_The categorize chart _E1_ on page 4_ The chart_tab/analysis/eqrZZbq/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZZbq_The categorize chart _E1_ on page 4_ The chart_tab/analysis/eqrZZbq/page_1_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZZbq_The categorize chart _E1_ on page 4_ The chart_tab/analysis/eqrZZbq/page_1_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZZbq_The categorize chart _E1_ on page 4_ The chart_tab/analysis/eqrZZbq/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZZbq_The categorize chart _E1_ on page 4_ The chart_tab/analysis/eqrZZbq/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZZbq_The categorize chart _E1_ on page 4_ The chart_tab/enhanced_analysis_10/analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZZbq_The categorize chart _E1_ on page 4_ The chart_tab/enhanced_analysis_10/eqrZZbq_The categorize chart _E1_ on page 4_ The chart_tab_enhanced_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZZbq_The categorize chart _E1_ on page 4_ The chart_tab/enhanced_analysis_10/page_4.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/eqrZZbq_The categorize chart _E1_ on page 4_ The chart_tab/eqrZZbq_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ja6EqV1_A spreadsheet of use of force records__/analysis/ja6EqV1/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ja6EqV1_A spreadsheet of use of force records__/analysis/ja6EqV1/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ja6EqV1_A spreadsheet of use of force records__/analysis/ja6EqV1/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ja6EqV1_A spreadsheet of use of force records__/analysis/ja6EqV1/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ja6EqV1_A spreadsheet of use of force records__/analysis/ja6EqV1/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ja6EqV1_A spreadsheet of use of force records__/analysis/ja6EqV1/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ja6EqV1_A spreadsheet of use of force records__/ja6EqV1_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODDK6_The text in Ethiopian./analysis/lbODDK6/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODDK6_The text in Ethiopian./analysis/lbODDK6/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODDK6_The text in Ethiopian./analysis/lbODDK6/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODDK6_The text in Ethiopian./analysis/lbODDK6/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODDK6_The text in Ethiopian./analysis/lbODDK6/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODDK6_The text in Ethiopian./analysis/lbODDK6/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODDK6_The text in Ethiopian./analysis/lbODDK6/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODDK6_The text in Ethiopian./analysis/lbODDK6/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODDK6_The text in Ethiopian./detailed_analysis_final/detailed_analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODDK6_The text in Ethiopian./detailed_analysis_final/lbODDK6_The text in Ethiopian._detailed_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODDK6_The text in Ethiopian./detailed_analysis_final/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODDK6_The text in Ethiopian./detailed_analysis_final/page_32.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODDK6_The text in Ethiopian./lbODDK6_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODqev_Large wide tables in Serbian _from page 63 and on_/analysis/lbODqev/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODqev_Large wide tables in Serbian _from page 63 and on_/analysis/lbODqev/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODqev_Large wide tables in Serbian _from page 63 and on_/analysis/lbODqev/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODqev_Large wide tables in Serbian _from page 63 and on_/analysis/lbODqev/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODqev_Large wide tables in Serbian _from page 63 and on_/analysis/lbODqev/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODqev_Large wide tables in Serbian _from page 63 and on_/analysis/lbODqev/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODqev_Large wide tables in Serbian _from page 63 and on_/analysis/lbODqev/page_1_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODqev_Large wide tables in Serbian _from page 63 and on_/analysis/lbODqev/page_1_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODqev_Large wide tables in Serbian _from page 63 and on_/analysis/lbODqev/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODqev_Large wide tables in Serbian _from page 63 and on_/analysis/lbODqev/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODqev_Large wide tables in Serbian _from page 63 and on_/detailed_analysis_final/detailed_analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODqev_Large wide tables in Serbian _from page 63 and on_/detailed_analysis_final/lbODqev_Large wide tables in Serbian _from page 63 and on__detailed_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODqev_Large wide tables in Serbian _from page 63 and on_/detailed_analysis_final/page_63.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODqev_Large wide tables in Serbian _from page 63 and on_/enhanced_analysis_10/analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODqev_Large wide tables in Serbian _from page 63 and on_/enhanced_analysis_10/lbODqev_Large wide tables in Serbian _from page 63 and on__enhanced_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODqev_Large wide tables in Serbian _from page 63 and on_/enhanced_analysis_10/page_63.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODqev_Large wide tables in Serbian _from page 63 and on_/enhanced_analysis_10/page_64.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODqev_Large wide tables in Serbian _from page 63 and on_/enhanced_analysis_10/page_65.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/lbODqev_Large wide tables in Serbian _from page 63 and on_/lbODqev_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR1XQb_Animal-related 911 calls and their descriptions fo/analysis/obR1XQb/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR1XQb_Animal-related 911 calls and their descriptions fo/analysis/obR1XQb/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR1XQb_Animal-related 911 calls and their descriptions fo/analysis/obR1XQb/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR1XQb_Animal-related 911 calls and their descriptions fo/analysis/obR1XQb/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR1XQb_Animal-related 911 calls and their descriptions fo/analysis/obR1XQb/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR1XQb_Animal-related 911 calls and their descriptions fo/analysis/obR1XQb/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR1XQb_Animal-related 911 calls and their descriptions fo/analysis/obR1XQb/page_1_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR1XQb_Animal-related 911 calls and their descriptions fo/analysis/obR1XQb/page_1_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR1XQb_Animal-related 911 calls and their descriptions fo/analysis/obR1XQb/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR1XQb_Animal-related 911 calls and their descriptions fo/analysis/obR1XQb/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR1XQb_Animal-related 911 calls and their descriptions fo/obR1XQb_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR6Dxb_Large table that spans across pages in Serbian _e./analysis/obR6Dxb/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR6Dxb_Large table that spans across pages in Serbian _e./analysis/obR6Dxb/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR6Dxb_Large table that spans across pages in Serbian _e./analysis/obR6Dxb/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR6Dxb_Large table that spans across pages in Serbian _e./analysis/obR6Dxb/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR6Dxb_Large table that spans across pages in Serbian _e./analysis/obR6Dxb/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR6Dxb_Large table that spans across pages in Serbian _e./analysis/obR6Dxb/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR6Dxb_Large table that spans across pages in Serbian _e./analysis/obR6Dxb/page_1_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR6Dxb_Large table that spans across pages in Serbian _e./analysis/obR6Dxb/page_1_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR6Dxb_Large table that spans across pages in Serbian _e./analysis/obR6Dxb/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR6Dxb_Large table that spans across pages in Serbian _e./analysis/obR6Dxb/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR6Dxb_Large table that spans across pages in Serbian _e./detailed_analysis_final/detailed_analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR6Dxb_Large table that spans across pages in Serbian _e./detailed_analysis_final/obR6Dxb_Large table that spans across pages in Serbian _e._detailed_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR6Dxb_Large table that spans across pages in Serbian _e./detailed_analysis_final/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR6Dxb_Large table that spans across pages in Serbian _e./detailed_analysis_final/page_60.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR6Dxb_Large table that spans across pages in Serbian _e./enhanced_analysis_10/analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR6Dxb_Large table that spans across pages in Serbian _e./enhanced_analysis_10/obR6Dxb_Large table that spans across pages in Serbian _e._enhanced_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR6Dxb_Large table that spans across pages in Serbian _e./enhanced_analysis_10/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR6Dxb_Large table that spans across pages in Serbian _e./enhanced_analysis_10/page_2.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR6Dxb_Large table that spans across pages in Serbian _e./enhanced_analysis_10/page_3.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obR6Dxb_Large table that spans across pages in Serbian _e./obR6Dxb_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/analysis/obe1Vq5/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/analysis/obe1Vq5/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/analysis/obe1Vq5/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/analysis/obe1Vq5/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/analysis/obe1Vq5/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/analysis/obe1Vq5/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/analysis/obe1Vq5/page_1_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/analysis/obe1Vq5/page_1_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/analysis/obe1Vq5/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/analysis/obe1Vq5/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_1_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_1_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_2.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_2_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_2_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_2_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_2_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_2_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_2_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_2_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_2_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_3.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_3_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_3_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_3_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_3_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_3_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_3_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_3_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_3_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_4.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_4_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_4_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_4_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_4_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_4_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_4_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_4_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_4_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_5.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_5_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_5_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_5_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_5_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_5_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis/obe1Vq5/page_5_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis_final/detailed_analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis_final/obe1Vq5_MARKED UP text -- underline and strikethu__for bon_detailed_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/detailed_analysis_final/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/enhanced_analysis_10/analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/enhanced_analysis_10/obe1Vq5_MARKED UP text -- underline and strikethu__for bon_enhanced_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/enhanced_analysis_10/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obe1Vq5_MARKED UP text -- underline and strikethu__for bon/obe1Vq5_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obeW0bN_The data table/analysis/obeW0bN/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obeW0bN_The data table/analysis/obeW0bN/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obeW0bN_The data table/analysis/obeW0bN/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obeW0bN_The data table/analysis/obeW0bN/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obeW0bN_The data table/analysis/obeW0bN/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obeW0bN_The data table/analysis/obeW0bN/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obeW0bN_The data table/analysis/obeW0bN/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obeW0bN_The data table/analysis/obeW0bN/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/obeW0bN_The data table/obeW0bN_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ober4db_The graph and table on page 180 and 181/analysis/ober4db/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ober4db_The graph and table on page 180 and 181/analysis/ober4db/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ober4db_The graph and table on page 180 and 181/analysis/ober4db/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ober4db_The graph and table on page 180 and 181/analysis/ober4db/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ober4db_The graph and table on page 180 and 181/analysis/ober4db/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ober4db_The graph and table on page 180 and 181/analysis/ober4db/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ober4db_The graph and table on page 180 and 181/analysis/ober4db/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ober4db_The graph and table on page 180 and 181/analysis/ober4db/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ober4db_The graph and table on page 180 and 181/enhanced_analysis_10/analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ober4db_The graph and table on page 180 and 181/enhanced_analysis_10/ober4db_The graph and table on page 180 and 181_enhanced_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ober4db_The graph and table on page 180 and 181/enhanced_analysis_10/page_180.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ober4db_The graph and table on page 180 and 181/enhanced_analysis_10/page_181.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/ober4db_The graph and table on page 180 and 181/ober4db_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/oberryX_The survery question table_ such as the one on pag/analysis/oberryX/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/oberryX_The survery question table_ such as the one on pag/analysis/oberryX/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/oberryX_The survery question table_ such as the one on pag/analysis/oberryX/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/oberryX_The survery question table_ such as the one on pag/analysis/oberryX/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/oberryX_The survery question table_ such as the one on pag/analysis/oberryX/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/oberryX_The survery question table_ such as the one on pag/analysis/oberryX/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/oberryX_The survery question table_ such as the one on pag/analysis/oberryX/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/oberryX_The survery question table_ such as the one on pag/analysis/oberryX/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/oberryX_The survery question table_ such as the one on pag/enhanced_analysis_10/analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/oberryX_The survery question table_ such as the one on pag/enhanced_analysis_10/oberryX_The survery question table_ such as the one on pag_enhanced_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/oberryX_The survery question table_ such as the one on pag/enhanced_analysis_10/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/oberryX_The survery question table_ such as the one on pag/oberryX_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/pbDb4PP_This PDF is titled _Creating a Regional Circulatin/analysis/pbDb4PP/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/pbDb4PP_This PDF is titled _Creating a Regional Circulatin/analysis/pbDb4PP/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/pbDb4PP_This PDF is titled _Creating a Regional Circulatin/analysis/pbDb4PP/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/pbDb4PP_This PDF is titled _Creating a Regional Circulatin/analysis/pbDb4PP/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/pbDb4PP_This PDF is titled _Creating a Regional Circulatin/analysis/pbDb4PP/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/pbDb4PP_This PDF is titled _Creating a Regional Circulatin/analysis/pbDb4PP/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/pbDb4PP_This PDF is titled _Creating a Regional Circulatin/analysis/pbDb4PP/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/pbDb4PP_This PDF is titled _Creating a Regional Circulatin/analysis/pbDb4PP/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/pbDb4PP_This PDF is titled _Creating a Regional Circulatin/pbDb4PP_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/q4DXYk8_The disciplinary log table/analysis/q4DXYk8/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/q4DXYk8_The disciplinary log table/analysis/q4DXYk8/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/q4DXYk8_The disciplinary log table/analysis/q4DXYk8/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/q4DXYk8_The disciplinary log table/analysis/q4DXYk8/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/q4DXYk8_The disciplinary log table/analysis/q4DXYk8/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/q4DXYk8_The disciplinary log table/analysis/q4DXYk8/page_1_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/q4DXYk8_The disciplinary log table/analysis/q4DXYk8/page_1_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/q4DXYk8_The disciplinary log table/analysis/q4DXYk8/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/q4DXYk8_The disciplinary log table/analysis/q4DXYk8/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/q4DXYk8_The disciplinary log table/detailed_analysis_final/detailed_analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/q4DXYk8_The disciplinary log table/detailed_analysis_final/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/q4DXYk8_The disciplinary log table/detailed_analysis_final/q4DXYk8_The disciplinary log table_detailed_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/q4DXYk8_The disciplinary log table/q4DXYk8_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/zxyRByM_Tables_ Have never managed to get other python lib/analysis/zxyRByM/analysis_summary.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/zxyRByM_Tables_ Have never managed to get other python lib/analysis/zxyRByM/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/zxyRByM_Tables_ Have never managed to get other python lib/analysis/zxyRByM/page_1_all_elements_inspect.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/zxyRByM_Tables_ Have never managed to get other python lib/analysis/zxyRByM/page_1_all_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/zxyRByM_Tables_ Have never managed to get other python lib/analysis/zxyRByM/page_1_describe.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/zxyRByM_Tables_ Have never managed to get other python lib/analysis/zxyRByM/page_1_table.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/zxyRByM_Tables_ Have never managed to get other python lib/analysis/zxyRByM/page_1_tatr_layout.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/zxyRByM_Tables_ Have never managed to get other python lib/analysis/zxyRByM/page_1_tatr_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/zxyRByM_Tables_ Have never managed to get other python lib/analysis/zxyRByM/page_1_text.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/zxyRByM_Tables_ Have never managed to get other python lib/analysis/zxyRByM/page_1_yolo_regions.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/zxyRByM_Tables_ Have never managed to get other python lib/detailed_analysis_final/detailed_analysis_results.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/zxyRByM_Tables_ Have never managed to get other python lib/detailed_analysis_final/page_1.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/zxyRByM_Tables_ Have never managed to get other python lib/detailed_analysis_final/page_6.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/zxyRByM_Tables_ Have never managed to get other python lib/detailed_analysis_final/zxyRByM_Tables_ Have never managed to get other python lib_detailed_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/zxyRByM_Tables_ Have never managed to get other python lib/zxyRByM_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/check_run_md.sh +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/api/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/assets/favicon.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/assets/favicon.svg +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/assets/javascripts/custom.js +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/assets/logo.svg +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/assets/sample-screen.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/assets/social-preview.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/assets/social-preview.svg +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/assets/stylesheets/custom.css +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/categorizing-documents/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/data-extraction/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/describe/index.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/describe/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/document-qa/index.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/document-qa/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/element-selection/index.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/element-selection/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/extracting-clean-text/index.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/extracting-clean-text/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/finetuning/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/fix-messy-tables/index.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/fix-messy-tables/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/fix-messy-tables/table_1.csv +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/fix-messy-tables/table_2.csv +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/fix-messy-tables/table_3.csv +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/installation/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/interactive-widget/index.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/interactive-widget/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/layout-analysis/index.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/layout-analysis/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/loops-and-groups/index.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/loops-and-groups/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/ocr/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/ocr-tool/css/style.css +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/ocr-tool/index.html +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/ocr-tool/js/app.js +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/ocr-tool/js/vendor/FileSaver.min.js +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/ocr-tool/js/vendor/babel.min.js +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/ocr-tool/js/vendor/hooks.umd.js +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/ocr-tool/js/vendor/htm-preact.umd.min.js +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/ocr-tool/js/vendor/htm.umd.min.js +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/ocr-tool/js/vendor/jszip.min.js +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/ocr-tool/js/vendor/preact.umd.min.js +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/ocr-tool/js/vendor/react-dom.development.js +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/ocr-tool/js/vendor/react.development.js +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/ocr-tool/words.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/pdf-navigation/index.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/pdf-navigation/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/process-forms-and-invoices/extracted_form_data.csv +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/process-forms-and-invoices/index.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/process-forms-and-invoices/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/quick-reference/index.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/quick-reference/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/reflowing-pages/index.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/reflowing-pages/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/regions/index.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/regions/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tables/index.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tables/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/text-analysis/index.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/text-analysis/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/text-extraction/index.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/01-loading-and-extraction.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/01-loading-and-extraction.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/02-finding-elements.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/02-finding-elements.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/03-extracting-blocks.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/03-extracting-blocks.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/04-table-extraction.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/04-table-extraction.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/05-excluding-content.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/05-excluding-content.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/06-document-qa.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/06-document-qa.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/07-layout-analysis.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/07-layout-analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/07-working-with-regions.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/07-working-with-regions.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/08-spatial-navigation.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/08-spatial-navigation.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/09-section-extraction.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/09-section-extraction.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/10-form-field-extraction.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/10-form-field-extraction.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/11-enhanced-table-processing.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/11-enhanced-table-processing.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/12-ocr-integration.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/12-ocr-integration.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/13-semantic-search.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/13-semantic-search.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/14-categorizing-documents.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/tutorials/14-categorizing-documents.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/visual-debugging/index.ipynb +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/visual-debugging/index.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/docs/visual-debugging/region.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/mkdocs.yml +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/__init__.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/analyzers/__init__.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/analyzers/guides.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/analyzers/layout/__init__.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/analyzers/layout/base.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/analyzers/layout/docling.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/analyzers/layout/gemini.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/analyzers/layout/layout_analyzer.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/analyzers/layout/layout_manager.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/analyzers/layout/layout_options.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/analyzers/layout/paddle.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/analyzers/layout/pdfplumber_table_finder.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/analyzers/layout/surya.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/analyzers/layout/table_structure_utils.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/analyzers/layout/tatr.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/analyzers/layout/yolo.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/analyzers/shape_detection_mixin.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/analyzers/text_options.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/analyzers/text_structure.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/analyzers/utils.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/classification/manager.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/classification/mixin.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/classification/results.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/cli.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/collections/mixins.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/collections/pdf_collection.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/core/__init__.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/core/highlighting_service.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/describe/__init__.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/describe/base.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/describe/elements.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/describe/mixin.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/describe/summary.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/elements/__init__.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/elements/base.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/elements/collections.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/elements/image.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/elements/line.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/elements/rect.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/elements/text.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/export/mixin.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/exporters/__init__.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/exporters/base.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/exporters/data/__init__.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/exporters/data/pdf.ttf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/exporters/data/sRGB.icc +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/exporters/hocr.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/exporters/hocr_font.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/exporters/original_pdf.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/exporters/paddleocr.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/exporters/searchable_pdf.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/extraction/manager.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/extraction/mixin.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/extraction/result.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/flows/__init__.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/flows/collections.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/flows/element.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/flows/flow.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/flows/region.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/ocr/__init__.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/ocr/engine.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/ocr/engine_doctr.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/ocr/engine_easyocr.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/ocr/engine_paddle.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/ocr/engine_surya.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/ocr/ocr_factory.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/ocr/ocr_manager.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/ocr/ocr_options.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/ocr/utils.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/qa/__init__.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/qa/document_qa.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/qa/qa_result.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/search/__init__.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/search/lancedb_search_service.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/search/numpy_search_service.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/search/search_options.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/search/search_service_protocol.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/search/searchable_mixin.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/selectors/__init__.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/selectors/parser.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/tables/__init__.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/tables/result.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/templates/__init__.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/templates/finetune/fine_tune_paddleocr.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/templates/spa/css/style.css +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/templates/spa/index.html +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/templates/spa/js/app.js +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/templates/spa/words.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/utils/__init__.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/utils/bidi_mirror.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/utils/debug.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/utils/highlighting.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/utils/identifiers.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/utils/locks.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/utils/packaging.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/utils/reading_order.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/utils/text_extraction.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/utils/visualization.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/widgets/__init__.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf/widgets/viewer.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf.egg-info/dependency_links.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf.egg-info/entry_points.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf.egg-info/requires.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/natural_pdf.egg-info/top_level.txt +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/noxfile.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/optimization/memory_comparison.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/optimization/pdf_analyzer.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/optimization/performance_analysis.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/optimization/performance_results/image_heavy_snapshots.csv +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/optimization/performance_results/image_heavy_snapshots.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/optimization/performance_results/text_heavy_snapshots.csv +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/optimization/performance_results/text_heavy_snapshots.json +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/optimization/test_cleanup_methods.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/optimization/test_memory_fix.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/.gitkeep +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/01-practice.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/0500000US42001.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/0500000US42007.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/1107231007033739008.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/2014 Statistics.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/2019 Statistics.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/30.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/Atlanta_Public_Schools_GA_sample.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/July 2023 N4 Temp Logs.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/anexo_edital_6604_1743480-table.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/appendix_fy2026.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/arabic.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/cia-doc.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/geometry.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/hebrew-table.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/image.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/image.png.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/multi-page-table.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/multicolumn.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/needs-ocr.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/red.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/shapes-and-text.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/tiny-ocr-2.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/tiny-ocr-3.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/tiny-ocr-small.jpg +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/tiny-ocr-wide.jpg +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/tiny-ocr.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/tiny-text-tables.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/tiny.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/types-of-type.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pdfs/word-counter.pdf +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/publish.sh +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/pyproject.toml +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/sample-screen.png +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/setup.cfg +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/test_install.sh +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tests/conftest.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tests/exporters/test_paddleocr_exporter.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tests/test_arabic_performance.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tests/test_arabic_real_world.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tests/test_core/test_containment_geometry.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tests/test_core/test_elements.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tests/test_core/test_loading.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tests/test_core/test_spatial.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tests/test_core/test_text_extraction.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tests/test_guides.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tests/test_guides_integration.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tests/test_highlight_detection.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tests/test_loading_original.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tests/test_optional_deps.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tests/test_strikethrough_detection.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tests/test_tiny_text_tables.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tests/test_tiny_text_tables_table.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tests/test_tutorials.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tests/test_underline_detection.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/todo/bad_pdf_analysis.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/todo/evaluation.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tools/bad_pdf_eval/LLM_NaturalPDF_CheatSheet.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tools/bad_pdf_eval/LLM_NaturalPDF_Workflows.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tools/bad_pdf_eval/README.md +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tools/bad_pdf_eval/__init__.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tools/bad_pdf_eval/analyser.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tools/bad_pdf_eval/collate_summaries.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tools/bad_pdf_eval/eval_suite.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tools/bad_pdf_eval/export_enrichment_csv.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tools/bad_pdf_eval/llm_enrich.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tools/bad_pdf_eval/reporter.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/tools/bad_pdf_eval/utils.py +0 -0
- {natural_pdf-0.1.32 → natural_pdf-0.1.33}/uv.lock +0 -0
@@ -146,7 +146,7 @@ class ElementManager:
|
|
146
146
|
contained in the Page class, providing better separation of concerns.
|
147
147
|
"""
|
148
148
|
|
149
|
-
def __init__(self, page, font_attrs=None):
|
149
|
+
def __init__(self, page, font_attrs=None, load_text: bool = True):
|
150
150
|
"""
|
151
151
|
Initialize the ElementManager.
|
152
152
|
|
@@ -156,9 +156,11 @@ class ElementManager:
|
|
156
156
|
Default: ['fontname', 'size', 'bold', 'italic']
|
157
157
|
None: Only consider spatial relationships
|
158
158
|
List: Custom attributes to consider
|
159
|
+
load_text: Whether to load text elements from the PDF (default: True).
|
159
160
|
"""
|
160
161
|
self._page = page
|
161
162
|
self._elements = None # Lazy-loaded
|
163
|
+
self._load_text = load_text
|
162
164
|
# Default to splitting by fontname, size, bold, italic if not specified
|
163
165
|
# Renamed internal variable for clarity
|
164
166
|
self._word_split_attributes = (
|
@@ -175,11 +177,15 @@ class ElementManager:
|
|
175
177
|
|
176
178
|
logger.debug(f"Page {self._page.number}: Loading elements...")
|
177
179
|
|
178
|
-
# 1. Prepare character dictionaries
|
179
|
-
|
180
|
-
|
181
|
-
|
182
|
-
|
180
|
+
# 1. Prepare character dictionaries only if loading text
|
181
|
+
if self._load_text:
|
182
|
+
prepared_char_dicts = self._prepare_char_dicts()
|
183
|
+
logger.debug(
|
184
|
+
f"Page {self._page.number}: Prepared {len(prepared_char_dicts)} character dictionaries."
|
185
|
+
)
|
186
|
+
else:
|
187
|
+
prepared_char_dicts = []
|
188
|
+
logger.debug(f"Page {self._page.number}: Skipping text loading (load_text=False)")
|
183
189
|
|
184
190
|
# -------------------------------------------------------------
|
185
191
|
# Detect strikethrough (horizontal strike-out lines) on raw
|
@@ -189,61 +195,75 @@ class ElementManager:
|
|
189
195
|
# belong to the same word.
|
190
196
|
# -------------------------------------------------------------
|
191
197
|
|
192
|
-
|
193
|
-
|
194
|
-
|
195
|
-
|
196
|
-
|
197
|
-
|
198
|
-
|
198
|
+
if self._load_text and prepared_char_dicts:
|
199
|
+
try:
|
200
|
+
self._mark_strikethrough_chars(prepared_char_dicts)
|
201
|
+
except Exception as strike_err: # pragma: no cover – strike detection must never crash loading
|
202
|
+
logger.warning(
|
203
|
+
f"Page {self._page.number}: Strikethrough detection failed – {strike_err}",
|
204
|
+
exc_info=True,
|
205
|
+
)
|
199
206
|
|
200
207
|
# -------------------------------------------------------------
|
201
208
|
# Detect underlines on raw characters (must come after strike so
|
202
209
|
# both attributes are present before word grouping).
|
203
210
|
# -------------------------------------------------------------
|
204
211
|
|
205
|
-
|
206
|
-
|
207
|
-
|
208
|
-
|
209
|
-
|
210
|
-
|
211
|
-
|
212
|
+
if self._load_text and prepared_char_dicts:
|
213
|
+
try:
|
214
|
+
self._mark_underline_chars(prepared_char_dicts)
|
215
|
+
except Exception as u_err: # pragma: no cover
|
216
|
+
logger.warning(
|
217
|
+
f"Page {self._page.number}: Underline detection failed – {u_err}",
|
218
|
+
exc_info=True,
|
219
|
+
)
|
212
220
|
|
213
221
|
# Detect highlights
|
214
|
-
|
215
|
-
|
216
|
-
|
217
|
-
|
218
|
-
|
219
|
-
|
220
|
-
|
222
|
+
if self._load_text and prepared_char_dicts:
|
223
|
+
try:
|
224
|
+
self._mark_highlight_chars(prepared_char_dicts)
|
225
|
+
except Exception as h_err:
|
226
|
+
logger.warning(
|
227
|
+
f"Page {self._page.number}: Highlight detection failed – {h_err}",
|
228
|
+
exc_info=True,
|
229
|
+
)
|
221
230
|
|
222
231
|
# Create a mapping from character dict to index for efficient lookup
|
223
|
-
|
224
|
-
|
225
|
-
|
226
|
-
|
227
|
-
|
228
|
-
|
229
|
-
|
230
|
-
|
232
|
+
if self._load_text:
|
233
|
+
char_to_index = {}
|
234
|
+
for idx, char_dict in enumerate(prepared_char_dicts):
|
235
|
+
key = (
|
236
|
+
char_dict.get("x0", 0),
|
237
|
+
char_dict.get("top", 0),
|
238
|
+
char_dict.get("text", ""),
|
239
|
+
)
|
240
|
+
char_to_index[key] = idx
|
241
|
+
else:
|
242
|
+
char_to_index = {}
|
231
243
|
|
232
244
|
# 2. Instantiate the custom word extractor
|
233
245
|
# Prefer page-level config over PDF-level for tolerance lookup
|
246
|
+
word_elements: List[TextElement] = []
|
247
|
+
|
248
|
+
# Get config objects (needed for auto_text_tolerance check)
|
234
249
|
page_config = getattr(self._page, "_config", {})
|
235
250
|
pdf_config = getattr(self._page._parent, "_config", {})
|
236
|
-
|
237
|
-
#
|
238
|
-
xt =
|
239
|
-
yt =
|
251
|
+
|
252
|
+
# Initialize tolerance variables
|
253
|
+
xt = None
|
254
|
+
yt = None
|
240
255
|
use_flow = pdf_config.get("use_text_flow", False)
|
256
|
+
|
257
|
+
if self._load_text and prepared_char_dicts:
|
258
|
+
# Start with any explicitly supplied tolerances (may be None)
|
259
|
+
xt = page_config.get("x_tolerance", pdf_config.get("x_tolerance"))
|
260
|
+
yt = page_config.get("y_tolerance", pdf_config.get("y_tolerance"))
|
241
261
|
|
242
262
|
# ------------------------------------------------------------------
|
243
263
|
# Auto-adaptive tolerance: scale based on median character size when
|
244
264
|
# requested and explicit values are absent.
|
245
265
|
# ------------------------------------------------------------------
|
246
|
-
if pdf_config.get("auto_text_tolerance", True):
|
266
|
+
if self._load_text and pdf_config.get("auto_text_tolerance", True):
|
247
267
|
import statistics
|
248
268
|
|
249
269
|
sizes = [c.get("size", 0) for c in prepared_char_dicts if c.get("size")]
|
@@ -323,7 +343,6 @@ class ElementManager:
|
|
323
343
|
current_line_key = line_key
|
324
344
|
lines[-1].append(char_dict)
|
325
345
|
|
326
|
-
word_elements: List[TextElement] = []
|
327
346
|
# Process each line separately with direction detection
|
328
347
|
for line_chars in lines:
|
329
348
|
if not line_chars:
|
@@ -480,7 +499,8 @@ class ElementManager:
|
|
480
499
|
except Exception:
|
481
500
|
w._obj["highlight_color"] = dominant_color
|
482
501
|
|
483
|
-
generated_words
|
502
|
+
# generated_words defaults to empty list if text loading is disabled
|
503
|
+
generated_words = word_elements if self._load_text else []
|
484
504
|
logger.debug(
|
485
505
|
f"Page {self._page.number}: Generated {len(generated_words)} words using NaturalWordExtractor."
|
486
506
|
)
|
@@ -101,7 +101,7 @@ class Page(ClassificationMixin, ExtractionMixin, ShapeDetectionMixin, DescribeMi
|
|
101
101
|
with improved selection, navigation, extraction, and question-answering capabilities.
|
102
102
|
"""
|
103
103
|
|
104
|
-
def __init__(self, page: "pdfplumber.page.Page", parent: "PDF", index: int, font_attrs=None):
|
104
|
+
def __init__(self, page: "pdfplumber.page.Page", parent: "PDF", index: int, font_attrs=None, load_text: bool = True):
|
105
105
|
"""
|
106
106
|
Initialize a page wrapper.
|
107
107
|
|
@@ -110,10 +110,12 @@ class Page(ClassificationMixin, ExtractionMixin, ShapeDetectionMixin, DescribeMi
|
|
110
110
|
parent: Parent PDF object
|
111
111
|
index: Index of this page in the PDF (0-based)
|
112
112
|
font_attrs: Font attributes to consider when grouping characters into words.
|
113
|
+
load_text: Whether to load text elements from the PDF (default: True).
|
113
114
|
"""
|
114
115
|
self._page = page
|
115
116
|
self._parent = parent
|
116
117
|
self._index = index
|
118
|
+
self._load_text = load_text
|
117
119
|
self._text_styles = None # Lazy-loaded text style analyzer results
|
118
120
|
self._exclusions = [] # List to store exclusion functions/regions
|
119
121
|
self._skew_angle: Optional[float] = None # Stores detected skew angle
|
@@ -136,7 +138,7 @@ class Page(ClassificationMixin, ExtractionMixin, ShapeDetectionMixin, DescribeMi
|
|
136
138
|
self._config = dict(getattr(self._parent, "_config", {}))
|
137
139
|
|
138
140
|
# Initialize ElementManager, passing font_attrs
|
139
|
-
self._element_mgr = ElementManager(self, font_attrs=font_attrs)
|
141
|
+
self._element_mgr = ElementManager(self, font_attrs=font_attrs, load_text=self._load_text)
|
140
142
|
# self._highlighter = HighlightingService(self) # REMOVED - Use property accessor
|
141
143
|
# --- NEW --- Central registry for analysis results
|
142
144
|
self.analyses: Dict[str, Any] = {}
|
@@ -2998,6 +3000,29 @@ class Page(ClassificationMixin, ExtractionMixin, ShapeDetectionMixin, DescribeMi
|
|
2998
3000
|
"""
|
2999
3001
|
return self.find_all('*').inspect(limit=limit)
|
3000
3002
|
|
3003
|
+
def remove_text_layer(self) -> "Page":
|
3004
|
+
"""
|
3005
|
+
Remove all text elements from this page.
|
3006
|
+
|
3007
|
+
This removes all text elements (words and characters) from the page,
|
3008
|
+
effectively clearing the text layer.
|
3009
|
+
|
3010
|
+
Returns:
|
3011
|
+
Self for method chaining
|
3012
|
+
"""
|
3013
|
+
logger.info(f"Page {self.number}: Removing all text elements...")
|
3014
|
+
|
3015
|
+
# Remove all words and chars from the element manager
|
3016
|
+
removed_words = len(self._element_mgr.words)
|
3017
|
+
removed_chars = len(self._element_mgr.chars)
|
3018
|
+
|
3019
|
+
# Clear the lists
|
3020
|
+
self._element_mgr._elements["words"] = []
|
3021
|
+
self._element_mgr._elements["chars"] = []
|
3022
|
+
|
3023
|
+
logger.info(f"Page {self.number}: Removed {removed_words} words and {removed_chars} characters")
|
3024
|
+
return self
|
3025
|
+
|
3001
3026
|
@property
|
3002
3027
|
def lines(self) -> List[Any]:
|
3003
3028
|
"""Get all line elements on this page."""
|
@@ -108,12 +108,13 @@ class _LazyPageList(Sequence):
|
|
108
108
|
also supported and will materialise pages on demand.
|
109
109
|
"""
|
110
110
|
|
111
|
-
def __init__(self, parent_pdf: "PDF", plumber_pdf: "pdfplumber.PDF", font_attrs=None):
|
111
|
+
def __init__(self, parent_pdf: "PDF", plumber_pdf: "pdfplumber.PDF", font_attrs=None, load_text=True):
|
112
112
|
self._parent_pdf = parent_pdf
|
113
113
|
self._plumber_pdf = plumber_pdf
|
114
114
|
self._font_attrs = font_attrs
|
115
115
|
# One slot per pdfplumber page – initially all None
|
116
116
|
self._cache: List[Optional["Page"]] = [None] * len(self._plumber_pdf.pages)
|
117
|
+
self._load_text = load_text
|
117
118
|
|
118
119
|
# Internal helper -----------------------------------------------------
|
119
120
|
def _create_page(self, index: int) -> "Page":
|
@@ -123,7 +124,7 @@ class _LazyPageList(Sequence):
|
|
123
124
|
from natural_pdf.core.page import Page
|
124
125
|
|
125
126
|
plumber_page = self._plumber_pdf.pages[index]
|
126
|
-
cached = Page(plumber_page, parent=self._parent_pdf, index=index, font_attrs=self._font_attrs)
|
127
|
+
cached = Page(plumber_page, parent=self._parent_pdf, index=index, font_attrs=self._font_attrs, load_text=self._load_text)
|
127
128
|
self._cache[index] = cached
|
128
129
|
return cached
|
129
130
|
|
@@ -170,6 +171,7 @@ class PDF(ExtractionMixin, ExportMixin, ClassificationMixin):
|
|
170
171
|
keep_spaces: bool = True,
|
171
172
|
text_tolerance: Optional[dict] = None,
|
172
173
|
auto_text_tolerance: bool = True,
|
174
|
+
text_layer: bool = True,
|
173
175
|
):
|
174
176
|
"""
|
175
177
|
Initialize the enhanced PDF object.
|
@@ -181,11 +183,14 @@ class PDF(ExtractionMixin, ExportMixin, ClassificationMixin):
|
|
181
183
|
keep_spaces: Whether to include spaces in word elements
|
182
184
|
text_tolerance: PDFplumber-style tolerance settings
|
183
185
|
auto_text_tolerance: Whether to automatically scale text tolerance
|
186
|
+
text_layer: Whether to keep the existing text layer from the PDF (default: True).
|
187
|
+
If False, removes all existing text elements during initialization.
|
184
188
|
"""
|
185
189
|
self._original_path_or_stream = path_or_url_or_stream
|
186
190
|
self._temp_file = None
|
187
191
|
self._resolved_path = None
|
188
192
|
self._is_stream = False
|
193
|
+
self._text_layer = text_layer
|
189
194
|
stream_to_open = None
|
190
195
|
|
191
196
|
if hasattr(path_or_url_or_stream, "read"): # Check if it's file-like
|
@@ -257,7 +262,7 @@ class PDF(ExtractionMixin, ExportMixin, ClassificationMixin):
|
|
257
262
|
self._manager_registry = {}
|
258
263
|
|
259
264
|
# Lazily instantiate pages only when accessed
|
260
|
-
self._pages = _LazyPageList(self, self._pdf, font_attrs=font_attrs)
|
265
|
+
self._pages = _LazyPageList(self, self._pdf, font_attrs=font_attrs, load_text=self._text_layer)
|
261
266
|
|
262
267
|
self._element_cache = {}
|
263
268
|
self._exclusions = []
|
@@ -267,6 +272,13 @@ class PDF(ExtractionMixin, ExportMixin, ClassificationMixin):
|
|
267
272
|
|
268
273
|
self._initialize_managers()
|
269
274
|
self._initialize_highlighter()
|
275
|
+
|
276
|
+
# Remove text layer if requested
|
277
|
+
if not self._text_layer:
|
278
|
+
logger.info("Removing text layer as requested (text_layer=False)")
|
279
|
+
# Text layer is not loaded when text_layer=False, so no need to remove
|
280
|
+
pass
|
281
|
+
|
270
282
|
# Analysis results accessed via self.analyses property (see below)
|
271
283
|
|
272
284
|
# --- Automatic cleanup when object is garbage-collected ---
|
@@ -1463,6 +1475,7 @@ class PDF(ExtractionMixin, ExportMixin, ClassificationMixin):
|
|
1463
1475
|
reading_order=self._reading_order,
|
1464
1476
|
font_attrs=self._font_attrs,
|
1465
1477
|
keep_spaces=self._config.get("keep_spaces", True),
|
1478
|
+
text_layer=self._text_layer,
|
1466
1479
|
)
|
1467
1480
|
return new_pdf
|
1468
1481
|
except Exception as e:
|
@@ -2282,15 +2282,28 @@ class Region(DirectionalMixin, ClassificationMixin, ExtractionMixin, ShapeDetect
|
|
2282
2282
|
if success:
|
2283
2283
|
removed_count += 1
|
2284
2284
|
|
2285
|
-
# Remove OCR elements overlapping this region
|
2285
|
+
# Remove ALL OCR elements overlapping this region
|
2286
|
+
# Remove elements with source=="ocr" (built-in OCR) or matching the source_label (previous custom OCR)
|
2286
2287
|
for word in list(self.page._element_mgr.words):
|
2287
|
-
|
2288
|
+
word_source = getattr(word, "source", "")
|
2289
|
+
# Match built-in OCR behavior: remove elements with source "ocr" exactly
|
2290
|
+
# Also remove elements with the same source_label to avoid duplicates
|
2291
|
+
if (word_source == "ocr" or word_source == source_label) and self.intersects(word):
|
2288
2292
|
_safe_remove(word)
|
2289
2293
|
|
2290
|
-
# Also
|
2291
|
-
for
|
2292
|
-
|
2293
|
-
|
2294
|
+
# Also remove char dicts if needed (matching built-in OCR)
|
2295
|
+
for char in list(self.page._element_mgr.chars):
|
2296
|
+
# char can be dict or TextElement; normalize
|
2297
|
+
char_src = char.get("source") if isinstance(char, dict) else getattr(char, "source", None)
|
2298
|
+
if char_src == "ocr" or char_src == source_label:
|
2299
|
+
# Rough bbox for dicts
|
2300
|
+
if isinstance(char, dict):
|
2301
|
+
cx0, ctop, cx1, cbottom = char.get("x0", 0), char.get("top", 0), char.get("x1", 0), char.get("bottom", 0)
|
2302
|
+
else:
|
2303
|
+
cx0, ctop, cx1, cbottom = char.x0, char.top, char.x1, char.bottom
|
2304
|
+
# Quick overlap check
|
2305
|
+
if not (cx1 < self.x0 or cx0 > self.x1 or cbottom < self.top or ctop > self.bottom):
|
2306
|
+
_safe_remove(char)
|
2294
2307
|
|
2295
2308
|
if removed_count > 0:
|
2296
2309
|
logger.info(
|
@@ -824,6 +824,7 @@ tests/test_core/test_elements.py
|
|
824
824
|
tests/test_core/test_loading.py
|
825
825
|
tests/test_core/test_spatial.py
|
826
826
|
tests/test_core/test_text_extraction.py
|
827
|
+
tests/test_core/test_text_layer.py
|
827
828
|
todo/bad_pdf_analysis.md
|
828
829
|
todo/evaluation.md
|
829
830
|
tools/bad_pdf_eval/LLM_NaturalPDF_CheatSheet.md
|
@@ -0,0 +1,125 @@
|
|
1
|
+
"""
|
2
|
+
Test text layer functionality including text_layer=False parameter and remove_text_layer() method.
|
3
|
+
"""
|
4
|
+
|
5
|
+
import pytest
|
6
|
+
from natural_pdf import PDF
|
7
|
+
|
8
|
+
|
9
|
+
def test_pdf_has_text_layer():
|
10
|
+
"""Test that pdfs/01-practice.pdf has a text layer by default."""
|
11
|
+
pdf = PDF("pdfs/01-practice.pdf")
|
12
|
+
page = pdf.pages[0]
|
13
|
+
|
14
|
+
# Check that text elements exist
|
15
|
+
assert len(page.words) > 0, "PDF should have word elements"
|
16
|
+
assert len(page.chars) > 0, "PDF should have character elements"
|
17
|
+
|
18
|
+
# Check that we can extract text
|
19
|
+
text = page.extract_text()
|
20
|
+
assert text.strip() != "", "Should be able to extract text from PDF"
|
21
|
+
assert "Jungle Health and Safety" in text, "Expected text should be in the extracted text"
|
22
|
+
|
23
|
+
pdf.close()
|
24
|
+
|
25
|
+
|
26
|
+
def test_text_layer_false_parameter():
|
27
|
+
"""Test that text_layer=False prevents loading text elements."""
|
28
|
+
pdf = PDF("pdfs/01-practice.pdf", text_layer=False)
|
29
|
+
page = pdf.pages[0]
|
30
|
+
|
31
|
+
# Check that no text elements exist
|
32
|
+
assert len(page.words) == 0, "PDF should have no word elements when text_layer=False"
|
33
|
+
assert len(page.chars) == 0, "PDF should have no character elements when text_layer=False"
|
34
|
+
|
35
|
+
# Check that extract_text returns empty
|
36
|
+
text = page.extract_text()
|
37
|
+
assert text.strip() == "", "extract_text should return empty string when text_layer=False"
|
38
|
+
|
39
|
+
# But other elements should still exist
|
40
|
+
assert len(page.rects) > 0, "Rectangle elements should still be loaded"
|
41
|
+
assert len(page.lines) >= 0, "Line elements should still be accessible"
|
42
|
+
|
43
|
+
pdf.close()
|
44
|
+
|
45
|
+
|
46
|
+
def test_remove_text_layer_method():
    """Test that remove_text_layer() removes existing text elements.

    Confirms the first page starts with words, chars and extractable text,
    calls ``page.remove_text_layer()``, then checks that words, chars and
    extracted text are empty while rectangles are still present.
    """
    pdf = PDF("pdfs/01-practice.pdf")
    try:
        page = pdf.pages[0]

        # First verify text exists
        initial_words = len(page.words)
        initial_chars = len(page.chars)
        assert initial_words > 0, "Should have words initially"
        assert initial_chars > 0, "Should have chars initially"

        # Extract text before removal
        text_before = page.extract_text()
        assert text_before.strip() != "", "Should have text before removal"

        # Remove text layer
        page.remove_text_layer()

        # Check that text elements are gone
        assert len(page.words) == 0, "Should have no words after remove_text_layer()"
        assert len(page.chars) == 0, "Should have no chars after remove_text_layer()"

        # Check that extract_text returns empty
        text_after = page.extract_text()
        assert text_after.strip() == "", "extract_text should return empty after remove_text_layer()"

        # But other elements should still exist
        assert len(page.rects) > 0, "Rectangle elements should still exist after text removal"
    finally:
        # Close the PDF even when an assertion above fails.
        pdf.close()
|
76
|
+
|
77
|
+
|
78
|
+
def test_text_layer_false_then_ocr():
    """Test that we can apply OCR to a PDF loaded with text_layer=False.

    Skipped when ``easyocr`` cannot be imported. Otherwise the first page
    must start with no words, gain words after ``apply_ocr``, and every
    resulting word must report ``source == "ocr"``.
    """
    # Skip if OCR dependencies are not available (done before opening the
    # PDF so a skip never leaves a file open).
    pytest.importorskip("easyocr")

    pdf = PDF("pdfs/01-practice.pdf", text_layer=False)
    try:
        page = pdf.pages[0]

        # Verify no text initially
        assert len(page.words) == 0, "Should have no words with text_layer=False"

        # Apply OCR
        page.apply_ocr(engine="easyocr", languages=["en"])

        # Now we should have OCR text
        assert len(page.words) > 0, "Should have words after OCR"

        # Check that all words are from OCR
        for word in page.words:
            assert word.source == "ocr", "All words should have source='ocr'"
    finally:
        # Close the PDF even when an assertion or the OCR call fails.
        pdf.close()
|
100
|
+
|
101
|
+
|
102
|
+
def test_multiple_pages_text_layer():
    """Test text_layer=False works across multiple pages.

    Iterates every page of the PDF and checks that each one has no words,
    no chars, and empty extracted text.
    """
    pdf = PDF("pdfs/01-practice.pdf", text_layer=False)
    try:
        # Check all pages have no text
        for page in pdf.pages:
            assert len(page.words) == 0, f"Page {page.number} should have no words"
            assert len(page.chars) == 0, f"Page {page.number} should have no chars"
            assert page.extract_text().strip() == "", f"Page {page.number} should extract empty text"
    finally:
        # Close the PDF even when an assertion above fails.
        pdf.close()
|
113
|
+
|
114
|
+
|
115
|
+
def test_text_layer_parameter_types():
    """Test that text_layer parameter accepts proper boolean values.

    Opens the same PDF once with ``text_layer=True`` and once with
    ``text_layer=False`` and checks the first page's word count in each case.
    """
    # Test with explicit True (default behavior)
    pdf_true = PDF("pdfs/01-practice.pdf", text_layer=True)
    try:
        assert len(pdf_true.pages[0].words) > 0, "text_layer=True should load text"
    finally:
        # Close before opening the second instance, even on failure.
        pdf_true.close()

    # Test with explicit False
    pdf_false = PDF("pdfs/01-practice.pdf", text_layer=False)
    try:
        assert len(pdf_false.pages[0].words) == 0, "text_layer=False should not load text"
    finally:
        pdf_false.close()
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{natural_pdf-0.1.32 → natural_pdf-0.1.33}/bad_pdf_analysis/Focus/page_1_all_elements_inspect.txt
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|