natural-pdf 0.1.13__tar.gz → 0.1.15__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/CLAUDE.md +1 -1
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/PKG-INFO +1 -1
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/api/index.md +1 -1
- natural_pdf-0.1.15/docs/layout-analysis/index.ipynb +897 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/layout-analysis/index.md +1 -1
- natural_pdf-0.1.15/docs/tables/index.ipynb +665 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tables/index.md +1 -1
- natural_pdf-0.1.15/docs/text-extraction/index.ipynb +1447 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/text-extraction/index.md +3 -3
- natural_pdf-0.1.15/docs/tutorials/01-loading-and-extraction.ipynb +3089 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/02-finding-elements.ipynb +67 -44
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/03-extracting-blocks.ipynb +27 -19
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/03-extracting-blocks.md +1 -1
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/04-table-extraction.ipynb +33 -25
- natural_pdf-0.1.15/docs/tutorials/05-excluding-content.ipynb +8410 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/06-document-qa.ipynb +38 -30
- natural_pdf-0.1.15/docs/tutorials/07-layout-analysis.ipynb +280 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/07-working-with-regions.ipynb +67 -59
- natural_pdf-0.1.15/docs/tutorials/08-spatial-navigation.ipynb +528 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/08-spatial-navigation.md +1 -1
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/09-section-extraction.ipynb +106 -98
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/10-form-field-extraction.ipynb +59 -51
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/11-enhanced-table-processing.ipynb +6 -6
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/12-ocr-integration.ipynb +1013 -896
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/13-semantic-search.ipynb +138 -130
- natural_pdf-0.1.15/docs/tutorials/14-categorizing-documents.ipynb +2150 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/analyzers/shape_detection_mixin.py +554 -273
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/core/page.py +127 -13
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/elements/base.py +20 -20
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/elements/region.py +167 -33
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/flows/element.py +2 -2
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf.egg-info/PKG-INFO +1 -1
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf.egg-info/SOURCES.txt +1 -0
- natural_pdf-0.1.15/pdfs/30.pdf +0 -0
- natural_pdf-0.1.13/docs/layout-analysis/index.ipynb +0 -1974
- natural_pdf-0.1.13/docs/tables/index.ipynb +0 -662
- natural_pdf-0.1.13/docs/text-extraction/index.ipynb +0 -1454
- natural_pdf-0.1.13/docs/tutorials/01-loading-and-extraction.ipynb +0 -3082
- natural_pdf-0.1.13/docs/tutorials/05-excluding-content.ipynb +0 -8402
- natural_pdf-0.1.13/docs/tutorials/07-layout-analysis.ipynb +0 -262
- natural_pdf-0.1.13/docs/tutorials/08-spatial-navigation.ipynb +0 -520
- natural_pdf-0.1.13/docs/tutorials/14-categorizing-documents.ipynb +0 -2142
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/.cursor/rules/analysis_framework.mdc +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/.cursor/rules/coding-style.mdc +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/.cursor/rules/edit-md-instead-of-ipynb.mdc +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/.cursor/rules/minimal-comments.mdc +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/.cursor/rules/natural-pdf-overview.mdc +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/.cursor/rules/user-friendly-library-code.mdc +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/.github/workflows/docs.yml +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/.gitignore +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/01-execute_notebooks.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/02-run_all_tutorials.sh +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/LICENSE +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/MANIFEST.in +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/README.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/audit_packaging.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/check_run_md.sh +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/assets/favicon.png +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/assets/favicon.svg +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/assets/javascripts/custom.js +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/assets/logo.svg +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/assets/sample-screen.png +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/assets/social-preview.png +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/assets/social-preview.svg +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/assets/stylesheets/custom.css +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/categorizing-documents/index.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/data-extraction/index.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/document-qa/index.ipynb +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/document-qa/index.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/element-selection/index.ipynb +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/element-selection/index.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/finetuning/index.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/index.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/installation/index.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/interactive-widget/index.ipynb +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/interactive-widget/index.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/loops-and-groups/index.ipynb +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/loops-and-groups/index.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/ocr/index.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/pdf-navigation/index.ipynb +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/pdf-navigation/index.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/reflowing-pages/index.ipynb +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/reflowing-pages/index.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/regions/index.ipynb +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/regions/index.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/text-analysis/index.ipynb +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/text-analysis/index.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/01-loading-and-extraction.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/02-finding-elements.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/04-table-extraction.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/05-excluding-content.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/06-document-qa.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/07-layout-analysis.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/07-working-with-regions.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/09-section-extraction.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/10-form-field-extraction.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/11-enhanced-table-processing.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/12-ocr-integration.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/13-semantic-search.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/tutorials/14-categorizing-documents.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/visual-debugging/index.ipynb +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/visual-debugging/index.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/docs/visual-debugging/region.png +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/mkdocs.yml +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/__init__.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/analyzers/__init__.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/analyzers/layout/__init__.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/analyzers/layout/base.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/analyzers/layout/docling.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/analyzers/layout/gemini.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/analyzers/layout/layout_analyzer.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/analyzers/layout/layout_manager.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/analyzers/layout/layout_options.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/analyzers/layout/paddle.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/analyzers/layout/pdfplumber_table_finder.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/analyzers/layout/surya.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/analyzers/layout/tatr.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/analyzers/layout/yolo.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/analyzers/text_options.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/analyzers/text_structure.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/analyzers/utils.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/classification/manager.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/classification/mixin.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/classification/results.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/collections/mixins.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/collections/pdf_collection.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/core/__init__.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/core/element_manager.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/core/highlighting_service.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/core/pdf.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/elements/__init__.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/elements/collections.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/elements/line.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/elements/rect.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/elements/text.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/export/mixin.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/exporters/__init__.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/exporters/base.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/exporters/data/__init__.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/exporters/data/pdf.ttf +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/exporters/data/sRGB.icc +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/exporters/hocr.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/exporters/hocr_font.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/exporters/original_pdf.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/exporters/paddleocr.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/exporters/searchable_pdf.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/extraction/manager.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/extraction/mixin.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/extraction/result.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/flows/__init__.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/flows/collections.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/flows/flow.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/flows/region.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/ocr/__init__.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/ocr/engine.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/ocr/engine_doctr.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/ocr/engine_easyocr.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/ocr/engine_paddle.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/ocr/engine_surya.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/ocr/ocr_factory.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/ocr/ocr_manager.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/ocr/ocr_options.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/ocr/utils.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/qa/__init__.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/qa/document_qa.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/search/__init__.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/search/lancedb_search_service.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/search/numpy_search_service.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/search/search_options.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/search/search_service_protocol.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/search/searchable_mixin.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/selectors/__init__.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/selectors/parser.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/templates/__init__.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/templates/finetune/fine_tune_paddleocr.md +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/templates/spa/css/style.css +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/templates/spa/index.html +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/templates/spa/js/app.js +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/templates/spa/words.txt +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/utils/__init__.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/utils/debug.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/utils/highlighting.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/utils/identifiers.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/utils/locks.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/utils/packaging.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/utils/reading_order.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/utils/text_extraction.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/utils/visualization.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/widgets/__init__.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/widgets/frontend/viewer.js +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf/widgets/viewer.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf.egg-info/dependency_links.txt +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf.egg-info/requires.txt +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/natural_pdf.egg-info/top_level.txt +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/noxfile.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/pdfs/.gitkeep +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/pdfs/01-practice.pdf +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/pdfs/0500000US42001.pdf +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/pdfs/0500000US42007.pdf +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/pdfs/2014 Statistics.pdf +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/pdfs/2019 Statistics.pdf +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/pdfs/Atlanta_Public_Schools_GA_sample.pdf +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/pdfs/anexo_edital_6604_1743480-table.pdf +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/pdfs/cia-doc.pdf +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/pdfs/geometry.pdf +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/pdfs/multicolumn.pdf +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/pdfs/needs-ocr.pdf +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/publish.sh +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/pyproject.toml +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/sample-screen.png +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/setup.cfg +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/tests/conftest.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/tests/exporters/test_paddleocr_exporter.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/tests/test_core/test_containment_geometry.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/tests/test_core/test_elements.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/tests/test_core/test_loading.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/tests/test_core/test_spatial.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/tests/test_core/test_text_extraction.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/tests/test_loading_original.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/tests/test_optional_deps.py +0 -0
- {natural_pdf-0.1.13 → natural_pdf-0.1.15}/uv.lock +0 -0
@@ -865,7 +865,7 @@ data = table.extract_table()
|
|
865
865
|
|
866
866
|
# Or explicitly specify the method to use
|
867
867
|
data_tatr = table.extract_table(method='tatr') # Uses detected table structure
|
868
|
-
data_plumber = table.extract_table(method='… [remainder of removed line truncated in extraction]
|
868
|
+
data_plumber = table.extract_table(method='pdfplumber') # Uses pdfplumber's algorithm
|
869
869
|
|
870
870
|
# Work with table components directly
|
871
871
|
rows = page.find_all('region[type=table-row][model=tatr]')
|
@@ -107,7 +107,7 @@ class Region:
|
|
107
107
|
| `save_image(path, resolution=72, crop_only=False)` | Save an image of just the region | `path`: Path to save image<br>`resolution`: Image resolution in DPI<br>`crop_only`: Whether to exclude border | `None` |
|
108
108
|
| `get_sections(start_elements, end_elements=None, boundary_inclusion='start')` | Get sections within the region | `start_elements`: Elements marking section starts<br>`end_elements`: Elements marking section ends<br>`boundary_inclusion`: How to include boundaries | `list[Region]` |
|
109
109
|
| `ask(question, min_confidence=0.0, model=None, debug=False)` | Ask a question about the region content | `question`: Question to ask<br>`min_confidence`: Minimum confidence threshold<br>`model`: Optional model name or path<br>`debug`: Whether to save debug files | `dict`: Result with answer and metadata |
|
110
|
-
| `extract_table(method=None, table_settings=None, use_ocr=False)` | Extract table data from the region | `method`: Extraction method ("… [remainder of removed line truncated in extraction]
|
110
|
+
| `extract_table(method=None, table_settings=None, use_ocr=False)` | Extract table data from the region | `method`: Extraction method ("pdfplumber", "tatr")<br>`table_settings`: Custom settings for extraction<br>`use_ocr`: Whether to use OCR text | `list`: Table data as rows and columns |
|
111
111
|
| `intersects(other)` | Check if this region intersects with another | `other`: Another region | `bool`: True if regions intersect |
|
112
112
|
| `contains(x, y)` | Check if a point is within the region | `x`: X coordinate<br>`y`: Y coordinate | `bool`: True if point is in region |
|
113
113
|
|