fmtr.tools 1.0.33__py3-none-any.whl → 1.0.34__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of fmtr.tools might be problematic. Click here for more details.

fmtr/tools/pdf_tools.py CHANGED
@@ -97,7 +97,7 @@ class Block(data_modelling_tools.Base):
97
97
  Simple text representation
98
98
 
99
99
  """
100
- return ' '.join([span.text for span in self.spans])
100
+ return ' '.join([line.text for line in self.lines])
101
101
 
102
102
  @classmethod
103
103
  def from_dict(cls, data: Dict) -> Self:
@@ -138,7 +138,7 @@ class Document(pm.Document):
138
138
  blocks = []
139
139
 
140
140
  for page in self:
141
- for block in page.get_text("dict")["blocks"]:
141
+ for block in page.get_text("dict", flags=pm.TEXTFLAGS_TEXT | pm.TEXT_ACCURATE_BBOXES)["blocks"]:
142
142
  obj = Block.from_dict(block)
143
143
  blocks.append(obj)
144
144
 
@@ -162,11 +162,6 @@ if __name__ == '__main__':
162
162
  assert PATH_PDF.exists()
163
163
 
164
164
  doc = Document(PATH_PDF)
165
- doc.data
166
-
167
- for page in doc:
168
- print(page.get_text('dict'))
169
- print(page.get_text('html'))
170
-
165
+ data = doc.data
171
166
  md = doc.to_markdown()
172
167
  md
fmtr/tools/version CHANGED
@@ -1 +1 @@
1
- 1.0.33
1
+ 1.0.34
fmtr.tools-1.0.33.dist-info/METADATA → fmtr.tools-1.0.34.dist-info/METADATA CHANGED
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: fmtr.tools
3
- Version: 1.0.33
3
+ Version: 1.0.34
4
4
  Summary: Collection of high-level tools to simplify everyday development tasks, with a focus on AI/ML
5
5
  Home-page: https://github.com/fmtr/fmtr.tools
6
6
  Author: Frontmatter
fmtr.tools-1.0.33.dist-info/RECORD → fmtr.tools-1.0.34.dist-info/RECORD CHANGED
@@ -31,7 +31,7 @@ fmtr/tools/netrc_tools.py,sha256=PpNpz_mWlQi6VHGromKwFfTyLpHUXsd4LY6-OKLCbeI,376
31
31
  fmtr/tools/openai_tools.py,sha256=6SUgejgzUzmlKKct2_ePXntvMegu3FJgfk9x7aqtqYc,742
32
32
  fmtr/tools/parallel_tools.py,sha256=G__ZbLRRx4cP5OyqY1hKwnE-VI3m5prYABB0tnZHnes,3132
33
33
  fmtr/tools/path_tools.py,sha256=1GeWXdhV5rH99IfLI5ZFEnOJfs4Q4mYTT2R-rA791iQ,4273
34
- fmtr/tools/pdf_tools.py,sha256=3XZ6Tpvuf46oeYENsYQsYn-6hbTqHDSJesqNZeJ1Rko,3563
34
+ fmtr/tools/pdf_tools.py,sha256=mCLPJJlN2izIvSIjhJkEUZKT0GYQGmr96dPq9oIRsuo,3524
35
35
  fmtr/tools/platform_tools.py,sha256=7p69CmAHe_sF68Fx9uVhns1k5EewTHTWgUYzkl6ZQKA,308
36
36
  fmtr/tools/process_tools.py,sha256=Ysh5Dk2QFBhXQerArjKdt7xZd3JrN5Ho02AaOjH0Nnw,1425
37
37
  fmtr/tools/profiling_tools.py,sha256=jpXVjaNKPydTasEQVNXvxzGtMhXPit08AnJddkU8uIc,46
@@ -42,7 +42,7 @@ fmtr/tools/string_tools.py,sha256=U2EptMWR6KDOP22ZQ4ReUHV4i25SP7xwCmZScI1sy4M,32
42
42
  fmtr/tools/tokenization_tools.py,sha256=9FP5vgPufWv0XA961eVKObFll0d_2mM0W3ut3rtZyeo,4329
43
43
  fmtr/tools/tools.py,sha256=xnfUrOnrT4OxFYez6vV5tAhydzCICJFiGVnviiZDEQo,796
44
44
  fmtr/tools/unicode_tools.py,sha256=yS_9wpu8ogNoiIL7s1G_8bETFFO_YQlo4LNPv1NLDeY,52
45
- fmtr/tools/version,sha256=V-CY1GAptD08dwDUv8tP0IXGjOPKFQq8iTv5XUR7qhc,6
45
+ fmtr/tools/version,sha256=95PJL7GqZ_Ze5aKBt6zAx5dswp7AauJVBg2AJ6DPaFU,6
46
46
  fmtr/tools/version_tools.py,sha256=axzzHBS9V1n6YuSacsDKG3VfAvRqR8qr6aENCibR8vs,1248
47
47
  fmtr/tools/yaml_tools.py,sha256=Ol43ZwbnSXGnn1K98Uxx61KPGSqfC4axE-X2q1LKMwk,349
48
48
  fmtr/tools/tests/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -53,9 +53,9 @@ fmtr/tools/tests/test_environment.py,sha256=iHaiMQfECYZPkPKwfuIZV9uHuWe3aE-p_dN_
53
53
  fmtr/tools/tests/test_json.py,sha256=IeSP4ziPvRcmS8kq7k9tHonC9rN5YYq9GSNT2ul6Msk,287
54
54
  fmtr/tools/tests/test_path.py,sha256=AkZQa6_8BQ-VaCyL_J-iKmdf2ZaM-xFYR37Kun3k4_g,2188
55
55
  fmtr/tools/tests/test_yaml.py,sha256=jc0TwwKu9eC0LvFGNMERdgBue591xwLxYXFbtsRwXVM,287
56
- fmtr.tools-1.0.33.dist-info/LICENSE,sha256=FW9aa6vVN5IjRQWLT43hs4_koYSmpcbIovlKeAJ0_cI,10757
57
- fmtr.tools-1.0.33.dist-info/METADATA,sha256=G6ybzpAyBJfpfyoTPLQBXB6HJRrG-3lKwc84YaSI9nI,13438
58
- fmtr.tools-1.0.33.dist-info/WHEEL,sha256=oiQVh_5PnQM0E3gPdiz09WCNmwiHDMaGer_elqB3coM,92
59
- fmtr.tools-1.0.33.dist-info/entry_points.txt,sha256=CEStVkwJ1mTFvhN1WV5RdW83SkNW1d5Syj-KZ6A19ng,72
60
- fmtr.tools-1.0.33.dist-info/top_level.txt,sha256=t5341a8ii3n4RFizwTeXGmcq_pf4GqL1h9ylE5LIWRk,12
61
- fmtr.tools-1.0.33.dist-info/RECORD,,
56
+ fmtr.tools-1.0.34.dist-info/LICENSE,sha256=FW9aa6vVN5IjRQWLT43hs4_koYSmpcbIovlKeAJ0_cI,10757
57
+ fmtr.tools-1.0.34.dist-info/METADATA,sha256=n17dBm5yzzI_ktSH_1hqUxN7cXJtCSRa_Fh4Vc_vqYQ,13438
58
+ fmtr.tools-1.0.34.dist-info/WHEEL,sha256=oiQVh_5PnQM0E3gPdiz09WCNmwiHDMaGer_elqB3coM,92
59
+ fmtr.tools-1.0.34.dist-info/entry_points.txt,sha256=CEStVkwJ1mTFvhN1WV5RdW83SkNW1d5Syj-KZ6A19ng,72
60
+ fmtr.tools-1.0.34.dist-info/top_level.txt,sha256=t5341a8ii3n4RFizwTeXGmcq_pf4GqL1h9ylE5LIWRk,12
61
+ fmtr.tools-1.0.34.dist-info/RECORD,,