parsagon 0.17.0__tar.gz → 0.17.2__tar.gz

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (38)
  1. {parsagon-0.17.0 → parsagon-0.17.2}/PKG-INFO +4 -2
  2. {parsagon-0.17.0 → parsagon-0.17.2}/pyproject.toml +4 -2
  3. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/executor.py +10 -0
  4. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon.egg-info/PKG-INFO +4 -2
  5. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon.egg-info/requires.txt +3 -1
  6. {parsagon-0.17.0 → parsagon-0.17.2}/README.md +0 -0
  7. {parsagon-0.17.0 → parsagon-0.17.2}/setup.cfg +0 -0
  8. {parsagon-0.17.0 → parsagon-0.17.2}/src/__init__.py +0 -0
  9. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/__init__.py +0 -0
  10. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/api.py +0 -0
  11. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/assistant.py +0 -0
  12. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/create.py +0 -0
  13. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/custom_function.py +0 -0
  14. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/edit.py +0 -0
  15. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/exceptions.py +0 -0
  16. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/gui/__init__.py +0 -0
  17. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/gui/controller.py +0 -0
  18. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/gui/menu.py +0 -0
  19. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/gui/window.py +0 -0
  20. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/gui_entry.py +0 -0
  21. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/highlights.js +0 -0
  22. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/main.py +0 -0
  23. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/print.py +0 -0
  24. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/runs.py +0 -0
  25. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/secrets.py +0 -0
  26. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/settings.py +0 -0
  27. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/tests/__init__.py +0 -0
  28. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/tests/api_mocks.py +0 -0
  29. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/tests/conftest.py +0 -0
  30. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/tests/test_executor.py +0 -0
  31. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/tests/test_invalid_args.py +0 -0
  32. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/tests/test_pipeline_operations.py +0 -0
  33. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/tests/test_print.py +0 -0
  34. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon/tests/test_secrets.py +0 -0
  35. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon.egg-info/SOURCES.txt +0 -0
  36. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon.egg-info/dependency_links.txt +0 -0
  37. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon.egg-info/entry_points.txt +0 -0
  38. {parsagon-0.17.0 → parsagon-0.17.2}/src/parsagon.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: parsagon
3
- Version: 0.17.0
3
+ Version: 0.17.2
4
4
  Summary: Allows you to create browser automations with natural language
5
5
  Author-email: Sandy Suh <sandy@parsagon.io>
6
6
  Project-URL: Homepage, https://parsagon.io
@@ -20,7 +20,9 @@ Requires-Dist: undetected-chromedriver==3.5.5
20
20
  Requires-Dist: webdriver-manager==4.0.2
21
21
  Requires-Dist: jsonpath-ng==1.5.3
22
22
  Requires-Dist: simplejson==3.19.1
23
- Requires-Dist: pypdf==4.2.0
23
+ Requires-Dist: PyMuPDF==1.26.4
24
+ Requires-Dist: pymupdf4llm==0.0.27
25
+ Requires-Dist: pypdf==5.9.0
24
26
  Requires-Dist: python-dateutil==2.9.0.post0
25
27
  Requires-Dist: html2text==2024.2.26
26
28
  Requires-Dist: feedparser==6.0.11
@@ -16,7 +16,7 @@ line-length = 120
16
16
 
17
17
  [project]
18
18
  name = "parsagon"
19
- version = "0.17.0"
19
+ version = "0.17.2"
20
20
  description = "Allows you to create browser automations with natural language"
21
21
  readme = "README.md"
22
22
  requires-python = ">=3.8"
@@ -43,7 +43,9 @@ dependencies = [
43
43
  'webdriver-manager==4.0.2',
44
44
  'jsonpath-ng==1.5.3',
45
45
  'simplejson==3.19.1',
46
- 'pypdf==4.2.0',
46
+ 'PyMuPDF==1.26.4',
47
+ 'pymupdf4llm==0.0.27',
48
+ 'pypdf==5.9.0',
47
49
  'python-dateutil==2.9.0.post0',
48
50
  'html2text==2024.2.26',
49
51
  'feedparser==6.0.11',
@@ -16,6 +16,7 @@ import httpx
16
16
  from lxml import etree
17
17
  import lxml.html
18
18
  from lxml.html.clean import Cleaner
19
+ import pymupdf4llm
19
20
  from pypdf import PdfReader
20
21
  from pyvirtualdisplay import Display
21
22
  import undetected_chromedriver as uc
@@ -706,6 +707,15 @@ class Executor:
706
707
  os.remove(most_recent_file)
707
708
  return text
708
709
 
710
+ def get_pdf_md(self, url):
711
+ window_id = self.goto(url)
712
+ self.close_window(window_id)
713
+ files = glob.glob("*")
714
+ most_recent_file = max(files, key=os.path.getmtime)
715
+ md_text = pymupdf4llm.to_markdown(most_recent_file)
716
+ os.remove(most_recent_file)
717
+ return md_text
718
+
709
719
  def str_to_iso8601(self, s):
710
720
  while s:
711
721
  try:
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: parsagon
3
- Version: 0.17.0
3
+ Version: 0.17.2
4
4
  Summary: Allows you to create browser automations with natural language
5
5
  Author-email: Sandy Suh <sandy@parsagon.io>
6
6
  Project-URL: Homepage, https://parsagon.io
@@ -20,7 +20,9 @@ Requires-Dist: undetected-chromedriver==3.5.5
20
20
  Requires-Dist: webdriver-manager==4.0.2
21
21
  Requires-Dist: jsonpath-ng==1.5.3
22
22
  Requires-Dist: simplejson==3.19.1
23
- Requires-Dist: pypdf==4.2.0
23
+ Requires-Dist: PyMuPDF==1.26.4
24
+ Requires-Dist: pymupdf4llm==0.0.27
25
+ Requires-Dist: pypdf==5.9.0
24
26
  Requires-Dist: python-dateutil==2.9.0.post0
25
27
  Requires-Dist: html2text==2024.2.26
26
28
  Requires-Dist: feedparser==6.0.11
@@ -10,7 +10,9 @@ undetected-chromedriver==3.5.5
10
10
  webdriver-manager==4.0.2
11
11
  jsonpath-ng==1.5.3
12
12
  simplejson==3.19.1
13
- pypdf==4.2.0
13
+ PyMuPDF==1.26.4
14
+ pymupdf4llm==0.0.27
15
+ pypdf==5.9.0
14
16
  python-dateutil==2.9.0.post0
15
17
  html2text==2024.2.26
16
18
  feedparser==6.0.11
File without changes
File without changes
File without changes
File without changes