pembot 0.0.4__tar.gz → 0.0.5__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of pembot might be problematic. Click here for more details.

Files changed (139)
  1. {pembot-0.0.4 → pembot-0.0.5}/PKG-INFO +1 -1
  2. pembot-0.0.5/pembot/.git/COMMIT_EDITMSG +1 -0
  3. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/index +0 -0
  4. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/logs/HEAD +1 -0
  5. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/logs/refs/heads/main +1 -0
  6. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/logs/refs/remotes/origin/main +1 -0
  7. pembot-0.0.5/pembot/.git/objects/0b/db4169fc0f312b8698f1df17a258fff163aeaa +0 -0
  8. pembot-0.0.5/pembot/.git/objects/1f/83a471c8119f7794d98c049170a5d7d07a4b71 +0 -0
  9. pembot-0.0.5/pembot/.git/objects/41/cbeb6bcb4c6fa9ef9be571082d95ecb4ea0ee3 +0 -0
  10. pembot-0.0.5/pembot/.git/objects/63/1700a51c8fa97b543991f5f61bfcd1e7e1327d +0 -0
  11. pembot-0.0.5/pembot/.git/objects/ab/139d2cd4798dd8e2c565b80440b1a44b376126 +0 -0
  12. pembot-0.0.5/pembot/.git/objects/bf/068a0714e2145de83a5c004f4213b091439d0e +0 -0
  13. pembot-0.0.5/pembot/.git/objects/d0/937f7d832266337289d5ec09459f931a46fcf7 +0 -0
  14. pembot-0.0.5/pembot/.git/objects/fc/988aab7e2d46396dc595ad24345e8e77dda0e4 +0 -0
  15. pembot-0.0.5/pembot/.git/refs/heads/main +1 -0
  16. pembot-0.0.5/pembot/.git/refs/remotes/origin/main +1 -0
  17. {pembot-0.0.4 → pembot-0.0.5}/pembot/__init__.py +1 -1
  18. {pembot-0.0.4 → pembot-0.0.5}/pembot/config/config.yaml +1 -1
  19. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/extract.py +12 -3
  20. {pembot-0.0.4 → pembot-0.0.5}/pembot/query.py +15 -9
  21. pembot-0.0.4/pembot/.git/COMMIT_EDITMSG +0 -1
  22. pembot-0.0.4/pembot/.git/refs/heads/main +0 -1
  23. pembot-0.0.4/pembot/.git/refs/remotes/origin/main +0 -1
  24. {pembot-0.0.4 → pembot-0.0.5}/LICENSE +0 -0
  25. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/HEAD +0 -0
  26. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/config +0 -0
  27. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/description +0 -0
  28. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/hooks/applypatch-msg.sample +0 -0
  29. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/hooks/commit-msg.sample +0 -0
  30. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/hooks/fsmonitor-watchman.sample +0 -0
  31. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/hooks/post-update.sample +0 -0
  32. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/hooks/pre-applypatch.sample +0 -0
  33. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/hooks/pre-commit.sample +0 -0
  34. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/hooks/pre-merge-commit.sample +0 -0
  35. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/hooks/pre-push.sample +0 -0
  36. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/hooks/pre-rebase.sample +0 -0
  37. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/hooks/pre-receive.sample +0 -0
  38. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/hooks/prepare-commit-msg.sample +0 -0
  39. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/hooks/push-to-checkout.sample +0 -0
  40. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/hooks/sendemail-validate.sample +0 -0
  41. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/hooks/update.sample +0 -0
  42. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/info/exclude +0 -0
  43. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/logs/refs/remotes/origin/HEAD +0 -0
  44. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/0a/fb3a98cdc55b1434b44534ec2bf22c56cfa26c +0 -0
  45. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/0c/8d9b2690545bf1906b05cd9f18b783b3eb74f1 +0 -0
  46. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/18/28e18ab80aa64d334b26428708140e280cbc63 +0 -0
  47. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/19/f61df7dbd562d04f561288677bbf2f18f5dff7 +0 -0
  48. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/28/db0ab48059acccd7d257aa02e52e9b6b83a4a5 +0 -0
  49. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/35/97e518a8658280be9f377f78edf1dfa1f23814 +0 -0
  50. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/3d/07d3b29ff53d95de3898fb786d61732f210515 +0 -0
  51. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/3e/cf23eb95123287531d708a21d4ba88d92ccabb +0 -0
  52. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/3f/78215d7e17da726fb352fd92b3c117db9b63ba +0 -0
  53. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/3f/e072cf3cb6a9f30c3e9936e3ddf622e80270d0 +0 -0
  54. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/51/9e780574933d7627a083222bd10dd74f430904 +0 -0
  55. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/61/46a371b9c1bd9f51af273f11f986cfd1bedeba +0 -0
  56. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/64/00040794955d17c9a1fe1aaaea59f2c4822177 +0 -0
  57. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/6d/7a865a23b1cb4182f67907820104ced48b11c9 +0 -0
  58. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/72/f047cda92abcd1ddc857f6461de605f8668331 +0 -0
  59. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/73/2e98f08bc806c331b06847fc8c743f545499e5 +0 -0
  60. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/86/cdaec229f1fbebf43042266b03878944669f25 +0 -0
  61. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/87/d6df5217a4a374f8c1211a05f9bd657f72c9a7 +0 -0
  62. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/8b/5be2af9b16f290549193859c214cd9072212e8 +0 -0
  63. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/93/8f29d9b4b1ae86e39dddf9e3d115a82ddfc9b6 +0 -0
  64. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/9b/123713e30fc9e225f9ac8ff5b02f8f8cf86456 +0 -0
  65. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/ab/c6b15265171457b41e2cfdaf3b8c3994a59eb7 +0 -0
  66. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/ac/9c9018c62fa30dc142665c1b5a375f4e056880 +0 -0
  67. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/b1/1173d9b68db117437ccb9551461152e1e8a77d +0 -0
  68. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/b2/4e79ab07fe9e68781961a25ff9f1dbb1546fbb +0 -0
  69. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/b8/eea52176ffa4d88c5a9976bee26092421565d3 +0 -0
  70. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/bf/32a7e6872e5dc4025ee3df3c921ec7ade0855f +0 -0
  71. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/c0/793458db6e1bee7f79f1a504fb8ff4963f8ed3 +0 -0
  72. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/c2/443060c07101948487cfa93cc39e082e9e0f5f +0 -0
  73. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/e5/3070f2b07f45d031444b09b1b38658f3caf29e +0 -0
  74. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/e7/911a702079a6144997ea4e70f59abbe59ec2bc +0 -0
  75. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/e9/1172752e9a421ae463112d2b0506b37498c98d +0 -0
  76. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/ea/0af89e61a882c5afc2a8c281b2d96f174bfe58 +0 -0
  77. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/eb/75e1c49f1e5b79dca17ccdbec8067756523238 +0 -0
  78. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/f1/655afa1c5636c8d58969e3194bb770aefbc552 +0 -0
  79. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/f4/e991088a63def67a30a2b8bbdb4d58514abab8 +0 -0
  80. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/f8/cbb5bfd1503e66cec2c593362c60a317b6d300 +0 -0
  81. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/f9/98e1f01c2bf0a20159fc851327af05beb3ac88 +0 -0
  82. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/fa/9c9a62ec1203a5868b033ded428c2382c4e1b6 +0 -0
  83. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/fb/6c90c9ce5e0cdfbe074a3f060afc66f62eefde +0 -0
  84. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/fc/e56f1e09d09a05b9babf796fb40bece176f3a2 +0 -0
  85. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/pack/pack-d5469edc8c36e3bb1de5e0070e4d5b1eae935dd4.idx +0 -0
  86. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/pack/pack-d5469edc8c36e3bb1de5e0070e4d5b1eae935dd4.pack +0 -0
  87. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/objects/pack/pack-d5469edc8c36e3bb1de5e0070e4d5b1eae935dd4.rev +0 -0
  88. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/packed-refs +0 -0
  89. {pembot-0.0.4 → pembot-0.0.5}/pembot/.git/refs/remotes/origin/HEAD +0 -0
  90. {pembot-0.0.4 → pembot-0.0.5}/pembot/.gitignore +0 -0
  91. {pembot-0.0.4 → pembot-0.0.5}/pembot/AnyToText/__init__.py +0 -0
  92. {pembot-0.0.4 → pembot-0.0.5}/pembot/AnyToText/convertor.py +0 -0
  93. {pembot-0.0.4 → pembot-0.0.5}/pembot/LICENSE +0 -0
  94. {pembot-0.0.4 → pembot-0.0.5}/pembot/TextEmbedder/__init__.py +0 -0
  95. {pembot-0.0.4 → pembot-0.0.5}/pembot/TextEmbedder/gemini_embedder.py +0 -0
  96. {pembot-0.0.4 → pembot-0.0.5}/pembot/TextEmbedder/mongodb_embedder.py +0 -0
  97. {pembot-0.0.4 → pembot-0.0.5}/pembot/TextEmbedder/mongodb_index_creator.py +0 -0
  98. {pembot-0.0.4 → pembot-0.0.5}/pembot/TextEmbedder/vector_query.py +0 -0
  99. {pembot-0.0.4 → pembot-0.0.5}/pembot/gartner.py +0 -0
  100. {pembot-0.0.4 → pembot-0.0.5}/pembot/main.py +0 -0
  101. {pembot-0.0.4 → pembot-0.0.5}/pembot/output_structure_local.py +0 -0
  102. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/HEAD +0 -0
  103. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/config +0 -0
  104. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/description +0 -0
  105. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/hooks/applypatch-msg.sample +0 -0
  106. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/hooks/commit-msg.sample +0 -0
  107. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/hooks/fsmonitor-watchman.sample +0 -0
  108. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/hooks/post-update.sample +0 -0
  109. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/hooks/pre-applypatch.sample +0 -0
  110. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/hooks/pre-commit.sample +0 -0
  111. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/hooks/pre-merge-commit.sample +0 -0
  112. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/hooks/pre-push.sample +0 -0
  113. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/hooks/pre-rebase.sample +0 -0
  114. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/hooks/pre-receive.sample +0 -0
  115. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/hooks/prepare-commit-msg.sample +0 -0
  116. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/hooks/push-to-checkout.sample +0 -0
  117. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/hooks/sendemail-validate.sample +0 -0
  118. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/hooks/update.sample +0 -0
  119. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/index +0 -0
  120. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/info/exclude +0 -0
  121. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/logs/HEAD +0 -0
  122. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/logs/refs/heads/main +0 -0
  123. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/logs/refs/remotes/origin/HEAD +0 -0
  124. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/objects/pack/pack-d3051affdd6c31306dc53489168fc870872085d1.idx +0 -0
  125. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/objects/pack/pack-d3051affdd6c31306dc53489168fc870872085d1.pack +0 -0
  126. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/objects/pack/pack-d3051affdd6c31306dc53489168fc870872085d1.rev +0 -0
  127. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/packed-refs +0 -0
  128. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/refs/heads/main +0 -0
  129. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/.git/refs/remotes/origin/HEAD +0 -0
  130. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/LICENSE +0 -0
  131. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/README.md +0 -0
  132. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/__init__.py +0 -0
  133. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/config/config.yaml +0 -0
  134. {pembot-0.0.4 → pembot-0.0.5}/pembot/pdf2markdown/requirements.txt +0 -0
  135. {pembot-0.0.4 → pembot-0.0.5}/pembot/pem.py +0 -0
  136. {pembot-0.0.4 → pembot-0.0.5}/pembot/utils/__init__.py +0 -0
  137. {pembot-0.0.4 → pembot-0.0.5}/pembot/utils/inference_client.py +0 -0
  138. {pembot-0.0.4 → pembot-0.0.5}/pembot/utils/string_tools.py +0 -0
  139. {pembot-0.0.4 → pembot-0.0.5}/pyproject.toml +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: pembot
3
- Version: 0.0.4
3
+ Version: 0.0.5
4
4
  Summary: A Python Package to convert PEM blog content to usseful information by leveraging LLMs
5
5
  Author-email: cyto <aryan_sidhwani@protonmail.com>
6
6
  License-Expression: MIT
@@ -0,0 +1 @@
1
+ fixed the output_dir bug; fixed the excel to json function; ran some tests on convertor; incremented the version on the package; removed dependency on schema / structure, and shifted required fields to a pickle file path in the cli args;
@@ -4,3 +4,4 @@ ac9c9018c62fa30dc142665c1b5a375f4e056880 72f047cda92abcd1ddc857f6461de605f866833
4
4
  72f047cda92abcd1ddc857f6461de605f8668331 e91172752e9a421ae463112d2b0506b37498c98d cyto <silverstone965@gmail.com> 1748881846 +0530 commit: added gemini to the embedders and llms ladders; redeclared the required fields;
5
5
  e91172752e9a421ae463112d2b0506b37498c98d 0c8d9b2690545bf1906b05cd9f18b783b3eb74f1 cyto <silverstone965@gmail.com> 1749716350 +0530 commit: added a pem blog chunking module for updating from local, and, an embedding loop to embed all the blogs, with document id as the filter in the search, and the first line title as the filter in updation
6
6
  0c8d9b2690545bf1906b05cd9f18b783b3eb74f1 eb75e1c49f1e5b79dca17ccdbec8067756523238 cyto <silverstone965@gmail.com> 1750856653 +0530 commit: made arrangements for the cases when custom file bytes are to be processed to text output; handled a ollama running / crashing error
7
+ eb75e1c49f1e5b79dca17ccdbec8067756523238 0bdb4169fc0f312b8698f1df17a258fff163aeaa cyto <silverstone965@gmail.com> 1750937276 +0530 commit: fixed the output_dir bug; fixed the excel to json function; ran some tests on convertor; incremented the version on the package; removed dependency on schema / structure, and shifted required fields to a pickle file path in the cli args;
@@ -4,3 +4,4 @@ ac9c9018c62fa30dc142665c1b5a375f4e056880 72f047cda92abcd1ddc857f6461de605f866833
4
4
  72f047cda92abcd1ddc857f6461de605f8668331 e91172752e9a421ae463112d2b0506b37498c98d cyto <silverstone965@gmail.com> 1748881846 +0530 commit: added gemini to the embedders and llms ladders; redeclared the required fields;
5
5
  e91172752e9a421ae463112d2b0506b37498c98d 0c8d9b2690545bf1906b05cd9f18b783b3eb74f1 cyto <silverstone965@gmail.com> 1749716350 +0530 commit: added a pem blog chunking module for updating from local, and, an embedding loop to embed all the blogs, with document id as the filter in the search, and the first line title as the filter in updation
6
6
  0c8d9b2690545bf1906b05cd9f18b783b3eb74f1 eb75e1c49f1e5b79dca17ccdbec8067756523238 cyto <silverstone965@gmail.com> 1750856653 +0530 commit: made arrangements for the cases when custom file bytes are to be processed to text output; handled a ollama running / crashing error
7
+ eb75e1c49f1e5b79dca17ccdbec8067756523238 0bdb4169fc0f312b8698f1df17a258fff163aeaa cyto <silverstone965@gmail.com> 1750937276 +0530 commit: fixed the output_dir bug; fixed the excel to json function; ran some tests on convertor; incremented the version on the package; removed dependency on schema / structure, and shifted required fields to a pickle file path in the cli args;
@@ -3,3 +3,4 @@ ac9c9018c62fa30dc142665c1b5a375f4e056880 72f047cda92abcd1ddc857f6461de605f866833
3
3
  72f047cda92abcd1ddc857f6461de605f8668331 e91172752e9a421ae463112d2b0506b37498c98d cyto <silverstone965@gmail.com> 1748881859 +0530 update by push
4
4
  e91172752e9a421ae463112d2b0506b37498c98d 0c8d9b2690545bf1906b05cd9f18b783b3eb74f1 cyto <silverstone965@gmail.com> 1749716371 +0530 update by push
5
5
  0c8d9b2690545bf1906b05cd9f18b783b3eb74f1 eb75e1c49f1e5b79dca17ccdbec8067756523238 cyto <silverstone965@gmail.com> 1750856672 +0530 update by push
6
+ eb75e1c49f1e5b79dca17ccdbec8067756523238 0bdb4169fc0f312b8698f1df17a258fff163aeaa cyto <silverstone965@gmail.com> 1750937389 +0530 update by push
@@ -0,0 +1 @@
1
+ 0bdb4169fc0f312b8698f1df17a258fff163aeaa
@@ -0,0 +1 @@
1
+ 0bdb4169fc0f312b8698f1df17a258fff163aeaa
@@ -1,6 +1,6 @@
1
1
  """
2
2
  A Python Package to convert PEM blog content to usseful information by leveraging LLMs
3
3
  """
4
- __version__ = '0.0.4'
4
+ __version__ = '0.0.5'
5
5
  from .main import save_to_json_file, make_query
6
6
  __all__ = ["save_to_json_file", "make_query"]
@@ -2,4 +2,4 @@ OUTPUT_DIR: /home/cyto/dev/pembotdir
2
2
  PAGE_DELIMITER: ___________________________ NEXT PAGE ___________________________
3
3
  app:
4
4
  name: pembot
5
- version: 0.0.4
5
+ version: 0.0.5
@@ -24,8 +24,17 @@ import mimetypes
24
24
 
25
25
  warnings.filterwarnings("ignore")
26
26
 
27
- with open(Path("config/config.yaml").resolve(), "r", encoding="utf-8") as f:
28
- config = yaml.safe_load(f)
27
+ config= {}
28
+ try:
29
+ with open(Path("config/config.yaml").resolve(), "r", encoding="utf-8") as f:
30
+ config = yaml.safe_load(f)
31
+ except FileNotFoundError:
32
+ config= {
33
+ 'OUTPUT_DIR': '.',
34
+ 'PAGE_DELIMITER': '____NEXT PAGE____'
35
+ }
36
+ except Exception as e:
37
+ print("unhandled while opening default config in pdf2markdown: ", e)
29
38
 
30
39
 
31
40
  class PDFExtractor(ABC):
@@ -62,7 +71,7 @@ class MarkdownPDFExtractor(PDFExtractor):
62
71
 
63
72
  BULLET_POINTS = "•◦▪▫●○"
64
73
 
65
- def __init__(self, pdf_path, output_path= config["OUTPUT_DIR"], page_delimiter= config["PAGE_DELIMITER"], model_name: str | None= None):
74
+ def __init__(self, pdf_path, output_path= config.get("OUTPUT_DIR", '.'), page_delimiter= config.get("PAGE_DELIMITER", ''), model_name: str | None= None):
66
75
  super().__init__(pdf_path)
67
76
 
68
77
  if model_name is None:
@@ -97,16 +97,22 @@ def rag_query_llm(db_client, llm_client, inference_client, user_query: str, docu
97
97
  str: The generated response from the Ollama model.
98
98
  """
99
99
 
100
- models = llm_client.list()
101
- found= False
102
100
  embed_locally= False
103
-
104
- for model in models.models:
105
- # print(model.model)
106
- if model.model == model_name:
107
- found= True
108
- if model.model == embedding_model:
109
- embed_locally= True
101
+ found= False
102
+ try:
103
+ models = llm_client.list()
104
+ for model in models.models:
105
+ # print(model.model)
106
+ if model.model == model_name:
107
+ found= True
108
+ if model.model == embedding_model:
109
+ embed_locally= True
110
+ except AttributeError as ae:
111
+ print("cant find ollama", ae)
112
+ print("continuing with other models")
113
+ except Exception as e:
114
+ print("unhandled error: ", e)
115
+ raise e
110
116
 
111
117
 
112
118
 
@@ -1 +0,0 @@
1
- made arrangements for the cases when custom file bytes are to be processed to text output; handled a ollama running / crashing error
@@ -1 +0,0 @@
1
- eb75e1c49f1e5b79dca17ccdbec8067756523238
@@ -1 +0,0 @@
1
- eb75e1c49f1e5b79dca17ccdbec8067756523238
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes