my-aws-helpers 3.1.0.dev1__tar.gz → 3.1.0.dev3__tar.gz
This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of my-aws-helpers might be problematic. Click here for more details.
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/PKG-INFO +1 -1
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers/bedrock.py +9 -16
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers.egg-info/PKG-INFO +1 -1
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/setup.py +1 -1
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/MANIFEST.in +0 -0
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/README.md +0 -0
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers/api.py +0 -0
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers/auth.py +0 -0
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers/cognito.py +0 -0
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers/dynamo.py +0 -0
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers/errors.py +0 -0
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers/event.py +0 -0
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers/logging.py +0 -0
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers/prompts/__init__.py +0 -0
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers/prompts/markdown_system_prompt.txt +0 -0
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers/prompts/transactions_headers_prompt.txt +0 -0
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers/prompts/transactions_headers_prompt_v2.txt +0 -0
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers/prompts/transactions_prompt.txt +0 -0
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers/s3.py +0 -0
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers/sfn.py +0 -0
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers.egg-info/SOURCES.txt +0 -0
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers.egg-info/dependency_links.txt +0 -0
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers.egg-info/requires.txt +0 -0
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers.egg-info/top_level.txt +0 -0
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers.egg-info/zip-safe +0 -0
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/setup.cfg +0 -0
- {my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/tests/test_event.py +0 -0
|
@@ -146,26 +146,19 @@ class Bedrock:
|
|
|
146
146
|
def _parallel_ocr(
|
|
147
147
|
self,
|
|
148
148
|
image_bytes_list: List[bytes],
|
|
149
|
-
|
|
149
|
+
prompt: str,
|
|
150
150
|
max_workers: int = 10,
|
|
151
151
|
):
|
|
152
|
-
|
|
153
|
-
prompt = self._get_prompt(prompt_type=prompt_type)
|
|
152
|
+
execution_futures = []
|
|
154
153
|
with concurrent.futures.ThreadPoolExecutor(max_workers=max_workers) as executor:
|
|
155
154
|
for i, img in enumerate(image_bytes_list):
|
|
156
155
|
self.logger.info(f"Starting OCR for page: {i}")
|
|
157
|
-
time.sleep(self.sleep_time)
|
|
158
|
-
|
|
159
|
-
|
|
160
|
-
|
|
161
|
-
|
|
162
|
-
|
|
163
|
-
)
|
|
164
|
-
}
|
|
165
|
-
for future in concurrent.futures.as_completed(execution_futures):
|
|
166
|
-
result = future.result()
|
|
167
|
-
if result:
|
|
168
|
-
results.append(result)
|
|
156
|
+
time.sleep(self.sleep_time) # Stagger start time
|
|
157
|
+
future = executor.submit(self._ocr, prompt=prompt, image_bytes=img)
|
|
158
|
+
execution_futures.append(future)
|
|
159
|
+
|
|
160
|
+
# Wait for all tasks and collect results in order of submission
|
|
161
|
+
results = [future.result() for future in execution_futures if future.result() is not None]
|
|
169
162
|
return results
|
|
170
163
|
|
|
171
164
|
def get_ocr_result(
|
|
@@ -208,7 +201,7 @@ class Bedrock:
|
|
|
208
201
|
self.logger.info("Got Prompt")
|
|
209
202
|
results = list()
|
|
210
203
|
|
|
211
|
-
results = self._parallel_ocr(image_bytes_list=image_bytes_list)
|
|
204
|
+
results = self._parallel_ocr(image_bytes_list=image_bytes_list, prompt=transactions_prompt)
|
|
212
205
|
|
|
213
206
|
# for i, image_bytes in enumerate(image_bytes_list):
|
|
214
207
|
# self.logger.info(f"Starting OCR for page: {i}")
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers.egg-info/dependency_links.txt
RENAMED
|
File without changes
|
{my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers.egg-info/requires.txt
RENAMED
|
File without changes
|
{my_aws_helpers-3.1.0.dev1 → my_aws_helpers-3.1.0.dev3}/my_aws_helpers.egg-info/top_level.txt
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|