my-aws-helpers 3.1.0.dev3__tar.gz → 3.2.0__tar.gz
This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of my-aws-helpers might be problematic. Click here for more details.
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/PKG-INFO +1 -1
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers/bedrock.py +4 -0
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers/s3.py +5 -2
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers.egg-info/PKG-INFO +1 -1
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/setup.py +1 -1
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/MANIFEST.in +0 -0
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/README.md +0 -0
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers/api.py +0 -0
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers/auth.py +0 -0
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers/cognito.py +0 -0
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers/dynamo.py +0 -0
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers/errors.py +0 -0
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers/event.py +0 -0
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers/logging.py +0 -0
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers/prompts/__init__.py +0 -0
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers/prompts/markdown_system_prompt.txt +0 -0
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers/prompts/transactions_headers_prompt.txt +0 -0
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers/prompts/transactions_headers_prompt_v2.txt +0 -0
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers/prompts/transactions_prompt.txt +0 -0
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers/sfn.py +0 -0
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers.egg-info/SOURCES.txt +0 -0
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers.egg-info/dependency_links.txt +0 -0
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers.egg-info/requires.txt +0 -0
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers.egg-info/top_level.txt +0 -0
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers.egg-info/zip-safe +0 -0
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/setup.cfg +0 -0
- {my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/tests/test_event.py +0 -0
|
@@ -180,6 +180,7 @@ class Bedrock:
|
|
|
180
180
|
except Exception as e:
|
|
181
181
|
self.logger.error(f"Could not get pix map for page {i}")
|
|
182
182
|
continue
|
|
183
|
+
skip_page_zero = False
|
|
183
184
|
header_ocr_result = None
|
|
184
185
|
if len(image_bytes_list) > 1:
|
|
185
186
|
headers_prompt = self._get_prompt(prompt_type=PromptType.transaction_headers.value)
|
|
@@ -190,6 +191,7 @@ class Bedrock:
|
|
|
190
191
|
self.logger.info(f"No ocr result returned when getting headers {PromptType.transaction_headers.value}")
|
|
191
192
|
headers = header_ocr_result.content.get("headers")
|
|
192
193
|
if (len(headers) < 1) or (headers is None):
|
|
194
|
+
skip_page_zero = True
|
|
193
195
|
continue
|
|
194
196
|
else:
|
|
195
197
|
break
|
|
@@ -201,6 +203,8 @@ class Bedrock:
|
|
|
201
203
|
self.logger.info("Got Prompt")
|
|
202
204
|
results = list()
|
|
203
205
|
|
|
206
|
+
if skip_page_zero:
|
|
207
|
+
image_bytes_list = image_bytes_list[1:] #page zero often has account summary info
|
|
204
208
|
results = self._parallel_ocr(image_bytes_list=image_bytes_list, prompt=transactions_prompt)
|
|
205
209
|
|
|
206
210
|
# for i, image_bytes in enumerate(image_bytes_list):
|
|
@@ -51,7 +51,7 @@ class S3:
|
|
|
51
51
|
resource: Optional[boto3.resource] = None,
|
|
52
52
|
) -> None:
|
|
53
53
|
self.client = client if client else self._get_client()
|
|
54
|
-
self.resource = resource if resource else boto3.resource('s3')
|
|
54
|
+
self.resource = resource if resource else boto3.resource('s3', region_name = os.environ["AWS_DEFAULT_REGION"])
|
|
55
55
|
|
|
56
56
|
def _get_client(self) -> boto3.client:
|
|
57
57
|
region_name = os.environ["AWS_DEFAULT_REGION"]
|
|
@@ -77,7 +77,10 @@ class S3:
|
|
|
77
77
|
return self._streaming_body_to_dict(response["Body"])
|
|
78
78
|
|
|
79
79
|
def get_presigned_url(
|
|
80
|
-
self,
|
|
80
|
+
self,
|
|
81
|
+
bucket_name: str,
|
|
82
|
+
file_name: str,
|
|
83
|
+
expires_in: int = 3600,
|
|
81
84
|
):
|
|
82
85
|
return self.client.generate_presigned_url(
|
|
83
86
|
"get_object",
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers/prompts/markdown_system_prompt.txt
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers/prompts/transactions_prompt.txt
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{my_aws_helpers-3.1.0.dev3 → my_aws_helpers-3.2.0}/my_aws_helpers.egg-info/dependency_links.txt
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|