data-science-document-ai 1.40.0__tar.gz → 1.40.2__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/PKG-INFO +1 -1
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/pyproject.toml +1 -1
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/pdf_processing.py +0 -2
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/postprocessing/postprocess_partner_invoice.py +0 -4
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/constants.py +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/constants_sandbox.py +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/docai.py +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/docai_processor_config.yaml +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/excel_processing.py +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/io.py +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/llm.py +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/log_setup.py +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/postprocessing/common.py +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/postprocessing/postprocess_booking_confirmation.py +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/postprocessing/postprocess_commercial_invoice.py +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/evergreen/placeholders.json +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/evergreen/prompt.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/hapag-lloyd/placeholders.json +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/hapag-lloyd/prompt.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/maersk/placeholders.json +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/maersk/prompt.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/msc/placeholders.json +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/msc/prompt.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/oocl/placeholders.json +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/oocl/prompt.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/other/placeholders.json +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/other/prompt.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/yangming/placeholders.json +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/yangming/prompt.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bundeskasse/other/placeholders.json +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bundeskasse/other/prompt.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/commercialInvoice/other/prompt.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/customsAssessment/other/placeholders.json +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/customsAssessment/other/prompt.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/customsInvoice/other/placeholders.json +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/customsInvoice/other/prompt.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/deliveryOrder/other/placeholders.json +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/deliveryOrder/other/prompt.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/draftMbl/hapag-lloyd/prompt.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/draftMbl/maersk/prompt.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/draftMbl/other/placeholders.json +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/draftMbl/other/prompt.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/finalMbL/hapag-lloyd/prompt.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/finalMbL/maersk/prompt.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/finalMbL/other/placeholders.json +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/finalMbL/other/prompt.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/packingList/other/prompt.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/partnerInvoice/other/placeholders.json +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/partnerInvoice/other/prompt.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/postprocessing/port_code/placeholders.json +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/postprocessing/port_code/prompt_port_code.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/preprocessing/carrier/placeholders.json +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/preprocessing/carrier/prompt.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/shippingInstruction/other/prompt.txt +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/prompt_library.py +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/setup.py +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/tms.py +0 -0
- {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/utils.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
[tool.poetry]
|
|
2
2
|
name = "data-science-document-ai"
|
|
3
|
-
version = "1.40.0"
|
|
3
|
+
version = "1.40.2"
|
|
4
4
|
description = "\"Document AI repo for data science\""
|
|
5
5
|
authors = ["Naomi Nguyen <naomi.nguyen@forto.com>", "Kumar Rajendrababu <kumar.rajendrababu@forto.com>", "Igor Tonko <igor.tonko@forto.com>", "Osman Demirel <osman.demirel@forto.com>"]
|
|
6
6
|
packages = [
|
|
@@ -366,7 +366,6 @@ async def data_extraction_manual_flow(
|
|
|
366
366
|
meta (DocumentMeta): Metadata associated with the document.
|
|
367
367
|
processor_client (DocumentProcessorClient): Client for the Document AI processor.
|
|
368
368
|
schema_client (DocumentSchemaClient): Client for the Document AI schema.
|
|
369
|
-
embed_manager (EmbeddingsManager): Manager for embeddings.
|
|
370
369
|
|
|
371
370
|
Returns:
|
|
372
371
|
dict: A dictionary containing the processed document information.
|
|
@@ -406,7 +405,6 @@ async def data_extraction_manual_flow(
|
|
|
406
405
|
params=params,
|
|
407
406
|
input_doc_type=meta.documentTypeCode,
|
|
408
407
|
file_content=file_content,
|
|
409
|
-
schema_client=schema_client,
|
|
410
408
|
mime_type=mime_type,
|
|
411
409
|
)
|
|
412
410
|
|
|
@@ -301,10 +301,6 @@ def associate_forto_item_code(input_string, params):
|
|
|
301
301
|
if forto_item_code is None:
|
|
302
302
|
# 2. Fallback to embedding function if no good fuzzy match
|
|
303
303
|
forto_item_code = get_tms_mappings(input_string, "line_items")
|
|
304
|
-
# embeddings_dict = embed_manager.embeddings_dict
|
|
305
|
-
# forto_item_code = embed_manager._find_most_similar_option(
|
|
306
|
-
# input_string, *embeddings_dict["item_codes_label"]
|
|
307
|
-
# )
|
|
308
304
|
|
|
309
305
|
result = {"documentValue": input_string, "formattedValue": forto_item_code}
|
|
310
306
|
return result
|
|
File without changes
|
{data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/constants_sandbox.py
RENAMED
|
File without changes
|
|
File without changes
|
{data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/docai_processor_config.yaml
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/postprocessing/common.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/prompt_library.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|