data-science-document-ai 1.40.0__tar.gz → 1.40.2__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (58)
  1. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/PKG-INFO +1 -1
  2. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/pyproject.toml +1 -1
  3. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/pdf_processing.py +0 -2
  4. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/postprocessing/postprocess_partner_invoice.py +0 -4
  5. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/constants.py +0 -0
  6. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/constants_sandbox.py +0 -0
  7. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/docai.py +0 -0
  8. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/docai_processor_config.yaml +0 -0
  9. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/excel_processing.py +0 -0
  10. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/io.py +0 -0
  11. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/llm.py +0 -0
  12. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/log_setup.py +0 -0
  13. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/postprocessing/common.py +0 -0
  14. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/postprocessing/postprocess_booking_confirmation.py +0 -0
  15. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/postprocessing/postprocess_commercial_invoice.py +0 -0
  16. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/evergreen/placeholders.json +0 -0
  17. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/evergreen/prompt.txt +0 -0
  18. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/hapag-lloyd/placeholders.json +0 -0
  19. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/hapag-lloyd/prompt.txt +0 -0
  20. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/maersk/placeholders.json +0 -0
  21. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/maersk/prompt.txt +0 -0
  22. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/msc/placeholders.json +0 -0
  23. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/msc/prompt.txt +0 -0
  24. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/oocl/placeholders.json +0 -0
  25. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/oocl/prompt.txt +0 -0
  26. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/other/placeholders.json +0 -0
  27. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/other/prompt.txt +0 -0
  28. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/yangming/placeholders.json +0 -0
  29. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bookingConfirmation/yangming/prompt.txt +0 -0
  30. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bundeskasse/other/placeholders.json +0 -0
  31. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/bundeskasse/other/prompt.txt +0 -0
  32. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/commercialInvoice/other/prompt.txt +0 -0
  33. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/customsAssessment/other/placeholders.json +0 -0
  34. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/customsAssessment/other/prompt.txt +0 -0
  35. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/customsInvoice/other/placeholders.json +0 -0
  36. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/customsInvoice/other/prompt.txt +0 -0
  37. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/deliveryOrder/other/placeholders.json +0 -0
  38. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/deliveryOrder/other/prompt.txt +0 -0
  39. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/draftMbl/hapag-lloyd/prompt.txt +0 -0
  40. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/draftMbl/maersk/prompt.txt +0 -0
  41. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/draftMbl/other/placeholders.json +0 -0
  42. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/draftMbl/other/prompt.txt +0 -0
  43. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/finalMbL/hapag-lloyd/prompt.txt +0 -0
  44. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/finalMbL/maersk/prompt.txt +0 -0
  45. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/finalMbL/other/placeholders.json +0 -0
  46. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/finalMbL/other/prompt.txt +0 -0
  47. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/packingList/other/prompt.txt +0 -0
  48. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/partnerInvoice/other/placeholders.json +0 -0
  49. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/partnerInvoice/other/prompt.txt +0 -0
  50. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/postprocessing/port_code/placeholders.json +0 -0
  51. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/postprocessing/port_code/prompt_port_code.txt +0 -0
  52. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/preprocessing/carrier/placeholders.json +0 -0
  53. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/preprocessing/carrier/prompt.txt +0 -0
  54. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/library/shippingInstruction/other/prompt.txt +0 -0
  55. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/prompts/prompt_library.py +0 -0
  56. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/setup.py +0 -0
  57. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/tms.py +0 -0
  58. {data_science_document_ai-1.40.0 → data_science_document_ai-1.40.2}/src/utils.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: data-science-document-ai
3
- Version: 1.40.0
3
+ Version: 1.40.2
4
4
  Summary: "Document AI repo for data science"
5
5
  Author: Naomi Nguyen
6
6
  Author-email: naomi.nguyen@forto.com
@@ -1,6 +1,6 @@
1
1
  [tool.poetry]
2
2
  name = "data-science-document-ai"
3
- version = "1.40.0"
3
+ version = "1.40.2"
4
4
  description = "\"Document AI repo for data science\""
5
5
  authors = ["Naomi Nguyen <naomi.nguyen@forto.com>", "Kumar Rajendrababu <kumar.rajendrababu@forto.com>", "Igor Tonko <igor.tonko@forto.com>", "Osman Demirel <osman.demirel@forto.com>"]
6
6
  packages = [
@@ -366,7 +366,6 @@ async def data_extraction_manual_flow(
366
366
  meta (DocumentMeta): Metadata associated with the document.
367
367
  processor_client (DocumentProcessorClient): Client for the Document AI processor.
368
368
  schema_client (DocumentSchemaClient): Client for the Document AI schema.
369
- embed_manager (EmbeddingsManager): Manager for embeddings.
370
369
 
371
370
  Returns:
372
371
  dict: A dictionary containing the processed document information.
@@ -406,7 +405,6 @@ async def data_extraction_manual_flow(
406
405
  params=params,
407
406
  input_doc_type=meta.documentTypeCode,
408
407
  file_content=file_content,
409
- schema_client=schema_client,
410
408
  mime_type=mime_type,
411
409
  )
412
410
 
@@ -301,10 +301,6 @@ def associate_forto_item_code(input_string, params):
301
301
  if forto_item_code is None:
302
302
  # 2. Fallback to embedding function if no good fuzzy match
303
303
  forto_item_code = get_tms_mappings(input_string, "line_items")
304
- # embeddings_dict = embed_manager.embeddings_dict
305
- # forto_item_code = embed_manager._find_most_similar_option(
306
- # input_string, *embeddings_dict["item_codes_label"]
307
- # )
308
304
 
309
305
  result = {"documentValue": input_string, "formattedValue": forto_item_code}
310
306
  return result