data-science-document-ai 1.42.4__tar.gz → 1.42.5__tar.gz

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (56)
  1. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/PKG-INFO +1 -1
  2. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/pyproject.toml +1 -1
  3. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/postprocessing/common.py +7 -1
  4. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/constants.py +0 -0
  5. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/constants_sandbox.py +0 -0
  6. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/docai.py +0 -0
  7. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/docai_processor_config.yaml +0 -0
  8. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/excel_processing.py +0 -0
  9. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/io.py +0 -0
  10. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/llm.py +0 -0
  11. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/log_setup.py +0 -0
  12. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/pdf_processing.py +0 -0
  13. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/postprocessing/postprocess_booking_confirmation.py +0 -0
  14. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/postprocessing/postprocess_commercial_invoice.py +0 -0
  15. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/postprocessing/postprocess_partner_invoice.py +0 -0
  16. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/bookingConfirmation/evergreen/placeholders.json +0 -0
  17. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/bookingConfirmation/evergreen/prompt.txt +0 -0
  18. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/bookingConfirmation/hapag-lloyd/placeholders.json +0 -0
  19. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/bookingConfirmation/hapag-lloyd/prompt.txt +0 -0
  20. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/bookingConfirmation/maersk/placeholders.json +0 -0
  21. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/bookingConfirmation/maersk/prompt.txt +0 -0
  22. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/bookingConfirmation/msc/placeholders.json +0 -0
  23. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/bookingConfirmation/msc/prompt.txt +0 -0
  24. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/bookingConfirmation/oocl/placeholders.json +0 -0
  25. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/bookingConfirmation/oocl/prompt.txt +0 -0
  26. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/bookingConfirmation/other/placeholders.json +0 -0
  27. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/bookingConfirmation/other/prompt.txt +0 -0
  28. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/bookingConfirmation/yangming/placeholders.json +0 -0
  29. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/bookingConfirmation/yangming/prompt.txt +0 -0
  30. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/bundeskasse/other/placeholders.json +0 -0
  31. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/bundeskasse/other/prompt.txt +0 -0
  32. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/commercialInvoice/other/prompt.txt +0 -0
  33. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/customsAssessment/other/prompt.txt +0 -0
  34. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/customsInvoice/other/placeholders.json +0 -0
  35. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/customsInvoice/other/prompt.txt +0 -0
  36. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/deliveryOrder/other/placeholders.json +0 -0
  37. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/deliveryOrder/other/prompt.txt +0 -0
  38. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/draftMbl/hapag-lloyd/prompt.txt +0 -0
  39. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/draftMbl/maersk/prompt.txt +0 -0
  40. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/draftMbl/other/placeholders.json +0 -0
  41. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/draftMbl/other/prompt.txt +0 -0
  42. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/finalMbL/hapag-lloyd/prompt.txt +0 -0
  43. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/finalMbL/maersk/prompt.txt +0 -0
  44. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/finalMbL/other/prompt.txt +0 -0
  45. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/packingList/other/prompt.txt +0 -0
  46. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/partnerInvoice/other/placeholders.json +0 -0
  47. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/partnerInvoice/other/prompt.txt +0 -0
  48. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/postprocessing/port_code/placeholders.json +0 -0
  49. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/postprocessing/port_code/prompt_port_code.txt +0 -0
  50. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/preprocessing/carrier/placeholders.json +0 -0
  51. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/preprocessing/carrier/prompt.txt +0 -0
  52. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/library/shippingInstruction/other/prompt.txt +0 -0
  53. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/prompts/prompt_library.py +0 -0
  54. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/setup.py +0 -0
  55. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/tms.py +0 -0
  56. {data_science_document_ai-1.42.4 → data_science_document_ai-1.42.5}/src/utils.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: data-science-document-ai
3
- Version: 1.42.4
3
+ Version: 1.42.5
4
4
  Summary: "Document AI repo for data science"
5
5
  Author: Naomi Nguyen
6
6
  Author-email: naomi.nguyen@forto.com
@@ -1,6 +1,6 @@
1
1
  [tool.poetry]
2
2
  name = "data-science-document-ai"
3
- version = "1.42.4"
3
+ version = "1.42.5"
4
4
  description = "\"Document AI repo for data science\""
5
5
  authors = ["Naomi Nguyen <naomi.nguyen@forto.com>", "Kumar Rajendrababu <kumar.rajendrababu@forto.com>", "Igor Tonko <igor.tonko@forto.com>", "Osman Demirel <osman.demirel@forto.com>"]
6
6
  packages = [
@@ -136,7 +136,7 @@ def extract_number(data_field_value):
136
136
  """
137
137
  formatted_value = ""
138
138
  for c in data_field_value:
139
- if c.isnumeric() or c in [",", "."]:
139
+ if c.isnumeric() or c in [",", ".", "-"]:
140
140
  formatted_value += c
141
141
 
142
142
  # First and last characters should not be [",", "."]
@@ -539,6 +539,9 @@ def decimal_convertor(value, quantity=False):
539
539
  # Remove spaces
540
540
  value = value.strip().replace(" ", "")
541
541
 
542
+ # Check "-" and remove it for processing
543
+ is_negative, value = (True, value[1:]) if value.startswith("-") else (False, value)
544
+
542
545
  if not quantity:
543
546
  # Convert comma to dot for decimal point (e.g., 4.123,45 -> 4123.45)
544
547
  if re.match(r"^\d{1,3}(\.\d{3})*,\d{1,2}$", value):
@@ -573,6 +576,9 @@ def decimal_convertor(value, quantity=False):
573
576
  elif re.match(r"^\d+\.\d{3,}$", value):
574
577
  value = value[: value.index(".") + 3]
575
578
 
579
+ # Re-add negative sign if applicable
580
+ value = "-" + value if is_negative else value
581
+
576
582
  return value
577
583
 
578
584