data-science-document-ai 1.60.3__py3-none-any.whl → 1.61.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: data-science-document-ai
3
- Version: 1.60.3
3
+ Version: 1.61.0
4
4
  Summary: "Document AI repo for data science"
5
5
  Author: Naomi Nguyen
6
6
  Author-email: naomi.nguyen@forto.com
@@ -33,8 +33,8 @@ src/prompts/library/commercialInvoice/other/placeholders.json,sha256=zUK2mg9MnHi
33
33
  src/prompts/library/commercialInvoice/other/prompt.txt,sha256=CJapcVrmcvynJUanETDklkzU-0N9hHdhq5wL4MK7OIY,2683
34
34
  src/prompts/library/customsAssessment/other/placeholders.json,sha256=scIV--C9HNWAQbU9zEz3GT_FoAvJqbfuY85YUtt7t-Q,3850
35
35
  src/prompts/library/customsAssessment/other/prompt.txt,sha256=z3FuoHZ588Pz1WBJDW7ISAC3J6n7hPJCcS92CdHDTFw,2494
36
- src/prompts/library/customsInvoice/other/placeholders.json,sha256=Y3nztiKvaqll7Oq2Vo1MjhjqNBG_HyiB_4lYtwCOB0g,12263
37
- src/prompts/library/customsInvoice/other/prompt.txt,sha256=i1ox7ZuWuK69DOllzYIB8sKduFYmxyI-OAtSP_tf6IQ,10297
36
+ src/prompts/library/customsInvoice/other/placeholders.json,sha256=EaYSF6CUjzpjB35H9TYQjXMj1eXdtCDgDpl2YyZsWA0,12739
37
+ src/prompts/library/customsInvoice/other/prompt.txt,sha256=d28rEJhjOSRHxuFe5cLf7ESjJckrqBLjZUXu1JOf5GM,11025
38
38
  src/prompts/library/deliveryOrder/other/placeholders.json,sha256=j-9F4V3yDg4610PPsOwU3oOj_S9vAvAB9Ix155WGIwc,3827
39
39
  src/prompts/library/deliveryOrder/other/prompt.txt,sha256=RD076vq0x0IjoEVQfh-G0u4nxITCpgKZGrwMlR9YAvk,2695
40
40
  src/prompts/library/draftMbl/other/placeholders.json,sha256=Gn8kQ8cMmrzRGLSFH7_8wO1_j2jxhqHd4zeivZP2SjU,4304
@@ -43,8 +43,8 @@ src/prompts/library/finalMbL/other/placeholders.json,sha256=Gn8kQ8cMmrzRGLSFH7_8
43
43
  src/prompts/library/finalMbL/other/prompt.txt,sha256=68IHh7DDAoxQAID2dsRmKPUVQmX9vxxmMcUqnDN8-j0,2458
44
44
  src/prompts/library/packingList/other/placeholders.json,sha256=cGUUvEFoi4Lm0BAiyD29KbNFbUgzO1s7eit_qK3F0ig,4478
45
45
  src/prompts/library/packingList/other/prompt.txt,sha256=6Q9d0KBG6YWmNtzFivvmtQmitaUE2jytfwwc5YwsUgQ,2872
46
- src/prompts/library/partnerInvoice/other/placeholders.json,sha256=S5zWxVM6Ex23drBg6wGKLk_Vd2KJon6mdK1ag3E4RBs,10988
47
- src/prompts/library/partnerInvoice/other/prompt.txt,sha256=Qw27Tj9Kd3exJi1Wd57Ne_sIaFa8j5qSPwI2y1xj55M,8483
46
+ src/prompts/library/partnerInvoice/other/placeholders.json,sha256=6Jgl7R1Jbp5shh5Q7tiH1O5z6r2hyfABBEwB-233tts,11464
47
+ src/prompts/library/partnerInvoice/other/prompt.txt,sha256=3mNLkzzuPkvn6kf1Tm2eJaf-xp9VHfqPRZURD53EOcw,9193
48
48
  src/prompts/library/postprocessing/port_code/placeholders.json,sha256=2TiXf3zSzrglOMPtDOlCntIa5RSvyZQAKG2-IgrCY5A,22
49
49
  src/prompts/library/postprocessing/port_code/prompt_port_code.txt,sha256=--1wunSqEr2ox958lEhjO-0JFBfOLzA3qfKYIzG_Iok,884
50
50
  src/prompts/library/preprocessing/carrier/placeholders.json,sha256=tQeVDtvembhVqvel9vGoy4qcKp1hOvg-bLCgZRdQj0g,192
@@ -55,6 +55,6 @@ src/prompts/prompt_library.py,sha256=VJWHeXN-s501C2GiidIIvQQuZdU6T1R27hE2dKBiI40
55
55
  src/setup.py,sha256=8-vZWjC8Iwa3xxdk3iR4412VCjtNtgzVqkXcFon7UBE,7309
56
56
  src/tms.py,sha256=UXbIo1QE--hIX6NZi5Qyp2R_CP338syrY9pCTPrfgnE,1741
57
57
  src/utils.py,sha256=Ow5_Jals88o8mbZ1BoHfZpHZoCfig_UQb5aalH-mpWE,17278
58
- data_science_document_ai-1.60.3.dist-info/METADATA,sha256=FyamkknqoADm8IVibk-09-6grFI8qfofMblJTHabohE,2152
59
- data_science_document_ai-1.60.3.dist-info/WHEEL,sha256=zp0Cn7JsFoX2ATtOhtaFYIiE2rmFAD4OcMhtUki8W3U,88
60
- data_science_document_ai-1.60.3.dist-info/RECORD,,
58
+ data_science_document_ai-1.61.0.dist-info/METADATA,sha256=dmTTQxd4p6VM9mW8O8AgZkuXoCXjClPdWJPXzFmVuRw,2152
59
+ data_science_document_ai-1.61.0.dist-info/WHEEL,sha256=zp0Cn7JsFoX2ATtOhtaFYIiE2rmFAD4OcMhtUki8W3U,88
60
+ data_science_document_ai-1.61.0.dist-info/RECORD,,
@@ -75,18 +75,26 @@
75
75
  },
76
76
  "lineItemDescription": {"type": "STRING", "nullable": true,
77
77
  "description": "A description of the line item (COGS or Customs line items), which can include details about the service provided."},
78
+ "totalAmountCurrency": {"type": "STRING", "nullable": true,
79
+ "description": "The currency code for the line item's total amount, such as EUR, USD, etc."},
78
80
  "totalAmount": {"type": "STRING", "nullable": true,
79
81
  "description": "The total amount for the line item, which may include the cost of services, and applicable taxes."},
80
- "totalAmountCurrency": {"type": "STRING", "nullable": true,
81
- "description": "The currency code for the total amount, such as EUR, USD, etc."},
82
+ "totalAmountInOriginalCurrency": {
83
+ "type": "STRING",
84
+ "description": "The total amount for the line item in original currency"
85
+ },
86
+ "totalAmountInInvoiceCurrency": {
87
+ "type": "STRING",
88
+ "description": "The total amount for the line item in the currency code the whole invoice's total uses"
89
+ },
82
90
  "totalAmountEuro": {"type": "STRING", "nullable": true,
83
91
  "description": "The total amount converted to Euro, if applicable. You can find it by looking for the term 'Total EUR' or 'Amount in Euro' in the line item."},
84
92
  "quantity": {"type": "STRING", "nullable": true,
85
93
  "description": "The quantity of the item or service provided in the line item."},
86
- "unitPrice": {"type": "STRING", "nullable": true,
87
- "description": "The price per unit of the item or service in the line item. Check the naming in a different languages, such as 'Einzelpreis', 'Unit Price', 'Prezzo unitario', 'Preis pro Einheit', etc.. Refer to 'Prezzo unitario' field in the italian invoice example"},
88
94
  "unitPriceCurrency": {"type": "STRING", "nullable": true,
89
95
  "description": "The currency code for the unit price, such as EUR, USD, etc."},
96
+ "unitPrice": {"type": "STRING", "nullable": true,
97
+ "description": "The price per unit of the item or service in the line item. Check the naming in different languages, such as 'Einzelpreis', 'Unit Price', 'Prezzo unitario', 'Preis pro Einheit', etc. Refer to the 'Prezzo unitario' field in the Italian invoice example."},
90
98
  "vatAmount": {"type": "STRING", "nullable": true,
91
99
  "description": "The VAT amount applied to the line item. This is the tax charged on the totalAmount of the line item."},
92
100
  "vatPercentage": {"type": "STRING", "nullable": true,
@@ -55,11 +55,18 @@ Your role is to accurately extract specific entities from these invoices to supp
55
55
  - lineItem: Details of each COGS and Customs line item on the invoice from each page. Make sure to extract each amount and currency separately.
56
56
  - uniqueId: A unique id which is associated with the lineItem, as each line item can belong to a different shipment. Extract only if it's available in the line item. Either a shipmentId starting with an S and followed by 6 or 8 numeric values or a mblNumber. If shipmentId or mblNumber does not exist, set it to containerNumber.
57
57
  - lineItemDescription: The name or description of the item. Usually, it will be a one line sentence.
58
- - unitPrice: Even if the quantity is not mentioned, you can still extract the unit price. Check the naming of the columns in a different languages, it can be "Unit Price", "Prezzo unitario", "Prix Unitaire", "Unitario", etc. Refer to "Prezzo unitario" field in the italian invoice example.
59
- - totalAmount: The total amount for the item. It can be in different currencies, so ensure to capture the currency as well for the totalAmountCurrency.
58
+ - totalAmountCurrency: The original/native currency code for the line item's total amount, as a 3-letter code such as USD or EUR.
59
+ - totalAmount: The total amount for the item. It can be in different currencies, so ensure to capture the amount according to the totalAmountCurrency.
60
+ - totalAmountInOriginalCurrency: line item amount in its original/native currency
61
+ - totalAmountInInvoiceCurrency: line item amount converted to the invoice's main currency (the currency used for grandTotal)
60
62
  - totalAmountEuro: A few line items contain a total amount in Euro. You can find it by looking for the term "Total EUR" or "Amount in Euro" in the line item, but it's always in the EURO / € currency. Sometimes, it can be the same as totalAmount if the line item is already in Euro.
61
- - quantity: The quantity of the item or service provided in the line item. Pay attention to 2 x 40HC or 2x40HC. It means, quantity is 2 and 40HC is containerSize but not 240.
62
- - containerNumber: Container Number always starts with 4 letters and is followed by 7 digits (e.g., ABCD1234567). Do not get confused between 0 vs O in the 7 digits of container number.
63
+ - quantity: The quantity of the item or service provided in the line item. Pay attention to 2 x 40HC or 2x40HC. It means the quantity is 2 and 40HC is the containerSize.
64
+ - unitPriceCurrency: The original/native currency code for the unit price, as a 3-letter code.
65
+ - unitPrice: Even if the quantity is not mentioned, you can still extract the unit price. Check the naming of the columns in different languages; it can be "Unit Price", "Prezzo unitario", "Prix Unitaire", "Unitario", etc. Refer to the "Prezzo unitario" field in the Italian invoice example.
66
+ - vatAmount: The VAT amount applied to the line item. This is the tax charged on the totalAmount of the line item
67
+ - vatPercentage: The percentage rate of VAT applied to the totalAmount of the line item. This is used to calculate the vatAmount
68
+ - containerNumber: Container Number always starts with 4 letters and is followed by 7 digits (e.g., ABCD1234567, XALU 8593678).
69
+ - containerSize: The size of the container associated with the containerNumber, such as 20ft, 40ft, 40HC, 20DC etc.
63
70
 
64
71
  - hblNumber and mblNumber:
65
72
  - The Master Bill of Lading number. Commonly known as "Bill of Lading Number", "BILL OF LADING NO.", "BL Number", "BL No.", "B/L No.", "BL-Nr.", "B/L", or "HBL No.".
@@ -73,18 +73,26 @@
73
73
  },
74
74
  "lineItemDescription": {"type": "STRING", "nullable": true,
75
75
  "description": "A description of the line item (COGS or Customs line items), which can include details about the service provided."},
76
+ "totalAmountCurrency": {"type": "STRING", "nullable": true,
77
+ "description": "The currency code for the line item's total amount, such as EUR, USD, etc."},
76
78
  "totalAmount": {"type": "STRING", "nullable": true,
77
79
  "description": "The total amount for the line item, which may include the cost of services, and applicable taxes."},
78
- "totalAmountCurrency": {"type": "STRING", "nullable": true,
79
- "description": "The currency code for the total amount, such as EUR, USD, etc."},
80
+ "totalAmountInOriginalCurrency": {
81
+ "type": "STRING",
82
+ "description": "The total amount for the line item in original currency"
83
+ },
84
+ "totalAmountInInvoiceCurrency": {
85
+ "type": "STRING",
86
+ "description": "The total amount for the line item in the currency code the whole invoice's total uses"
87
+ },
80
88
  "totalAmountEuro": {"type": "STRING", "nullable": true,
81
89
  "description": "The total amount converted to Euro, if applicable. You can find it by looking for the term 'Total EUR' or 'Amount in Euro' in the line item."},
82
90
  "quantity": {"type": "STRING", "nullable": true,
83
91
  "description": "The quantity of the item or service provided in the line item."},
84
- "unitPrice": {"type": "STRING", "nullable": true,
85
- "description": "The price per unit of the item or service in the line item. Check the naming in a different languages, such as 'Einzelpreis', 'Unit Price', 'Prezzo unitario', 'Preis pro Einheit', etc.. Refer to 'Prezzo unitario' field in the italian invoice example"},
86
92
  "unitPriceCurrency": {"type": "STRING", "nullable": true,
87
93
  "description": "The currency code for the unit price, such as EUR, USD, etc."},
94
+ "unitPrice": {"type": "STRING", "nullable": true,
95
+ "description": "The price per unit of the item or service in the line item. Check the naming in different languages, such as 'Einzelpreis', 'Unit Price', 'Prezzo unitario', 'Preis pro Einheit', etc. Refer to the 'Prezzo unitario' field in the Italian invoice example."},
88
96
  "vatAmount": {"type": "STRING", "nullable": true,
89
97
  "description": "The VAT amount applied to the line item. This is the tax charged on the totalAmount of the line item."},
90
98
  "vatPercentage": {"type": "STRING", "nullable": true,
@@ -53,11 +53,18 @@ Your role is to accurately extract specific entities from these invoices to supp
53
53
  - lineItem: Details of each COGS and Customs line item on the invoice from each page. Make sure to extract each amount and currency separately.
54
54
  - uniqueId: A unique id which is associated with the lineItem, as each line item can belong to a different shipment. Extract only if it's available in the line item. Either a shipmentId starting with an S and followed by 6 or 8 numeric values or a mblNumber. If shipmentId or mblNumber does not exist, set it to containerNumber.
55
55
  - lineItemDescription: The name or description of the item. Usually, it will be a one line sentence.
56
- - unitPrice: Even if the quantity is not mentioned, you can still extract the unit price. Check the naming of the columns in a different languages, it can be "Unit Price", "Prezzo unitario", "Prix Unitaire", "Unitario", etc. Refer to "Prezzo unitario" field in the italian invoice example.
57
- - totalAmount: The total amount for the item. It can be in different currencies, so ensure to capture the currency as well for the totalAmountCurrency.
56
+ - totalAmountCurrency: The original/native currency code for the line item's total amount, as a 3-letter code such as USD or EUR.
57
+ - totalAmount: The total amount for the item. It can be in different currencies, so ensure to capture the amount according to the totalAmountCurrency.
58
+ - totalAmountInOriginalCurrency: line item amount in its original/native currency
59
+ - totalAmountInInvoiceCurrency: line item amount converted to the invoice's main currency (the currency used for grandTotal)
58
60
  - totalAmountEuro: A few line items contain a total amount in Euro. You can find it by looking for the term "Total EUR" or "Amount in Euro" in the line item, but it's always in the EURO / € currency. Sometimes, it can be the same as totalAmount if the line item is already in Euro.
59
- - quantity: The quantity of the item or service provided in the line item. Pay attention to 2 x 40HC or 2x40HC. It means, quantity is 2 and 40HC is containerSize but not 240.
60
- - containerNumber: Container Number always starts with 4 letters and is followed by 7 digits (e.g., ABCD1234567, XALU 8593678). Do not get confused between 0 vs O in the 7 digits of container number.
61
+ - quantity: The quantity of the item or service provided in the line item. Pay attention to 2 x 40HC or 2x40HC. It means the quantity is 2 and 40HC is the containerSize.
62
+ - unitPriceCurrency: The original/native currency code for the unit price, as a 3-letter code.
63
+ - unitPrice: Even if the quantity is not mentioned, you can still extract the unit price. Check the naming of the columns in different languages; it can be "Unit Price", "Prezzo unitario", "Prix Unitaire", "Unitario", etc. Refer to the "Prezzo unitario" field in the Italian invoice example.
64
+ - vatAmount: The VAT amount applied to the line item. This is the tax charged on the totalAmount of the line item
65
+ - vatPercentage: The percentage rate of VAT applied to the totalAmount of the line item. This is used to calculate the vatAmount
66
+ - containerNumber: Container Number always starts with 4 letters and is followed by 7 digits (e.g., ABCD1234567, XALU 8593678).
67
+ - containerSize: The size of the container associated with the containerNumber, such as 20ft, 40ft, 40HC, 20DC etc.
61
68
 
62
69
  - hblNumber and mblNumber:
63
70
  - The Master Bill of Lading number. Commonly known as "Bill of Lading Number", "BILL OF LADING NO.", "BL Number", "BL No.", "B/L No.", "BL-Nr.", "B/L", or "HBL No.".